diff merge_pcr_duplicates.py @ 14:570a7de9f151 draft

read from bam; fix header issue
author rnateam
date Mon, 30 Nov 2015 07:53:36 -0500
parents 17ef0e0dae68
children 0b9aab6aaebf
line wrap: on
line diff
--- a/merge_pcr_duplicates.py	Fri Nov 27 04:33:02 2015 -0500
+++ b/merge_pcr_duplicates.py	Mon Nov 30 07:53:36 2015 -0500
@@ -112,6 +112,9 @@
     sep="\t",
     names=["chrom", "start", "stop", "read_id", "score", "strand"])
 
+# keep only the part of the read id before the first space character
+alns["read_id"] = alns["read_id"].str.split(' ').str.get(0)
+
 # combine barcode library and alignments
 bcalib = pd.merge(
     bcs, alns,