changeset 2:aa7092c7a3c8 draft

Uploaded
author drosofff
date Mon, 23 Jun 2014 03:57:00 -0400
parents 06e465694fd1
children 27b40e4ccee2
files sRbowtieParser.py
diffstat 1 files changed, 35 insertions(+), 0 deletions(-) [+]
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/sRbowtieParser.py	Mon Jun 23 03:57:00 2014 -0400
@@ -0,0 +1,35 @@
+#!/usr/bin/python
+# python parser module to analyse sRbowtie alignments
+# version 0.9
+# Usage sRbowtieParser.py  <1:index source> <2:extraction directive> <3:outputL> <4:polarity> <5:6:7 filePath:FileExt:FileLabel> <.. ad  lib>
+
+import sys
+from smRtools import *
+
+IndexSource = sys.argv[1]
+ExtractionDirective = sys.argv[2]
+if ExtractionDirective == "--do_not_extract_index":
+  genomeRefFormat = "fastaSource"
+elif  ExtractionDirective == "--extract_index":
+  genomeRefFormat = "bowtieIndex"
+Output = sys.argv[3]
+Polarity = sys.argv[4] # maybe "both", "forward", "reverse"
+Triplets = [sys.argv[5:][i:i+3] for i in xrange(0, len(sys.argv[5:]), 3)]
+MasterListOfGenomes = {}
+
+for [filePath, FileExt, FileLabel] in Triplets:
+  MasterListOfGenomes[FileLabel] = HandleSmRNAwindows (filePath, FileExt, IndexSource, genomeRefFormat) 
+
+header = ["gene"]
+for [filePath, FileExt, FileLabel] in Triplets:
+  header.append(FileLabel)
+
+F = open (sys.argv[3], "w")
+print >> F, "\t".join(header)
+for item in sorted (MasterListOfGenomes[header[1]].instanceDict.keys() ):
+  line=[item]
+  for sample in header[1:]:
+    count = str (MasterListOfGenomes[sample].instanceDict[item].readcount(polarity=Polarity))
+    line.append(count)
+  print >> F,  "\t".join(line )
+F.close()