comparison Bed.py @ 2:4ced8f116509 draft

planemo upload for repository https://github.com/goeckslab/hub-archive-creator commit 23b12dd763c0235674988ebdf6a258afd1ad629a-dirty
author yating-l
date Tue, 22 Nov 2016 17:13:18 -0500
parents 3e0c61b52a06
children
comparison
equal deleted inserted replaced
1:42337785f87b 2:4ced8f116509
24 self.name_bed_generic = self.data_bed_generic["name"] 24 self.name_bed_generic = self.data_bed_generic["name"]
25 self.priority = self.data_bed_generic["order_index"] 25 self.priority = self.data_bed_generic["order_index"]
26 self.track_color = self.data_bed_generic["track_color"] 26 self.track_color = self.data_bed_generic["track_color"]
27 # TODO: Think about how to avoid repetition of the group_name everywhere 27 # TODO: Think about how to avoid repetition of the group_name everywhere
28 self.group_name = self.data_bed_generic["group_name"] 28 self.group_name = self.data_bed_generic["group_name"]
29 29
30 modified = self._checkAndFixBed() 30
31 # Sort processing 31 # Sort processing
32 subtools.sort(self.inputBedGeneric, self.sortedBedFile.name) 32 subtools.sort(self.inputBedGeneric, self.sortedBedFile.name)
33
34
35
36 33
37 # bedToBigBed processing 34 # bedToBigBed processing
38 # TODO: Change the name of the bb, to tool + genome + possible adding if multiple + .bb 35 # TODO: Change the name of the bb, to tool + genome + possible adding if multiple + .bb
39 trackName = "".join( ( self.name_bed_generic, ".bb") ) 36 trackName = "".join( ( self.name_bed_generic, ".bb") )
40 37
41 myBigBedFilePath = os.path.join(self.myTrackFolderPath, trackName) 38 myBigBedFilePath = os.path.join(self.myTrackFolderPath, trackName)
42 with open(myBigBedFilePath, 'w') as self.bigBedFile: 39 with open(myBigBedFilePath, 'w') as self.bigBedFile:
43 subtools.bedToBigBed(self.sortedBedFile.name, 40 subtools.bedToBigBed(self.sortedBedFile.name,
44 self.chromSizesFile.name, 41 self.chromSizesFile.name,
45 self.bigBedFile.name, 42 self.bigBedFile.name)
46 typeOption='bed12+1', 43
47 tab=True)
48
49 # Create the Track Object 44 # Create the Track Object
50 self.createTrack(file_path=trackName, 45 self.createTrack(file_path=trackName,
51 track_name=trackName, 46 track_name=trackName,
52 long_label=self.name_bed_generic, track_type='bigBed', visibility='dense', 47 long_label=self.name_bed_generic, track_type='bigBed', visibility='dense',
53 priority=self.priority, 48 priority=self.priority,
54 track_file=myBigBedFilePath, 49 track_file=myBigBedFilePath,
55 track_color=self.track_color, 50 track_color=self.track_color,
56 group_name=self.group_name, 51 group_name=self.group_name)
57 )
58 52
59 # dataURL = "tracks/%s" % trackName 53 # dataURL = "tracks/%s" % trackName
60 # 54 #
61 # trackDb = TrackDb( 55 # trackDb = TrackDb(
62 # trackName=trackName, 56 # trackName=trackName,
74 # trackFile=myBigBedFilePath, 68 # trackFile=myBigBedFilePath,
75 # trackDb=trackDb, 69 # trackDb=trackDb,
76 # ) 70 # )
77 71
78 print("- Bed %s created" % self.name_bed_generic) 72 print("- Bed %s created" % self.name_bed_generic)
79 if (len(modified) != 0):
80 print("The lines that were removed: " + str(len(modified)))
81 #print("- %s created in %s" % (trackName, myBigBedFilePath)) 73 #print("- %s created in %s" % (trackName, myBigBedFilePath))
82
83 # TODO: bed verifier, check if there are invalid strands: "."
84 def _checkAndFixBed(self):
85 """
86 Call _checkAndFixBed, check the integrity of bed file,
87 if the strand is not "+" or "-" truncate that line and report to users
88 create column and move the score column to
89 """
90 # Store the lines that have been removed
91 removedLines = []
92 # Remove the lines with invalid strand
93 temp_bed = tempfile.NamedTemporaryFile(bufsize=0, suffix=".bed", delete=False)
94 with open(temp_bed.name, 'w') as tmp:
95 with open(self.inputBedGeneric, 'r') as f:
96 lines = f.readlines()
97 for line in lines:
98 fields = line.split()
99 strand = fields[5]
100 score = fields[4]
101 fields[4] = '1000'
102 fields.append(score)
103 if (strand == '+' or strand == '-'):
104 tmp.write('\t'.join(map(str, fields)))
105 tmp.write("\n")
106 else:
107 removedLines.append(line)
108 self.inputBedGeneric = temp_bed.name
109
110 return removedLines