graphclust_preprocessing: splitSHAPE.py comparison

comparison splitSHAPE.py @ 6:e31c659be8bc draft

planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust commit 6767a5ffb02052c844e9d862c79912f998f39d8e

author	rnateam
date	Mon, 20 Nov 2017 05:01:21 -0500
parents	f4ad5dceb619
children

comparison

Legend: equal | deleted | inserted | replaced

-:f4ad5dceb619
+:e31c659be8bc
 import os
 import re
 import sys
 shape_file = sys.argv[1]
-win_size = int(sys.argv[2])
 pattern = re.compile("^>.*$")
 toWrite = ""
 count_for_id = 1
 seq_string = []
 orig_id = []
 name_file = "FASTA/data.names"
 array_all_chunks = []
 with open(name_file, 'r') as f:
-content = f.read()
+for line in f:
-lines = content.split('\n')[:-1]
+if len(line.strip()) == 0:
-for line in lines:
+continue
 seq_id.append(int(line.split()[0]))
 seq_string.append(line.split()[1])
 orig_id_srt = line.split()[3]
 orig_id_srt = orig_id_srt.rsplit('_',1)[0]
 orig_id.append(orig_id_srt)
 with open(shape_file, 'r') as shape:
 content = shape.read()
 lines = content.split('\n')
 for line in lines:
 if pattern.match(line):
-line = line.replace('>','').strip()
+line = line.replace('>','').split()[0]
 react_arr=[]
 react_dict[line] = react_arr
 continue
 else:
 react_arr.append(line)
 toWrite = ""
 chunks = []
 for i in range(len(orig_id)):
 if not orig_id[i] in react_dict:
-raise RuntimeError('Error key {} not found'.format(orig_id))
+raise RuntimeError('Error key {} {} not found'.format(i, orig_id[i]))
 react_val = react_dict[orig_id[i]]
 toWrite += '>' + str(seq_id[i]) + " " + seq_string[i] + "\n"
 chunks = re.findall(r'\d+', seq_string[i])

Mercurial > repos > rnateam > graphclust_preprocessing

comparison splitSHAPE.py @ 6:e31c659be8bc draft