view fastq_paired_end_splitter.py @ 2:eed0fe64987c draft

planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tool_collections/galaxy_sequence_utils/fastq_paired_end_splitter commit de7140295cce07e1bc1697e51dab4271c8d7a8a6
author devteam
date Fri, 18 Dec 2015 19:30:11 -0500
parents 5943afe0f24d
children
line wrap: on
line source

#Dan Blankenberg
import sys, os, shutil
from galaxy_utils.sequence.fastq import fastqReader, fastqWriter, fastqSplitter

def main():
    #Read command line arguments
    input_filename = sys.argv[1]
    input_type = sys.argv[2] or 'sanger'
    output1_filename = sys.argv[3]
    output2_filename = sys.argv[4]
    
    splitter = fastqSplitter()
    out1 = fastqWriter( open( output1_filename, 'wb' ), format = input_type )
    out2 = fastqWriter( open( output2_filename, 'wb' ), format = input_type )
    
    i = None
    skip_count = 0
    for i, fastq_read in enumerate( fastqReader( open( input_filename, 'rb' ), format = input_type ) ):
        read1, read2 = splitter.split( fastq_read )
        if read1 and read2:
            out1.write( read1 )
            out2.write( read2 )
        else:
            skip_count += 1
    out1.close()
    out2.close()
    if i is None:
        print "Your file contains no valid FASTQ reads."
    else:
        print 'Split %s of %s reads (%.2f%%).' % ( i - skip_count + 1, i + 1, float( i - skip_count + 1 ) / float( i + 1 ) * 100.0 )

if __name__ == "__main__":
    main()