changeset 0:b4cf778be846 draft

planemo upload commit 23ef4b1699065b4f6200c58328bfecfb33dd7fd1-dirty
author bebatut
date Tue, 26 Apr 2016 08:17:42 -0400
parents
children d7747e6f329f
files convert_extract_sequence_file.py convert_extract_sequence_file.xml test-data/extracted_quality_illumina_1_3_fastq_output.qual test-data/extracted_sequences_illumina_1_3_fastq_output.fasta test-data/information_lenght_fasta_output.txt test-data/input_sequence_file.fasta test-data/input_sequence_file.fastq test-data/report_illumina_1_3_fastq_output.txt test-data/report_length_fasta_output.txt
diffstat 9 files changed, 1374 insertions(+), 0 deletions(-) [+]
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/convert_extract_sequence_file.py	Tue Apr 26 08:17:42 2016 -0400
@@ -0,0 +1,414 @@
+#!/usr/bin/python
+# -*- coding: utf-8 -*-
+
+import sys
+import os
+import argparse
+import copy
+import operator
+
+# File offset from which next_fasta_record() resumes reading on its next
+# call; None until a first FASTA record has been requested.
+FASTA_FILE_LAST_POS = None
+
+#################
+# Parse methods #
+#################
+def text_end_of_file(row):
+    """Tell whether `row`, as returned by readline(), marks the end of file.
+
+    readline() gives back an empty string only once the file is exhausted; a
+    blank line still carries its newline character.
+    """
+    return row == ''
+
+def get_new_line(input_file, generate_error = True):
+    """Read the next line of `input_file` without its line terminator.
+
+    Only a trailing newline (and carriage return, if any) is removed, so the
+    last line of a file that does not end with a newline is returned intact
+    instead of losing its final character.
+
+    Args:
+        input_file: open text file object to read from.
+        generate_error: when True, reaching the end of file raises an error;
+            when False, None is returned instead.
+
+    Returns:
+        The line content, or None at end of file when `generate_error` is
+        False.
+
+    Raises:
+        ValueError: at end of file when `generate_error` is True.
+    """
+    row = input_file.readline()
+    if not text_end_of_file(row):
+        return row.rstrip('\r\n')
+    if generate_error:
+        string = os.path.basename(__file__) + ': '
+        string += ' unexpected end of file'
+        raise ValueError(string)
+    return None
+
+def next_fasta_record(input_file):
+    """Read the next FASTA record from `input_file`.
+
+    Finding the end of a record requires reading the header of the following
+    one. The module-level FASTA_FILE_LAST_POS therefore remembers the offset
+    just after the last line consumed by a record, and each call seeks back
+    to it before reading.
+
+    Args:
+        input_file: open, seekable text file object.
+
+    Returns:
+        A SeqRecord, or None when the end of file is reached.
+    """
+    global FASTA_FILE_LAST_POS
+    if FASTA_FILE_LAST_POS is not None:
+        input_file.seek(FASTA_FILE_LAST_POS)
+
+    id_line = get_new_line(input_file, generate_error = False)
+    if id_line is None:
+        return None
+    # The header is consumed: move the resume point past it right away, so
+    # that a record without any sequence line is not read again on every call.
+    FASTA_FILE_LAST_POS = input_file.tell()
+
+    split_line = id_line[1:].split(' ')
+    seq_id = split_line[0]
+    description = ' '.join(split_line[1:])
+
+    seq_parts = []
+    new_line = get_new_line(input_file, generate_error = False)
+    # startswith() copes with blank lines, which simply add nothing
+    while new_line is not None and not new_line.startswith('>'):
+        seq_parts.append(new_line)
+        FASTA_FILE_LAST_POS = input_file.tell()
+        new_line = get_new_line(input_file, generate_error = False)
+    return SeqRecord(seq_id, ''.join(seq_parts), description)
+
+def next_fastq_record(input_file):
+    """Read the next four-line FASTQ record from `input_file`.
+
+    Args:
+        input_file: open text file object positioned at the start of a record.
+
+    Returns:
+        A SeqRecord carrying the raw quality string, or None at end of file.
+
+    Raises:
+        ValueError: if the first line does not start with '@' (blank lines
+            included), or if the file ends in the middle of a record.
+    """
+    id_line = get_new_line(input_file, generate_error = False)
+    if id_line is None:
+        return None
+    # startswith() also rejects an empty line with the intended error rather
+    # than failing on an index lookup
+    if not id_line.startswith('@'):
+        string = os.path.basename(__file__) + ': '
+        string += ' issue in fastq file'
+        raise ValueError(string)
+    split_line = id_line[1:].split(' ')
+    seq_id = split_line[0]
+    description = ' '.join(split_line[1:])
+    seq = get_new_line(input_file)
+    # Third line of the record (the '+' separator in FASTQ): read to move
+    # forward, its content is not checked
+    get_new_line(input_file)
+    quals = get_new_line(input_file)
+    return SeqRecord(seq_id, seq, description, quals)
+
+def next_record(input_file, file_format):
+    """Read the next record of `input_file` with the parser of `file_format`.
+
+    Returns what the format-specific parser returns; raises ValueError when
+    `file_format` is neither 'fasta' nor 'fastq'.
+    """
+    if file_format not in ('fasta', 'fastq'):
+        string = os.path.basename(__file__) + ': '
+        string += file_format + ' is not managed'
+        raise ValueError(string)
+    if file_format == 'fasta':
+        return next_fasta_record(input_file)
+    return next_fastq_record(input_file)
+
+def write_fasta_record(record, output_sequence_file):
+    """Write `record` in FASTA format, the sequence wrapped at 60 characters.
+
+    Args:
+        record: object providing get_id(), get_description() and
+            get_sequence().
+        output_sequence_file: writable text file object.
+    """
+    output_sequence_file.write('>' + record.get_id() + ' ' + 
+        record.get_description() + '\n')
+    seq = record.get_sequence()
+    # range() rather than xrange(): available on both Python 2 and Python 3
+    for start in range(0, len(seq), 60):
+        output_sequence_file.write(seq[start:start+60] + '\n')
+
+def format_qual_value(qual_score, sliding_value, authorized_range, qual_format):
+    """Convert one quality character into its numeric score.
+
+    Args:
+        qual_score: single character taken from a quality string.
+        sliding_value: offset subtracted from the character code.
+        authorized_range: two-item sequence, lowest then highest accepted
+            score (both inclusive).
+        qual_format: name of the quality format, used in the error message.
+
+    Returns:
+        The score as an integer.
+
+    Raises:
+        ValueError: if the score falls outside `authorized_range`.
+    """
+    ascii_value = ord(qual_score)
+    score = ascii_value-sliding_value
+    if score < authorized_range[0] or score > authorized_range[1]:
+        string = os.path.basename(__file__) + ': wrong score ('
+        string += str(score) + ') with quality format ('
+        # close the parenthesis opened just above
+        string += qual_format + ')'
+        raise ValueError(string)
+    return score
+
+def format_qual_string(qual_string, qual_format):
+    """Convert a quality character to its score for the given quality format.
+
+    `qual_string` is handed unchanged to format_qual_value(), together with
+    the offset and accepted score range registered for `qual_format`.
+
+    Raises:
+        ValueError: if `qual_format` is not one of the managed formats.
+    """
+    # qual_format -> (offset, [lowest, highest] accepted score)
+    # NOTE(review): the tool XML labels illumina_1_3 and illumina_1_5 as
+    # Phred+64 while offset 33 is used here; the expected illumina_1_3 test
+    # output appears to rely on 33 - confirm the intent before changing it.
+    encodings = {
+        'sanger': (33, [0,40]),
+        "solexa": (64, [-5,40]),
+        "illumina_1_3": (33, [0,40]),
+        "illumina_1_5": (33, [3,40]),
+        "illumina_1_8": (33, [0,41])
+    }
+    if qual_format not in encodings:
+        string = os.path.basename(__file__) + ': quality format ('
+        string += qual_format + ') is not managed'
+        raise ValueError(string)
+    sliding_value, authorized_range = encodings[qual_format]
+    return format_qual_value(qual_string, sliding_value, authorized_range,
+        qual_format)
+
+def write_qual_record(record, output_qual_file, qual_format):
+    """Write the quality scores of `record` as a FASTA-like block.
+
+    The header line is followed by the numeric scores, space separated, 60
+    per line.
+
+    Args:
+        record: object providing get_id(), get_description() and
+            get_quality().
+        output_qual_file: writable text file object.
+        qual_format: quality format name passed to format_qual_string().
+    """
+    output_qual_file.write('>' + record.get_id() + ' ' + 
+        record.get_description() + '\n')
+    qual = record.get_quality()
+    qual = [str(format_qual_string(qual_str,qual_format)) for qual_str in qual]
+    # range() rather than xrange(): available on both Python 2 and Python 3
+    for start in range(0, len(qual), 60):
+        output_qual_file.write(' '.join(qual[start:start+60]) + '\n')
+
+def write_fastq_record(record, output_sequence_file):
+    """Write `record` to `output_sequence_file` as a four-line FASTQ entry."""
+    header = '@' + record.get_id() + ' ' + record.get_description()
+    fastq_lines = [header, record.get_sequence(), '+', record.get_quality()]
+    for fastq_line in fastq_lines:
+        output_sequence_file.write(fastq_line + '\n')
+
+def write_information(record, output_file_formats, output_sequence_file, 
+    output_qual_file, qual_format):
+    """Write `record` in every format listed in `output_file_formats`.
+
+    'fasta' and 'fastq' go to `output_sequence_file`, 'qual' goes to
+    `output_qual_file`; the formats are handled in that fixed order.
+    """
+    writers = [
+        ("fasta", lambda: write_fasta_record(record, output_sequence_file)),
+        ("qual", lambda: write_qual_record(record, output_qual_file,
+            qual_format)),
+        ("fastq", lambda: write_fastq_record(record, output_sequence_file))
+    ]
+    for format_name, write_record in writers:
+        if format_name in output_file_formats:
+            write_record()
+
+def fast_test_element_in_list(element,list_to_test):
+    """Tell whether `element` is present in the sorted list `list_to_test`.
+
+    The list must be sorted in ascending order; a binary search then finds
+    the first item that is not lower than `element`, in logarithmic rather
+    than linear time.
+
+    Args:
+        element: value to look for.
+        list_to_test: list sorted in ascending order.
+
+    Returns:
+        True if `element` is in the list, False otherwise.
+    """
+    import bisect
+
+    position = bisect.bisect_left(list_to_test, element)
+    return position < len(list_to_test) and list_to_test[position] == element
+
+#########################
+# Constraint definition #
+#########################
+# Constraint names accepted by Constraint, each mapped to the object stored
+# as the constraint's `type`.
+constraints = {
+    'equal': operator.eq,
+    'different': operator.ne,
+    'lower': operator.le,
+    'strictly_lower': operator.lt,
+    'greater': operator.ge,
+    'strictly_greater': operator.gt,
+    'in': operator.contains,
+    # Placeholder string, not a callable: Constraint.test_constraint handles
+    # 'in' and 'not_in' itself and never calls the value stored for them.
+    'not_in': 'in'
+}
+
+# Record information that can be extracted or constrained, each mapped to the
+# type used to convert raw constraint values.
+extractable_information = {
+    'id': str,
+    'length': int,
+    'description': str
+}
+
+###########
+# Classes #
+###########
+class SeqRecord:
+    """One sequence entry: identifier, sequence, description and quality.
+
+    The quality string is empty when none is given; the length is computed
+    from the sequence at construction.
+    """
+
+    def __init__(self, seq_id, sequence, description, quality = ""):
+        self.id, self.description = seq_id, description
+        self.sequence, self.quality = sequence, quality
+        self.length = len(sequence)
+
+    # Getters
+    def get_id(self):
+        """Return the sequence identifier."""
+        return self.id
+
+    def get_sequence(self):
+        """Return the sequence."""
+        return self.sequence
+
+    def get_quality(self):
+        """Return the raw quality string."""
+        return self.quality
+
+    def get_length(self):
+        """Return the sequence length."""
+        return self.length
+
+    def get_description(self):
+        """Return the description."""
+        return self.description
+
+    def get(self, category):
+        """Return the information named `category`.
+
+        Accepted names are 'id', 'length' and 'description'; any other name
+        raises ValueError.
+        """
+        accessors = {
+            'id': self.get_id,
+            'length': self.get_length,
+            'description': self.get_description
+        }
+        if category in accessors:
+            return accessors[category]()
+        string = os.path.basename(__file__) + ': '
+        string += category + ' can not be extracted from SeqRecord'
+        raise ValueError(string)
+
+    # Other functions
+    def extract_information(self,to_extract):
+        """Return the values of the information named in `to_extract`, in order."""
+        return [self.get(info_name) for info_name in to_extract]
+
+    def test_conservation(self, constraints):
+        """Tell whether the record satisfies every constraint.
+
+        `constraints` maps an information name to a list of objects providing
+        test_constraint(); every constraint is evaluated, even once one has
+        failed.
+        """
+        keep = True
+        for info_name in constraints:
+            value = self.get(info_name)
+            for constraint in constraints[info_name]:
+                keep = keep & constraint.test_constraint(value)
+        return keep
+
+class Records:
+    """All records of a sequence file and the subset passing the constraints."""
+
+    def __init__(self, input_filepath, file_format, constraints):
+        """Parse `input_filepath` and sort out the records to conserve.
+
+        Args:
+            input_filepath: path of the sequence file.
+            file_format: 'fasta' or 'fastq'.
+            constraints: dict mapping an information name to a list of
+                Constraint objects, as built by format_constraints().
+        """
+        # next_fasta_record() resumes from this module-level offset; clear it
+        # so that parsing starts at the beginning of the file opened here.
+        global FASTA_FILE_LAST_POS
+        FASTA_FILE_LAST_POS = None
+
+        self.records = []
+        self.conserved_records = []
+        with open(input_filepath, 'r') as input_file:
+            while True:
+                record = next_record(input_file, file_format)
+                if record is None:
+                    break
+                self.records.append(record)
+                if record.test_conservation(constraints):
+                    self.conserved_records.append(copy.copy(record))
+
+    # Getters
+    def get_records(self):
+        """Return a shallow copy of the list of all records."""
+        return copy.copy(self.records)
+
+    def get_record_nb(self):
+        """Return the number of records read from the file."""
+        return len(self.records)
+
+    def get_conserved_records(self):
+        """Return a shallow copy of the list of conserved records."""
+        return copy.copy(self.conserved_records)
+
+    def get_conserved_record_nb(self):
+        """Return the number of conserved records."""
+        return len(self.conserved_records)
+
+    # Other functions
+    def save_conserved_records(self,args):
+        """Write the conserved records as requested by the parsed arguments.
+
+        When `args.custom_extraction_type` is 'True', a tab-separated table
+        of the information listed in `args.to_extract` is written to
+        `args.output_information`. Otherwise the sequences are written to
+        `args.output_sequence`, as FASTA, as FASTQ, or as FASTA plus a
+        quality file (`args.output_quality`) when `args.split` is 'True'.
+
+        Raises:
+            ValueError: if `args.format` is neither 'fasta' nor 'fastq'.
+        """
+        if args.custom_extraction_type == 'True':
+            # to_extract arrives wrapped in one leading and one trailing
+            # character, which are dropped before splitting
+            to_extract = args.to_extract[1:-1].split(',')
+            with open(args.output_information, 'w') as output_information_file:
+                output_information_file.write('\t'.join(to_extract) + '\n')
+                for record in self.conserved_records:
+                    extracted_info = record.extract_information(to_extract)
+                    string_info = [str(info) for info in extracted_info]
+                    output_information_file.write('\t'.join(string_info) + '\n')
+            return
+
+        qual_format = None
+        if args.format == 'fasta':
+            output_file_formats = ['fasta']
+        elif args.format == 'fastq':
+            if args.split == 'True':
+                output_file_formats = ['fasta','qual']
+                qual_format = args.quality_format
+            else:
+                output_file_formats = ['fastq']
+        else:
+            string = os.path.basename(__file__) + ': '
+            string += str(args.format) + ' is not managed'
+            raise ValueError(string)
+
+        output_qual_file = None
+        with open(args.output_sequence,'w') as output_sequence_file:
+            try:
+                if "qual" in output_file_formats:
+                    output_qual_file = open(args.output_quality, 'w')
+                for record in self.conserved_records:
+                    write_information(record, output_file_formats,
+                        output_sequence_file, output_qual_file, qual_format)
+            finally:
+                # Close the quality file even if writing a record failed
+                if output_qual_file is not None:
+                    output_qual_file.close()
+
+class Constraint:
+    """One constraint applied to a piece of information of a record."""
+
+    def __init__(self, constraint_type, value, constrained_information):
+        """Build the constraint.
+
+        Args:
+            constraint_type: one of the keys of the module-level
+                `constraints` table.
+            value: the reference value, or for 'in' and 'not_in' the path
+                of a text file holding one value per line.
+            constrained_information: key of `extractable_information`; its
+                type is used to convert the value(s).
+
+        Raises:
+            ValueError: if `constraint_type` is not a known constraint.
+        """
+        # `in` rather than has_key(): works on both Python 2 and Python 3
+        if constraint_type not in constraints:
+            string = os.path.basename(__file__) + ': '
+            string += constraint_type + ' is not a correct type of constraint'
+            raise ValueError(string)
+        self.raw_constraint_type = constraint_type
+        self.type = constraints[constraint_type]
+
+        value_format = extractable_information[constrained_information]
+        if self.raw_constraint_type in ['in', 'not_in']:
+            self.values = []
+            with open(value, 'r') as value_file:
+                for row in value_file:
+                    # Strip only the line terminator, so that a last line
+                    # without newline keeps its final character
+                    listed_value = row.rstrip('\r\n')
+                    if listed_value == '':
+                        # blank lines carry no value
+                        continue
+                    self.values.append(value_format(listed_value))
+        else:
+            self.values = [value_format(value)]
+        # fast_test_element_in_list() relies on the values being sorted
+        self.values.sort()
+
+    def get_raw_constraint_type(self):
+        """Return the constraint name given at construction."""
+        return self.raw_constraint_type
+
+    def get_type(self):
+        """Return the entry of the `constraints` table for this constraint."""
+        return self.type
+
+    def get_values(self):
+        """Return the sorted list of reference values."""
+        return self.values
+
+    def test_constraint(self, similarity_info_value):
+        """Tell whether `similarity_info_value` satisfies the constraint."""
+        if self.raw_constraint_type == 'in':
+            return fast_test_element_in_list(similarity_info_value, 
+                self.values)
+        if self.raw_constraint_type == 'not_in':
+            return not fast_test_element_in_list(similarity_info_value, 
+                self.values)
+        return self.type(similarity_info_value, self.values[0])
+
+################
+# Misc methods #
+################
+def test_input_filepath(input_filepath, tool, file_format):
+    """Raise ValueError when `input_filepath` does not exist.
+
+    `tool` and `file_format` are accepted but not used.
+    """
+    if os.path.exists(input_filepath):
+        return
+    message = os.path.basename(__file__) + ': ' + input_filepath
+    raise ValueError(message + ' does not exist')
+
+def format_constraints(constraints):
+    """Turn raw constraint strings into Constraint objects grouped by target.
+
+    Each string has the form '<information>: <type>: <value>'. It is split
+    on its first two colons only, so the value may itself contain colons,
+    and surrounding whitespace (line breaks and indentation included) is
+    removed from each part.
+
+    Args:
+        constraints: list of raw constraint strings, or None.
+
+    Returns:
+        A dict mapping each constrained information name to the list of its
+        Constraint objects; empty when `constraints` is None.
+
+    Raises:
+        ValueError: if a string does not hold the three expected parts.
+    """
+    formatted_constraints = {}
+    if constraints is None:
+        return formatted_constraints
+    for constr in constraints:
+        split_constraint = [part.strip() for part in constr.split(':', 2)]
+        if len(split_constraint) != 3:
+            string = os.path.basename(__file__) + ': '
+            string += constr + ' is not a correct constraint definition'
+            raise ValueError(string)
+        constrained_information, constraint_type, value = split_constraint
+        constraint = Constraint(constraint_type, value, 
+            constrained_information)
+        formatted_constraints.setdefault(constrained_information,[]).append(
+            constraint)
+    return formatted_constraints
+
+def convert_extract_sequence_file(args):
+    """Run the conversion/extraction described by `args` and write the report.
+
+    The records are read and filtered, the conserved ones are saved, then a
+    text report listing the extracted information, the constraints and the
+    record counts is written to `args.report`.
+    """
+    input_filepath, file_format = args.input, args.format
+    raw_constraints = args.constraint
+    formatted_constraints = format_constraints(raw_constraints)
+
+    records = Records(input_filepath, file_format, formatted_constraints)
+    records.save_conserved_records(args)
+
+    # The whole report is assembled first, then written in one go
+    report_lines = ['Information to extract:\n']
+    if args.custom_extraction_type == 'True':
+        for info in args.to_extract[1:-1].split(','):
+            report_lines.append('\t' + info + '\n')
+    else:
+        report_lines.append('\tsequences\n')
+
+    if raw_constraints is not None:
+        report_lines.append('Constraints on extraction:\n')
+        for constrained_info in formatted_constraints:
+            report_lines.append('\tInfo to constraint: ' + constrained_info
+                + '\n')
+            for constraint in formatted_constraints[constrained_info]:
+                report_lines.append('\t\tType of constraint: ' +
+                    constraint.get_raw_constraint_type() + '\n')
+                report_lines.append('\t\tValues:\n')
+                for value in constraint.get_values():
+                    report_lines.append('\t\t\t' + str(value) + '\n')
+
+    report_lines.append('Number of similarity records: ' +
+        str(records.get_record_nb()) + '\n')
+    report_lines.append('Number of extracted similarity records: ' +
+        str(records.get_conserved_record_nb()) + '\n')
+
+    with open(args.report, 'w') as report_file:
+        report_file.writelines(report_lines)
+
+########
+# Main #
+########
+if __name__ == "__main__":
+    # Command-line options, declared in the order they are registered
+    option_specs = [
+        ('--input', {'required': True}),
+        ('--format', {'required': True}),
+        ('--custom_extraction_type', {'required': True}),
+        ('--to_extract', {}),
+        ('--output_information', {}),
+        ('--split', {}),
+        ('--quality_format', {}),
+        ('--output_sequence', {}),
+        ('--output_quality', {}),
+        ('--constraint', {'action': 'append'}),
+        ('--report', {'required': True})
+    ]
+    parser = argparse.ArgumentParser()
+    for option_flag, option_settings in option_specs:
+        parser.add_argument(option_flag, **option_settings)
+    args = parser.parse_args()
+
+    convert_extract_sequence_file(args)
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/convert_extract_sequence_file.xml	Tue Apr 26 08:17:42 2016 -0400
@@ -0,0 +1,249 @@
+<tool id="convert_extract_sequence_file" name="Convert/ Extract information" version="1.0.0">
+
+	<description>from a sequence file, with possible constraints</description>
+
+    <macros>
+        <xml name="extraction_option">
+            <param name="to_extract" type="select" display="checkboxes" multiple="true" label="Information to extract" help="">
+                <option value="id">Identifier</option>
+                <option value="length">Length</option>
+                <validator type="no_options" message="Select at least one information to extract"/>
+            </param>
+        </xml>
+
+        <xml name="extraction_test">
+            <param name='specific_extraction' type="select" label="Extract specific information?" help="If no is selected, a sequence file is generated. If yes, a text file containing the wanted information is generated">
+                <option value="True">Yes</option>
+                <option value="False" selected="true">No</option>
+            </param>
+        </xml>
+    </macros>
+
+	<requirements>
+  	</requirements>
+
+    <stdio>
+    </stdio>
+
+    <version_command>
+    </version_command>
+
+  	<!--<command>-->
+    <command><![CDATA[
+        python $__tool_directory__/convert_extract_sequence_file.py
+            --input $sequence_file_format.sequence_file
+
+            --custom_extraction_type $sequence_file_format.extraction.specific_extraction
+
+            #if $sequence_file_format.extraction.specific_extraction == "True":
+                --to_extract "{$sequence_file_format.extraction.to_extract}"
+                --output_information $information_file
+            #else if $sequence_file_format.format=="fastq":
+                --split $sequence_file_format.extraction.split.split_test
+                ## split_test holds the text "True" or "False": compare it explicitly,
+                ## a non-empty text is always true when tested on its own
+                #if str($sequence_file_format.extraction.split.split_test) == "True":
+                    --quality_format $sequence_file_format.extraction.split.quality_format
+                    --output_sequence $fasta_sequence_file_from_fastq
+                    --output_quality $quality_file
+                #else:
+                    --output_sequence $fastq_sequence_file
+                #end if
+            #else:
+                --output_sequence $fasta_sequence_file
+            #end if
+
+            #if $constraints.constrained_extraction == "True" :
+                #for $i, $constrain in enumerate( $constraints.constraint_definition )
+                    #set info_to_constrain=$constrain.constrained_information['info_to_constrain']
+                    #if str($info_to_constrain) == "id":
+                        ## Kept on a single line: the script splits this argument on ': '
+                        --constraint "$info_to_constrain: ${constrain.constrained_information.constraint_type.type}: ${constrain.constrained_information.constraint_type.value}"
+                    #else:
+                        #for $j, $sub_constrain in enumerate( $constrain.constrained_information.constraint_definition )
+                            --constraint "$info_to_constrain: ${sub_constrain.type}: ${sub_constrain.value}"
+                        #end for
+                    #end if
+                #end for
+            #end if
+
+            --report $report_filepath
+            --format $sequence_file_format.format
+        ]]>
+    </command>
+
+  	<inputs>
+        <conditional name="sequence_file_format">
+        	<param name="format" type="select" display="radio" 
+                label="Format of the sequence file" help="">
+	            <option value="fasta">Fasta</option>
+                <option value="fastq">FastQ</option>
+	        </param>
+            <when value="fastq">
+                <param name="sequence_file" type="data" format="fastq" 
+                    label="Sequence file" help=""/>
+                <conditional name="extraction">
+                    <expand macro="extraction_test"/> 
+
+                    <when value="True">
+                        <expand macro="extraction_option"/> 
+                    </when>
+                    <when value="False">
+                        <conditional name="split">
+                            <param name='split_test' type="select" label="Split file into sequence and quality files?" help="If yes is selected, a fasta and a quality file are generated. If no, a fastq file is generated">
+                                <option value="True" selected="true">Yes</option>
+                                <option value="False">No</option>
+                            </param>
+
+                            <when value="True">
+                                <param name="quality_format" type="select" display="radio" label="Coding of quality scores?" help="">
+                                    <option value="sanger" selected="true">Sanger (Phred+33)</option>
+                                    <option value="solexa">Solexa (Solexa+64) </option>
+                                    <option value="illumina_1_3">Illumina 1.3+ (Phred+64) </option>
+                                    <option value="illumina_1_5">Illumina 1.5+ (Phred+64) </option>
+                                    <option value="illumina_1_8">Illumina 1.8+ (Phred+33) </option>
+                                </param>
+                            </when>
+                            <when value="False" />
+                        </conditional> 
+                    </when>
+                </conditional> 
+            </when>
+
+            <when value="fasta">
+                <param name="sequence_file" type="data" format="fasta" 
+                    label="Sequence file" help=""/>
+                <conditional name="extraction">
+                    <expand macro="extraction_test"/> 
+
+                    <when value="True">
+                        <expand macro="extraction_option"/>
+                    </when>
+                    <when value="False" />
+                </conditional> 
+            </when>
+        </conditional>
+        
+        <conditional name="constraints">
+            <param name='constrained_extraction' type='select' label="Constrain extraction?" help="">
+                <option value="True">Yes</option>
+                <option value="False" selected="true">No</option>
+            </param>
+
+            <when value="True">
+                <repeat name="constraint_definition" title="Constraints on sequences" min="1">
+                    <conditional name="constrained_information">
+                        <param name="info_to_constrain" type="select" label="Information to constrain" help="">
+                            <option value="id">Identifier</option>
+                            <option value="length">Length</option>
+                        </param>
+                        <when value="id">
+                            <conditional name="constraint_type">
+                                <param name="type" type="select" display="radio" label="Type of constraint" help="">
+                                    <option value="equal">Equal a value</option>
+                                    <option value="in">In a list</option>
+                                    <option value="not_in">Not in a list</option>
+                                </param>
+                                <when value="equal">
+                                    <param name="value" type="text" size="200" label="Equal to" help="">
+                                        <validator type="empty_field" message="Give a value"/>
+                                    </param>
+                                </when>
+                                <when value="in">
+                                    <param format="txt" name="value" type="data" label="List of constraint" help="Text file with a value per line and nothing else"/>
+                                        <validator type="unspecified_build" message="Select a file"/>
+                                </when>
+                                <when value="not_in">
+                                    <param format="txt" name="value" type="data" label="List of constraint" help="Text file with a value per line and nothing else"/>
+                                        <validator type="unspecified_build" message="Select a file"/>
+                                </when>
+                            </conditional>
+                        </when>  
+                        <when value="length">
+                            <repeat name="constraint_definition" title="Constraint on sequence length" min="1">
+                                <param name="type" type="select" label="Type of constraint" help="">
+                                    <option value="equal">Equal to </option>
+                                    <option value="lower">Lower than </option>
+                                    <option value="strictly_lower">Strictly lower than </option>
+                                    <option value="greater">Greater than </option>
+                                    <option value="strictly_greater">Strictly greater than </option>
+                                </param>
+                                <param name="value" type="integer" min="0" max="3000" value="100" label="Value" help=""/>
+                            </repeat>
+                        </when>  
+                    </conditional>
+                </repeat>
+            </when>
+            <when value="False" />
+        </conditional>
+  	</inputs>
+
+  	<outputs>
+        <data format="txt" name="information_file" 
+            label="${tool.name} on ${on_string}: Information">
+            <filter>((sequence_file_format['extraction']['specific_extraction'] == "True" ))</filter>
+        </data>
+
+        <data format="fasta" name="fasta_sequence_file"
+            label="${tool.name} on ${on_string}: Extracted sequences" >
+            <filter>((sequence_file_format['format'] == 'fasta' and not sequence_file_format['extraction']['specific_extraction']== "True" ))</filter>
+        </data>
+
+        <data format="fastq" name="fastq_sequence_file"
+            label="${tool.name} on ${on_string}: Extracted sequences">
+            <filter>((sequence_file_format['format'] == 'fastq' and sequence_file_format['extraction']['specific_extraction'] == "False" and sequence_file_format['extraction']['split']['split_test'] == "False" ))</filter>
+        </data>
+
+        <data format="qual" name="quality_file" 
+            label="${tool.name} on ${on_string}: Extracted quality">
+            <filter>((sequence_file_format['format'] == 'fastq' and sequence_file_format['extraction']['specific_extraction'] == "False" and sequence_file_format['extraction']['split']['split_test'] == "True" ))</filter>
+        </data>
+
+        <data format="fasta" name="fasta_sequence_file_from_fastq"
+            label="${tool.name} on ${on_string}: Extracted sequences">
+            <filter>((sequence_file_format['format'] == 'fastq' and sequence_file_format['extraction']['specific_extraction'] == "False" and sequence_file_format['extraction']['split']['split_test'] == "True" ))</filter>
+        </data>
+
+        <data format="txt" name="report_filepath" 
+            label="${tool.name} on ${on_string}: Report"/>
+  	</outputs>
+
+  	<tests>
+        <test>
+            <param name="format" value="fasta"/>
+            <param name="sequence_file" value="input_sequence_file.fasta"/>
+            <param name="specific_extraction" value="True" />
+            <param name="to_extract" value="length" />
+            <param name="constrained_extraction" value="False" />
+            <output name="information_file" file="information_lenght_fasta_output.txt"/>
+            <output name="report_filepath" file="report_length_fasta_output.txt"/>
+        </test>
+        <test>
+            <param name="format" value="fastq"/>
+            <param name="sequence_file" value="input_sequence_file.fastq"/>
+            <param name="specific_extraction" value="False" />
+            <param name="split_test" value="True" />
+            <param name="quality_format" value="illumina_1_3" />
+            <param name="constrained_extraction" value="False" />
+            <output name="quality_file" file="extracted_quality_illumina_1_3_fastq_output.qual"/>
+            <output name="fasta_sequence_file_from_fastq" file="extracted_sequences_illumina_1_3_fastq_output.fasta"/>
+            <output name="report_filepath" file="report_illumina_1_3_fastq_output.txt"/>
+        </test>
+  	</tests>
+
+  	<help><![CDATA[
+
+**What it does**
+
+This tool extracts information (sequences, id, length, ...) from sequence files, or converts a FastQ file to a Fasta file.
+
+Constraints can be added to the extraction/conversion. For example, only sequences longer than 30 bp can be extracted, or only sequences whose identifier is in a list.
+
+The input is a sequence file in fasta or fastq format. The tool generates different outputs given the chosen parameters.
+]]>
+  	</help>
+
+    <citations>
+    </citations>
+</tool>
+
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/extracted_quality_illumina_1_3_fastq_output.qual	Tue Apr 26 08:17:42 2016 -0400
@@ -0,0 +1,174 @@
+>HWI-M00234:263:000000000-ADM55:1:1101:21704:2233 1:N:0:ATCACG
+33 34 34 34 34 38 38 36 35 23 35 37 38 34 25 25 10 31 34 31 24 31 11 11 36 38 37 32 37 31 34 34 22 31 31 31 37 38 32 37 27 31 37 38 38 36 38 35 22 25 27 21 36 35 35 36 34 34 37 38
+38 34 37 38 38 34 27 21 21 11 37 27 37 37 34 38 37 34 19 33 37 37 30 20 30 27
+>HWI-M00234:263:000000000-ADM55:1:1101:21334:2699 1:N:0:ATCACG
+34 34 34 34 34 38 37 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 37 38 38 38 38 38 38 38 38 38 38 38 38 38 31 37 38 38 38 38 38 38 38 38 36 32 35 38 38 38
+38 38 38 38 38 38 38 38 38 38 37 38 38 38 38 37 37 31 34 37 37 36 38 38 35 38 38 38 38 38 37 38 38 38 38 38 38 38 38 37 38 37 34 37 38 38 38 38 38 37 38 34 36 28 37 38 37 35 38 37
+38 38 34 36 36 38 38 38 38 35 37 38 38 38 37 38 38 38 38 38 34
+>HWI-M00234:263:000000000-ADM55:1:1101:13968:2885 1:N:0:ATCACG
+27 34 34 23 34 36 37 35 38 38 37 35 37 27 11 21 31 37 22 37 34 38 37 11 25 37 37 34 36 35 31 31 31 11 26 26 11 27 34 37 37 37 32 11 21 34 31 37 34 31 11 27 36 10 23 22 37 37 34 37
+34 38 37 37 23 11 27 27 37 38 22 10 31 37 22 37 36 37 37 38 38 38 34 37 36 34 37 11 28 27 33 28 36 37 24 24 37 31 24 27 37 32 37 37 38 35 37 30 28 36 25 28 19 25 11 24 11 11 34 37
+24 32 19 11 29 23 29 34 10 29 18 33 37 38 35 26 31 11 22 29 11 28 28 29 21 30 28 24 11 11 31 10 31 19 27 28 21 24 24 34 24 11 31 10 31 27 10 22 17 26 31 20 26 15 9 24 25 30 23 17
+33 37 23 20 28 31 17 28 34 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2
+2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2
+>HWI-M00234:263:000000000-ADM55:1:1101:11873:2948 1:N:0:ATCACG
+34 34 34 34 34 34 35 26 33 21 34 11 26 27 36 32 37 36 34 37 31 37 38 38 38 38 32 36 34 36 38 31 37 31 37 38 38 38 37 32 32 37 24 37 38 38 34 37 29 37 22 27 37 34 37 37 27 21 37 36
+37 37 37 34 35 34 37 38 38 38 36 34 27 37 11 27 32 27 36 37 34 31 37 24 33 37 38 36 27 24 35 37 37 38 36 36 38 38 31 37 37 38 37 37 38 37 23 37 35 36 37 34 27 37 11 24 19 25 36 37
+24 11 34 28 36 38 38 38 34 34 37 34 34 36 29 33 10 29 36 24 37 34 38 38 21 10 31 34 34 29 36 37 34 23 35 29 34 36 37 11 36 28 31 28 36 30 34 11 21 28 32 37 38 29 29 24 30 35 34 38
+34 29 37 38 29 38 38 34 35 32 20 9 26 10 28 32 37 37 9 32 26 14 30 33 8 12 8 7 26 21 19 25 8 29 18 27 36 27 18 8 8 22 27 36 18 28 26 29 37 35 37 30 36 27 27 19 8 18 26 36
+37 31 37 37 32 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2
+>HWI-M00234:263:000000000-ADM55:1:1101:7855:3066 1:N:0:ATCACG
+34 34 34 34 34 38 38 38 38 38 38 38 38 37 38 38 38 34 33 34 37 38 38 38 38 38 37 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 11 34 36 38 38 38 38 38 38 38 38 38 38 38 38 38 38
+31 37 31 37 38 38 38 38 38 38 38 38 31 31 36 38 37 38 38 38 37 38 37 38 34 38 36 38 38 38 38 38 38 38 38 38 38 34 37 38 38 38 38 36 38 36 36 36 22 37 37 38 37 37 38 35
+>HWI-M00234:263:000000000-ADM55:1:1101:24817:3238 1:N:0:ATCACG
+34 34 34 34 34 22 37 38 37 38 36 38 38 38 38 38 38 35 37 38 38 38 38 38 38 35 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 37 36 36 34 38 38 38 38 38 38 37 37 38
+38 38 38
+>HWI-M00234:263:000000000-ADM55:1:1101:17179:3527 1:N:0:ATCACG
+34 34 34 34 34 38 27 37 34 34 38 38 37 38 38 37 38 38 38 38 38 38 38 38 37 38 38 38 38 38 38 35 36 38 30 27 36 34 38 34 37 36 38 27 36 38 38 38 37 11 34 37 38
+>HWI-M00234:263:000000000-ADM55:1:1101:21254:3571 1:N:0:ATCACG
+34 34 34 34 34 37 36 37 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 27 37 34 34 38 38 37 37 38 38 35 37 38 38 38 37 38 38 34 38 38 22 37 38
+38 38 38 38 34 38 38 32 37 37 36 36 38 34 25 37 38 38 38 38 38 38 38 38 38 35 37 38 38 37 32 38 37 38 38 38 38 22 37 36 38 38 38 38 38 38 36 22 37 38 38 38 29 36 38 38 38 37 37 37
+34 37 38 38 37 34 36 36 38 38 37 38 34 38 38 38 37 38 37 35 38 37 37 38 38 34 37 38 38 38 22 34 26 11 20 28 36 37 11 34 38 20 24 35 34 34 38 31 11 20 34 37 37 37 38 28 37 34 9 34
+37 37 38 38 38 35 37 38 38 32 37 37 37 37
+>HWI-M00234:263:000000000-ADM55:1:1101:16569:3709 1:N:0:ATCACG
+34 34 34 34 34 38 38 38 38 38 38 38 38 38 38 38 38 38 37 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 37 38 38 38 38 38 38 38 38 38 38 38 38
+38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 37 38 38 38 38 38 38 38 38 38 38 38 38 24 37 38 38 38 38 35 38 38 38 38 38 38 38 36 34 38 38
+38 38 38 36 38 34 38 38 38 38 38 38 38 35 38 38 38 37 38 38 38 38 38 37 38 38 38 38 38 38 37 38 38 38 38 38 38 38 38 38 38 38 32 34 37 38 38 38 37 38 38 38 38 38 37 38 38 38 38 38
+34 37 38 38 38 38 38 38 37 37 37 37 37 37 36 37 25 21 20 34 37 37 37 23 37 36 37 22 32 37 36 37 36 36 7 11 21
+>HWI-M00234:263:000000000-ADM55:1:1101:22403:3828 1:N:0:ATCACG
+34 34 34 34 34 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 37 38 38 38 38 38 38 38 38 38 36 38 38 38 38 38 38 38 38 37 38 38 38
+38 38 38 38 38 38 38 38 38 38 38 38 38 37 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 34 38 38 37 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38
+38 38 38 38 38 38 38 38 38 38 38 38 38 29 35 38 38 38 38 38 38 38 38 37 35 37 37 36 35 38 38 38 34 36 36 36 34 38 38 38 37 38 38 38 38 38 38 37 38 38 38 38 38 38 38 37 37 37 35 38
+38 38 38 37 37 38 38 38 28 35 30 35 37 37 37 37 30 34 37 37 37 20 9 25 27 36 37 36 29 10 9 18 23 23 21 28 32 32 32 31 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2
+2 2 2 2 2 2 2 2 2 2 2 2 2 2
+>HWI-M00234:263:000000000-ADM55:1:1101:7508:4067 1:N:0:ATCACG
+34 34 34 34 34 38 37 38 38 37 23 37 37 36 34 37 37 34 38 36 24 37 37 38 38 38 38 24 34 37 32 37 37 34 34 31 31 34 37 38 37 38 38 34 38 37 38 38 38 38 38 38 37 37 38 35 38 36 37 37
+36 37 38 23 37 38 38 37 31 31 37 38 34 37 38 38 34 32 31 37 34 37 37 34 37 38 38 38 38 37 37 38 37 37 24 30 30 37 37 37 37 38 38 38 38 38 37 37 37 28 37 38 38 38 35 36 37 25 37 23
+11 19 31 32 34 36 36 23 34 34 36 36 38 38 38 34 34 37 38 24 37 37 37 32 37 38 21 34 38 38 36 38 36 11 28 18 36 38 34 17 26 28 36 37 37 37 38 37 38 37 38 38 24 31 24 36 38 38 38 38
+34 29 23 28 35 34 37 38 38 35 37 36 37 37 10 28 22 27 32 37 37 36 29 29 20 32 32 36 37 23 32 37 36 20 23 24 9 8 23 19 24 29 20 17 19 28 26 23 9 16 24 23 30 34 36 30 24 29 20 24
+31 29 21 7 21 21 31 34 27 13 8 8 14 20 26 29 7 16 18 28 36 37 36 21 15 7 18 18 19 25 32 33 30
+>HWI-M00234:263:000000000-ADM55:1:1101:26232:4161 1:N:0:ATCACG
+34 34 34 34 34 38 38 37 38 37 37 37 38 38 38 38 38 38 34 37 38 38 38 38 38 38 38 38 38 38 38 37 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38
+38 38 38 34 37 38 38 37 38 36 38 37 38 38 38 38 37 38 37 38 37 38 38 38 37 32 37 35 38 34 37 38 38 38 38 37 38 38 38 37 38 34 38 37 38 38 38 38 34 38 38 38 37 38 38 38 38 25 37 37
+38 38 37 31 37 24 37 38 38 38 38 38 37 38 38 38 38 38 38 34 36 38 38 34 30 37 38 38 38 38 38 38 38 37 38 38 35 37 37 38 37 23 35 37 38 38 34 38 38 38 38 34 35 37 38 38 38 38 38 38
+38 38 35 37 38 38 34 37 38 37 35 37 22 26 36 37 37 37 37 37 37 37 33 27 37 35 37 37 32 36 35 37 37 37 37 37 37 31 34 36 37 34 34 36 36 37 37 37 37 37 33 36 37 36 31 23 28 31 21 20
+22 29
+>HWI-M00234:263:000000000-ADM55:1:1101:23151:4189 1:N:0:ATCACG
+34 34 34 23 32 37 11 21 11 37 38 38 34 37 36 36 33 37 38 34 32 37 38 38 38 37 38 38 37 22 37 33 23 11 34 37 11 27 11 26 11 34 36 36 27 11 31 11 23 10 11 11 21 11 11 11 34 37 37 38
+38 38 38 38 11 37 27 36 32 31 37 11 33 27 37 21 31 37 34 21 31 34 33 36 24 37 22 37 11 20 25 37 24 32 37 23 19 32 11 32 33 37 37 11 28 32 11 32 11 19 11 19 32 36 37 36 38 38 38 38
+38 35 23 28 36 34 11 11 19 11 34 26 36 37 24 11 24 28 10 19 10 10 11 10 19 28 23 35 38 38 21 31 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2
+2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2
+2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2
+>HWI-M00234:263:000000000-ADM55:1:1101:17148:4803 1:N:0:ATCACG
+32 32 34 33 34 35 37 32 31 31 25 10 25 34 34 36 37 22 31 34 34 31 31 32 37 37 35 38 35 26 37 35 32 31 31 21 36 31 37 37 27 11 34 34 26 31 31 10 22 31 37 38 31 37 27 34 34 37 37 31
+37 31 37 31 11 27 11 33 31 37 11 34 35 38 27 31 37 36 37 27 31 11 31 11 34 32 37 24 36 27 37 35 27 30 30
+>HWI-M00234:263:000000000-ADM55:1:1101:8939:4808 1:N:0:ATCACG
+34 34 23 34 24 34 21 27 36 37 38 37 36 36 38 38 38 38 38 38 38 35 36 34 38 37 35 36 31 37 37 32 37 38 37 38 37 38 38 38 38 38 38 38 38 37 38 37 36 36 31 37 37 38 37 36 38 38 34 37
+36 34 35 38 34 34 37 38 34 10 21 31 33 31 31 37 37 38 11 23 37 31 37 37 38 38 38 38 37 36 35 37 34 37 31 37 37 37 38 38 35 37 37 35 37 37
+>HWI-M00234:263:000000000-ADM55:1:1101:11727:5103 1:N:0:ATCACG
+34 34 34 34 34 38 38 38 38 38 38 38 38 37 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 37 38 38 38 38 38 38 38 38 38
+38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 37 37 38 38 38 38 38 38 38 38 38 37 38 38 38 38 38 38 38 38 38 38
+38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 37 37 38 38 38 38 38 38 38 38 38 38 38 38 38 38 37 38 38 37 35 37 31 38 38 35 38 38 38 38
+38 38 38 38 38 19 9 26 34 37 37 37
+>HWI-M00234:263:000000000-ADM55:1:1101:15029:5173 1:N:0:ATCACG
+34 34 34 34 34 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 36 38 38 22 37 36 34 38 37 38 38 38 38 38 36 38 38 38 38 38 36 36 38 38 38 38 38 38 38 38 38 38 38 38 38
+38 38 37 38 38 38 38 38 38 38 38 38 38 38 38 37 38 38 38 34 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 37 37 38 38 38 38 38 38 38 38 38 38 37 37 38 24 37 34 38 38 38 37 38 38 38
+38 38 37 37 37 35 38 38 36 36 34 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 36 34 38 38 38 38 38 35 29 34 34 38 29 28 24 23 36 22 24 28 34 35 35 35 35 19 35 20 35
+38 37 28 37 38 38 38 35 38 37 37 37 37 37 37 37 37 21 32 34
+>HWI-M00234:263:000000000-ADM55:1:1101:7330:5248 1:N:0:ATCACG
+34 34 34 34 34 38 36 38 38 38 38 38 38 37 38 38 38 38 38 36 38 38 38 38 38 38 37 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 37 37 38 38 38 38 35 36 38 38
+38 38 38 37 38 38 38 38 38 38 38 38 38 38 36 34 38 38 38 38 36 37 38 35 38 32 37 38 38 38 38 38 38 37 37 38 29 38 38 36 34 37 37 38 34 37 10 31 34 34 31 37 38 38 10 10 31 37 37 37
+37 11 29 37 11 35 37 37 38 38 37 37 38 34 38 36 37 38 21 34 36 38 20 19 9 28 31 35
+>HWI-M00234:263:000000000-ADM55:1:1101:18630:5353 1:N:0:ATCACG
+34 34 34 34 34 38 38 38 38 38 38 38 38 38 34 38 38 38 38 38 38 38 38 38 38 37 38 38 37 38 37 38 38 38 38 38 38 38 36 38 38 38 38 38 38 38 38 38 38 38 38 38 35 36 34 35 37 38 38 38
+38 38 38 38 38 38 38 37 38 38 38 38 35 38 38 38 38 38 38 38 38 38 38 38 38 37 37 37 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 35 23 27 37 38 38 38 37 38 38 38 38 38 38 38
+37 32 36 38 38 37 38 34 11 23 36 37 38 38 38 38 37 35 34 24 35 38 24 36 24 35 34 36 36 29 36 38 38 35 38 38 37 38 38 38 38 37 38 30 37 34 37 35 36 35 21 37 21 35 38 21 34 21 28 28
+35 35 22 28 35 28 35 21 35 37 37 30 37 9 9 18 26 24 31 30 21 24 24 34 35 33 37 37 20 37 36 33 29 29 35 29 25 31 15 15 29 28 34 9 23 25 26 17 20 26 20 24 9
+>HWI-M00234:263:000000000-ADM55:1:1101:11799:5476 1:N:0:ATCACG
+34 34 34 34 27 37 37 37 38 38 37 31 37 37 37 38 37 37 38 34 38 34 34 37 38 38 38 36 37 38 38 35 26 34 37 37 38 37 38 38 38 38 38 38 34 37 37 31 37 37 38 38 34 27 36 36 38 38 38 34
+36 37 38 38 38 37 31 36 31 31 11 33 37 37 38 37 38 38 38 38 38 22 10 31 32 37 36 32 36 37 37 38 38 38 38 38 38 38 37 37 36 38 38 37 38 38 38 34 36 38 36 37 35 38 37 38 38 37 38 38
+25 28 29 31 36 34 31 31 22 22 31 36 29 19 35 36 34 23 34 29 35 38 38 38 29 37 38 38 38 38 37 28 35 32 36 34 35 35 37 35 36 38 23 28 28 10 10 28 11 21 28 37 38 35 38 37 38 38 38 38
+38 38 38 38 38 38 37 37 38 37 37 37 37 37 37 37 37 37 37 35 37 37 32 35 37 37 37 36 32 37 31 37 31 34 20 31 36 36 37 20 28 36 26 36 36 19 19 22 22 32 37 33 36 37 33 37 26 9 32 19
+29 34
+>HWI-M00234:263:000000000-ADM55:1:1101:11348:5668 1:N:0:ATCACG
+34 34 34 34 34 38 38 38 38 38 38 38 38 38 34 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38
+38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 34 37 38 37 38 38 38 38 38 35 38 38 34 38 38 38 38 38 38 38 38 38 38 38 38 38
+38 37 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 37 38 38 38 38 38 38 35 38 38 38 38 38 38 38 38 38 35 38 38 38 21 29 36 24 34 34 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38
+38 38 37 38 37 38 37 37 37 37 37 37 37 37 37 37 37 37 37 37 32 37 37 37 37 37 37 37 37 37 37 37 33 16 24 24 31 37 28 24 31 35 37 31 30 26 31 37 35 37 37 37 37 37 37 29 17 22 19 32
+29 33 27 30 37 32 33 37 37 22 30 37 30 30 30 37 33 24 19 25 27 27 37 17 21 8 12 21 24 29 15
+>HWI-M00234:263:000000000-ADM55:1:1101:25874:5826 1:N:0:ATCACG
+34 34 34 34 34 35 37 38 38 38 38 27 31 37 11 34 36 27 37 38 38 36 38 35 35 37 38 24 36 36 36 37 22 34 38 37 38 38 38 24 27 36 31 35 31 31 36 34 11 31 37 37 37 36 38 38 38 11 34 27
+24 34 27 37 38 38 37 38 37 10 31 34 38 36 36 34 38 36 37 37 38 38 38 38 27 37 27 32 11 11 19 30 37 30 11 30 20 36 35 37 11 11 28 33 36 37 10 11 32 27 32 11 34 11 11 32 36 23 19 10
+37 28 10 37 29 37 37 38 38 37 37 38 35 23 35 29 35 36 11 11 18 22 18 10 10 10 10 10 10 21 11 11 18 31 10 10 10 31 24 9 31 24 29 20 31 34 9 27 25 25 22 11 9 15 26 34 34 22 10 25
+9 18 24 34 37 9 15 19 20 30 23 32 34 28 32 25 33 33 25 20 8 15 20 14 26 21 25 21 8 23 21 25 25 23 31 37 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2
+2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2
+>HWI-M00234:263:000000000-ADM55:1:1101:26932:5861 1:N:0:ATCACG
+24 21 33 34 34 37 38 38 36 38 38 38 37 38 38 38 38 38 30 36 37 37 38 38 38 38 38 34 37 38 24 37 35 37 38 38 37 38 23 37 38 38 34 37 38 38 38 38 38 38 38 38 38 37 35 38 38 35 37 36
+33 37 38 37 37 38 38 38 38 38 36 36 36 37 38 38 38 27 37 37 37 34 37 34 37 37 38 35 34 37 38 37 38 38 27 23 37 38 36 37 38 38 38 34 34 37 37 32 36 38 38 37 37 38 37 37 37 37 38 38
+23 36 36 37 34 36 38 38 31 36 35 36 38 38 37 38 37 37 37 37 38 38 37 34 33 36 36 23 34 37 23 28 34 37 37 32 37 11 28 35 23 37 23 37 38 38 10 31 35 34 23 21 30 28 34 38 37 35 38 34
+24 35 21 37 34 25 37 34 9 10 26 24 9 18 18 16 30 10 28 26 32 33 33 19 24 29 37 35 36 33 28 19 20 31 31 37 37 37 33 37 37 26 23 31 36 31 37 34 8 14 21 21 24 15 7 12 16 8 8 11
+23 17 30 33 30 30 33 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2
+>HWI-M00234:263:000000000-ADM55:1:1101:14154:5990 1:N:0:ATCACG
+34 34 34 34 34 38 38 34 27 37 24 35 36 31 36 38 24 37 37 31 31 37 38 37 38 38 37 36 37 38 37 31 36 31 37 32 37 38 38 38 37 38 37 36 36 23 37 37 36 38 38 38 38 35 29 29 28 37 23 37
+38 23 30 36 36 35 37 38 38 38 38 38 38 27 37 37 35 30 37 37 31 37 37 38 36 23 37 28 11 29 37 37 36 33 34 36 37 38 38 38 37 38 38 38 38 38 38 34 36 38 23 35 30 37 37 38 38 36 38 38
+37 37 36 38 36 36 23 37 37 38 38 38 38 23 10 10 29 23 36 29 36 20 31 33 35 32 30 37 38 38 38 38 38 38 34 37 37 21 36 28 28 20 22 30 30 23 21 36 34 37 34 37 31 34 34 34 34 33 37 34
+38 35 38 38 38 38 28 9 29 18 8 23 21 23 25 22 28 37 37
+>HWI-M00234:263:000000000-ADM55:1:1101:25022:6229 1:N:0:ATCACG
+34 34 34 34 34 38 38 38 38 38 38 37 38 38 38 37 38 38 38 38 36 38 38 34 37 38 37 38 38 32 36 38 38 38 35 38 38 36 38 38 38 37 38 37 37 38 38 24 37 37 38 36 37 38 38 38 38 38 38 38
+38 38 32 36 38 38 38 23 37 37 38 38 38 30 36 37 38 38 38 38 34 37 38 38 38 34 34 37 38 37 37 38 34 37 38 38 38 34 38 38 38 38 38 38 24 36 37 11 36 38 38 34 37 37 38 37 37 38 38 36
+36 38 38 38 35 36 38 38 38 32 37 38 38 38 34 36 37 36 36 33 36 23 36 35 37 38 38 38 38 38 38 38 38 34 38 38 38 38 38 38 38 38 37 38 34 37 35 35
+>HWI-M00234:263:000000000-ADM55:1:1101:21023:6286 1:N:0:ATCACG
+34 34 34 34 34 38 38 38 34 37 37 38 38 35 36 38 38 38 38 38 38 37 38 38 38 38 38 38 38 38 38 38 38 38 38 36 38 38 38 38 38 37 36 38 38 38 38 38 38 38 35 37 37 38 24 37 34 38 38 38
+38 38 38 38 38 38 38 38 37 37 37 38 38 38 38 38 36 38 34 37 38 35 38 38 38 32 38 23 36 37 27 37 37 38 38 38 38 38 38 38 37 38 38 34 35 38 35 36 38 37 38 38 38 38 38 38 38 37 38 37
+30 38 38 35 37 35 37 38 35 35 36 38 35 10 33 28 35 37 37 37 35 24 35 38 37 38 38 38 38 38 36 38 34 37 34 36 38 36 38 38 38 38 37 34 37 29 37 38 38 34 38 38 38 38 34 38 38 37 35 35
+38 27 20 20 34 37 19 34 37 37 26 20 20 20 20 29 37 37 37 37 37 32 21 10 15 7 17 11 15 23 8 15 15 7 18 21 11 11 8 20 25 32 33 17 25
+>HWI-M00234:263:000000000-ADM55:1:1101:8138:6336 1:N:0:ATCACG
+34 34 34 34 34 38 38 38 37 27 37 38 38 38 38 36 35 31 37 38 38 38 37 38 38 38 38 38 38 35 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38
+38 38 38 38 38 38 38 38 34 38 37 38 38 38 34 38 38 38 38 38 38 38 38 38 38 38 38 38 37 38 38 37 36 38 38 38 38 35 38 38 36 37 34 34 38 36 37 37 38 38 38 38 32 37 38 38 38 38 38 37
+38 37 37 37 38 38 37 38 38 37 38 35 37 38 38 38 38 38 38
+>HWI-M00234:263:000000000-ADM55:1:1101:11055:6543 1:N:0:ATCACG
+31 33 11 23 33 37 23 36 37 38 37 38 38 22 22 31 22 10 23 31 31 21 11 37 37 37 27 11 10 31 34 10 21 37 37 24 24 31 32 31 36 34 11 34 34 11 33 37 37 35 37 38 32 27 31 35 11 34 24 37
+31 34 37 22 11 33 22 34 37 38 38 11 34 31 11 33 31 27 37 30 22 37 37 23 27 11 25 11 34 31 11 30 27 36 36 11 34 30 32 11 36 11 32 34 36 37 38 24 11 34 26 31 11 11 32 26 36 36 32 11
+11 30 36 24 23 23 19 33 23 28 11 24 11 19 11 31 10 22 29 31 11 33 26 28 11 21 21 10 31 35 11 11 31 11 18 28 36 37 28 25 31 37 11 34 28 23 23 21 11 10 21 31 35 23 35 10 21 10 15 28
+28 34 24 10 21 10 20 10 15 26 10 16 10 18 33 34 16 27 32 30 24 29 24
+>HWI-M00234:263:000000000-ADM55:1:1101:24980:6575 1:N:0:ATCACG
+34 34 34 34 34 38 38 38 38 38 37 38 38 38 38 38 38 38 38 38 38 38 37 38 38 38 38 38 38 38 38 31 38 27 37 37 37 38 38 38 36 36 38 38 38 38 38 38 37 38 38 34 36 34 37 38 38 38 38 38
+35 25 31 37 38 38 38 38 38 22 32 35 38 38 38
+>HWI-M00234:263:000000000-ADM55:1:1101:7596:6682 1:N:0:ATCACG
+34 34 34 34 34 38 38 38 38 38 38 32 34 37 38 38 38 38 38 37 37 36 36 38 38 38 38 38 38 37 37 36 38 38 38 38 38 38 38 38 38 38 36 38 37 38 38 38 38 36 37 38 31 37 38 35 37 37 38 38
+38 38 38 38 38 36 38 38 38 35 38 37 37 34 34 29 37 38 34 35 37 38 37 38 38 38 34 36 11 36 25 37 34 34 34 34 22 34 38 38 38 38 38 38 37 36 26 37 37 36 37 34 34 38 37 38 38 31 34 36
+37 38 38 38 38 31 37 31 29 31 23 35 38 38 38 28 26 31 37 37 37 38 38 34 26 36 21 11 31 31 10 19 25 11 18 16 23 26 24 11 31 37 38 31 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2
+2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2
+>HWI-M00234:263:000000000-ADM55:1:1101:24419:6736 1:N:0:ATCACG
+34 34 34 34 34 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 35 38 38 38 38 38 37 38 38 38 38 38 38 38 35 38 38 38 38 38 38 38 38 38
+38 38 38 38 38 38 38 35 37 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 37 38 38 38 37 38 38 38 38 38 38 38 38 35 24 37 37 34 37 36 38 38 38 37 38 38 38
+38 38 22 28 10 19 29 31 36 37 36 36 37 37 38 22 29 36 36 35 36 36 36 37 35 35 35 38 31 23 35 34 37 36 37 35 37 38 38 34 23 28 34 35 34 38 38 37 38 38 35 34 21 29 35 35 38 35 34 37
+35 38 35 38 35 38 37 38 38 31 32 37 33 32 30 37 37 37 37 37 37 37 37 32 33 33 37 24 20 33 31 32 37 37 37 37 37 37 37 37
+>HWI-M00234:263:000000000-ADM55:1:1101:5068:6755 1:N:0:ATCACG
+34 34 34 34 34 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38
+38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 35 37 37 30 37 38 38 38 38 38 35 37 38 38 38 38 38 38 38 38 38 38 37 37 37 37 38 38 38 38 38 37 38 38 37 38 38 38 38 38 38 35
+38 38 38 38 38 38 38 37 38 38 38 36 36 35 38 38 38 24 34 24 36 36 38 38 38 38 38 35 23 31 37 38 38 38 38 38 38 38 38 38 38 38 38 38 29 34 37 38 38 38 38 38 34 37 38 35 38 35 37 38
+37 38 38 37 22 34 37 38 35 37 29 37 37 37 32 37 28 26 32 29 36 35 35 33 37 33 33 37 37 37 31 35 31 35 27 36 30 31 37 15 16 26 31 27 30 34 27 19 22 16 13 17 8 19 23 27 30 30 17 7
+20 19 24 27 33 29 37 35 37 17 19 8 21 21 27 8 8
+>HWI-M00234:263:000000000-ADM55:1:1101:21477:6796 1:N:0:ATCACG
+34 34 11 32 34 25 37 23 27 37 31 34 34 36 35 38 38 34 36 38 38 38 38 38 37 32 38 27 37 38 38 23 31 37 36 37 36 37 37 34 36 38 38 34 37 37 27 27 27 37 31 27 34 10 31 37 37 25 32 37
+34 36 37 36 11 36 34 37 24 32 37 38 34 31 35 36 27 37 36 11 11 20 31 24 33 23 33 37 37 34 36 23 37 11 28 37 37 31 34 38 22 37 34 37 38 35 25 37 37 37 22 36 32 37 35 38 24 37 26 37
+37 37 31 25 37 36 36 38 31 19 28 31 35 36 37 38 21 28 36 38 34 32 35 34 21 31 36 34 34 32 11 31 35 35 37
+>HWI-M00234:263:000000000-ADM55:1:1101:12483:6880 1:N:0:ATCACG
+34 34 34 34 34 38 38 38 38 38 38 38 37 38 38 37 38 38 38 38 38 37 38 35 37 36 38 38 38 38 38 37 37 37 38 38 37 38 38 38 38 38 38 38 38 37 38 38 38 37 38 38 38 38 38 38 38 38 34 36
+38 38 38 38 34 37 38 38 38 38 38 38 38 38 38 38 38 38 37 38 38 38 37 36 38 38 35 38 38 38 38 37 37 37 38 38 38 38 38 38 38 38 37 38 38 38 38 38 38 38 38 38 38 37 38 37 38 34 37 31
+37 36 37 37 38 35 32 38 37 38 37 38 38 38 38 37 38 38 38 38 35 38 38 38 37 37 38 38 38 35 26 36 36 37 38 38 38 38 38 38 38 37 38 38 38 38 38 38 38 38 38 38 37 35 38 35 38 38 38 38
+38 38 38 38 38 38 38 35 38 37 37 37 37 37 37 37 24 26 26 35 37 37 37 37 37 33 37 37 33 35 33 37 37 33 37 35 28 35 35 37 35 37 37 37 36 37 36 37 36 37 36 36 34 36 27 31 36 31 34 37
+37 31 36 33 32 37 37 36 36 36 37 37
+>HWI-M00234:263:000000000-ADM55:1:1101:27958:6935 1:N:0:ATCACG
+34 34 34 34 34 38 38 38 38 38 38 38 38 38 38 38 35 38 38 34 37 38 38 38 38 38 38 38 37 36 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 23 35 34
+27 37 38 38 38 37 37 38 38 38 38 38 38 38 38 38 38 34 38 37 25 37 35 38 38 38 38 38 38 31 37 36 36 36 38 38 38 36 38 35 38 38 38 37 38 38 38 38 38 38 25 37 37 38 38 28 36 38 37 37
+37 34 36 37 38 24 36 36 37 38 35 10 31 31 36 36 35 36 35 23 35 32 29 36 36 34 31 36 37 38 37 32 37 37 38 37 28 37 30 10 19 19 26 34 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2
+2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2
+2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2
+>HWI-M00234:263:000000000-ADM55:1:1101:6151:7404 1:N:0:ATCACG
+34 34 34 34 34 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 37 38 37 38 38 38 38 38
+38 38 38 38 38 37 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 38 35 37 23 37 38 38 38 37 38 38 38 38 36 38 38 38 22 10 34 38 38 37 38 38 38 38 38 38 38 38 34 25 23 37 38 38
+38 35 37 38 37 36 38 38 38 37 38 38 38 37 38 34 38 38 38 38 38 38 38 38 35 38 30 36 38 38 38 38 38 37 37 11 27 37 38 38 38 38 37 35 38 38 38 38 11 20 11 36 37 38 38 38 35 10 10 9
+20 25 35 38 37 34 35 35 30 21 29 32 37 37 37 19 30 21 8 20 30 36 33 30 35 15 29 35 37 37 37 32 37 15 7 14 13 21 27 35 15 18 26 18 7 8 13 21 19 21 27 32 8 8 13 8 8 7 19 25
+15 27 33 37 33 35 30 37 27 17 27 32 37 37 27 33 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/extracted_sequences_illumina_1_3_fastq_output.fasta	Tue Apr 26 08:17:42 2016 -0400
@@ -0,0 +1,174 @@
+>HWI-M00234:263:000000000-ADM55:1:1101:21704:2233 1:N:0:ATCACG
+GTGTACAAGGCCCGGGAACGTATTCACCGCGGCATGCTGATCCGCGATTACTAGCGATTC
+CAACTTCATACAGGCGGGTTTCAGCC
+>HWI-M00234:263:000000000-ADM55:1:1101:21334:2699 1:N:0:ATCACG
+CTTTTGACGGCCTTTTTGTTGTCTTCTGAATTTTGTTTTTTTCGGTTGTAACATAATTCC
+TAAAAATCAAATTCGTTAGCGATTATTTTTCTTTCTTTTGAAGTTCTTTCCGCCATTGTT
+TCCGCTATTGCTTCCACGACC
+>HWI-M00234:263:000000000-ADM55:1:1101:13968:2885 1:N:0:ATCACG
+CCCACTGCTGCCTCCCGTAGGAGCCTGGACCGTGTCTCAGTTCCAATGTGGCCGATCACC
+CTCTCAGGTCGGCTACCCATCGTTGCCCTGGTAAGCCATTACCCTACCAACTAGCTAATG
+GGACGCGGGCACATCTCAAAGCGGATTACCCCTTTGGTTAAAGTTTAATGCGAAACTCTA
+ACTTTATGCGTTATTAACCCTCCTTTCGGAGGGCTATTCCCCTCTTTGATGCAGGTTGCC
+CACGTGTTACTCACCCGTCCGCCGCTAATCCACTTCCCGAAGGCAGATTCAACCCTCGAT
+>HWI-M00234:263:000000000-ADM55:1:1101:11873:2948 1:N:0:ATCACG
+CCCCGTTACATCTTCCGCGCAGGAAGACTCGATCAGTGAGCTATTACGCTTTCTTTGAAG
+GATGGCTGCTTCTAAGCCAACTTCCTGACTGTCTTAGCCTTCCCACTTCGTTTTCCACTT
+AGTCAATATTAGGGACCTTAGCCGGCGGTCTGGGTTGTTTCCCTCTTGAGTCCGGACGTT
+AGCACCCGGTGCTCTGTCCCCCGTGCCCAAACTTCCAAGTATTCGGAGTTTGCCATGGTT
+TGGTAAGACGCTATGTCCCCCTAACCATAACAGTGTTCTACCCTCTGAACACATACTCGA
+>HWI-M00234:263:000000000-ADM55:1:1101:7855:3066 1:N:0:ATCACG
+CGTCAATCTTCCAACGCCCACGGCAGATAGGGACAAAACTGTCTCACGACGTTTTAAACC
+CAGCTCACGTACCTCTTTAAATGGCGAACAGCCATACCCTTGGGACCGGCTACAGC
+>HWI-M00234:263:000000000-ADM55:1:1101:24817:3238 1:N:0:ATCACG
+CCCGTGACCAGATTCATGGCCGCCGGTTAGAACCCCAGTACTGTCAGGGTGGTATCCCAA
+GGA
+>HWI-M00234:263:000000000-ADM55:1:1101:17179:3527 1:N:0:ATCACG
+GTGCTTATTTCACTTCCTCAAAATCAGCATCCTGCACATTATCGCCATGCTTT
+>HWI-M00234:263:000000000-ADM55:1:1101:21254:3571 1:N:0:ATCACG
+GTCGCGGGGAAGATCAACTCCTGCAATTCGAGCCATACCAATTACCTCCTAGCGCCCTGA
+CGCTGTTTATGACGAGGATCGCGGCTGCAGATGACGCGAATGACGCCATTGCGCTTGATC
+ACTCGGCAATACTCACAAATGGGTTTAACAGATTATCTAACCTTCATAGTTTGCACACTC
+CTCATGGACATTCC
+>HWI-M00234:263:000000000-ADM55:1:1101:16569:3709 1:N:0:ATCACG
+CCCGTCAATTCCTTTGAGTTTCATTCTTGCGAACGTACTCCCCAGGTGGAATACTTATTG
+CGTTTGCTGCGGCACCGAATGGCTTTGCCACCCGACACCTAGTATTCATCGTTTACGGCG
+TGGACTACCAGGGTATCTAATCCTGTTTGCTCCCCACGCTTTCGAGCCTCAACGTCAGGA
+TCGGAAGAGCACACGTCTGAACTCCAGTCACATCCCG
+>HWI-M00234:263:000000000-ADM55:1:1101:22403:3828 1:N:0:ATCACG
+CCCGGACATCTTCGGCGCAGGATCTCTTGACTAGTGAGCTATTACGCACTCTTTAAATGA
+GTGGCTGCTTCTAAGCCAACATCCTAGTTGTCTTAGAAATCCCACATCCTTTTCCACTTA
+ACTTACACTTTGGGACCTTAGCTGATGAGATCGGAAGAGCACACGTCTGAACTCCAGTCA
+CATCACGATCTCGTATGCCGTCTTCTGCTTGAAAAAAAAAAAAATATCAATCAAACACAC
+ACACACCAGCTTAC
+>HWI-M00234:263:000000000-ADM55:1:1101:7508:4067 1:N:0:ATCACG
+GGTGCACTAGGATCGTAGTTGGCTACTTTCCCGTTTTCAATGTATACGCAAGGTACACGG
+TCAGCGGTAGCTGCCATAATGTAATGGTAGTCAAATCCTAAGTCTCCCAATGCACATGGC
+AGTGGAGCGTTCCAATCTTGTGTACCGGCTTTGTCTCCTAATCCCAAGTGCCATTTTCCG
+ATAGCTCCGGTAGCATAACCGGTACTTTTGAACATAACCGCCATGGTATATTGTTCGGGA
+CGGATAATCATTCCGGCATTTCCGGCAGCTACG
+>HWI-M00234:263:000000000-ADM55:1:1101:26232:4161 1:N:0:ATCACG
+CTCTTCTTAAGCTCGAACAGCTTCTTCAGTCTTACCTGCCATTTCATCTAAAATTTTTAA
+AGCTCGCTCTAAAACAGTAGTATCATCAATCATAACCAATCCACCATCTGGTCCAGGTTC
+CAAGTGAATCCCAACACTTTTCCCCTCCTTAAAATTGTGTCCACCGAAAAAATTTCTTAC
+AGTGTCAACATTCAGTCCAAGTTCATCGGCTATTCTATGCATACTACCACTAGGCAATGA
+GT
+>HWI-M00234:263:000000000-ADM55:1:1101:23151:4189 1:N:0:ATCACG
+GCGGATTTTCTCGGGAGTATGATTACCCACACTATTGGATTCTTCCGAAGAAGACTCCAT
+ACTACCAAGTTCAGCTCGGATGGTGGATTTGCCTGCCAAGATCAGAAGAGCACACGTCTG
+AACTCCAGTCACATCACGACTTCGTATGCCGTATTCTGCTTGAAAAAAACAATGAAAACT
+AGTCACCGATGACTCACGTTCGCTGAACATTATCTGACAACTAGCTTAACAATGGACATG
+CTTAGCACTGACAACCAGACG
+>HWI-M00234:263:000000000-ADM55:1:1101:17148:4803 1:N:0:ATCACG
+CCCTTTTCGGCAATGGCGATGTTACGGTACATAAGAGCGATTTCGGGGAAACCTTCTTCG
+TCTGCAATATCAGCAAACTTAGGATAATCCAATGA
+>HWI-M00234:263:000000000-ADM55:1:1101:8939:4808 1:N:0:ATCACG
+CCACAGTTCTGTCATATCGCAGTACAGGAATCTCAACCTGTTGTCCATCGGCTACGGCTC
+TCGCCCTCGCCTTAGGCCCCGACTTACCCAGGGCAGATCAGCTTTA
+>HWI-M00234:263:000000000-ADM55:1:1101:11727:5103 1:N:0:ATCACG
+CTCCCGTATAGGATGGATCGAAAGCAATCGTCAGGAATCCACGTTCTGCCAATGTCTGCG
+CATACAAGCCCGAAGCTTGTTCCTTCACGGCACCAAATGGGCCACTGATGGCAATGGCAG
+GCAATTTACCCGTCACATTCTTGGGTACATACAAATCGGCGGCAAGTGTAATGCCGTAAC
+GGTTGTGGAAAG
+>HWI-M00234:263:000000000-ADM55:1:1101:15029:5173 1:N:0:ATCACG
+GGCCTATTCTCTGCGGCCGCCTTTCGGCGGCACCCCTTCTCCCGAAGTTACGGGGTCATT
+TTGCCGAGTTCCTTAACAATGCTTCTTCCGTCGGCCTTAGGATTCTCTCCTCATCCACCT
+GTGTCGGTTTACGGTACGGGTACAATATAAACAATAGCGGCTTTTCTTGACGGCCGGCTC
+ATGGGCTTCCCTACTTTAGT
+>HWI-M00234:263:000000000-ADM55:1:1101:7330:5248 1:N:0:ATCACG
+TGTGTATGAATGAGCGGCTACAGGCTTAGTCGATTTCTTTACTGCGCAGAAGCGGGACTG
+TGACCGACAAAACAGCCGTCGCCTCTCTACGTTCCGGGACCATACGCCGCTCGCAGTGAT
+TGACCCTTACAACCTTGCGGGCGCTCTC
+>HWI-M00234:263:000000000-ADM55:1:1101:18630:5353 1:N:0:ATCACG
+GGCGTGTTCTGCCAAAATAGTGCTGGGCAATATACGACATAGAAGCGAAAGGCAATACTT
+TTTCTAAGGCCTGCCTGATTTCTACTGTTTTCACAATGGCTTGGGCTTCATTGATTGATT
+GCCTGGCACCATCTTGGAATGCTTGCGCAAACGCTTTTTTATCCTCCGGTGAAAGCGTCT
+GCAGAAAAGCCCTGAAACGTTTTTTATGGTCGGCCACTTCCTCAGGAGTATTG
+>HWI-M00234:263:000000000-ADM55:1:1101:11799:5476 1:N:0:ATCACG
+CCTAAATTTTCGAGTATAAGCAGGACCGAAGCCACCAACTTATACCTTATCCTCTAAATT
+TTCGTAAGAGACATGAAGCGGATCTCTAACTATTCCCGATTTTACTGCACCACTTGATCA
+AACGCTTCGGAACAAGAGCTTTTGAGTGATGTCTCGTTTCCACCACTTTGGCAGAAATAA
+AGCTAATCTACTATGATTCGATTAAGCAGCAAGAGCATAATTTTCGTTGCCAGATAAAAT
+TT
+>HWI-M00234:263:000000000-ADM55:1:1101:11348:5668 1:N:0:ATCACG
+GCCTAAATTTTCGTGCAGCGGCAGAACCAAAGCCATCAACCGTTGCCTTATCCTCTAAAT
+TTTCACCCGCGCCACGAGGCTGACACGAACTATCCCCGATTTGACTGCACCACTTTATCG
+GAATGCTTCGGAGCAACAGCTTCCGAGTGATGTCACGTCCCAGCACCTGGTGCCGGGATT
+AAGCTTCAATCTACTATACTTCGATTAAGCAGCGAGAGCGTAACGAGTTTCGCCAGATAA
+AATTTTGAGGACTGAGATTAAAGTGAAAATC
+>HWI-M00234:263:000000000-ADM55:1:1101:25874:5826 1:N:0:ATCACG
+CCTGCAGTGGATAGGGACCGAACTGTCTCACGACGTTCTGAACCCAGCTCACGTACCTCT
+TTAATGGGCGAACAGCCCAACCCTTGGGACCTTCTCCAGCCCCAGGATGAGATGAGCCGA
+CATCGAGGTGCCAAACTTTCCCGCCGATATGGACGCCCGGGCAAAATCAGCTTGTTATCC
+CCAGGGTAGCTTTTATCCGTTGAGCGACGACCCTTCCATTCGGAATCGCCGGAATACTAT
+GCCCTGCTTTCGCACCTGCCCAACCAGTCCGCCCAGCAGTTAAG
+>HWI-M00234:263:000000000-ADM55:1:1101:26932:5861 1:N:0:ATCACG
+AGCGTCAGTTACAGTCCAGAAAGCCGCCTTCGCCACTGGTGTTCTTCCTAATCTCTACGC
+ATTTCACCGCTACACTAGGAATTCCGCTTTCCTCTCCTGCACTCTAGATATCCAGTTTGG
+AATGCAGCCCCCAGGTTAAGCCCGGGGATTTCACATCCCACTTAAACATCCGCCTACGCA
+CCCTTTACCACCAGTAAATCCGGACAACGCTCGCCACCTACGTATTACCGCGGCTGCTGG
+CACGTAGTTAGCCGTGGCTTCCTCCTCTGGTACCTTCATTATCGTCCCCGAAACC
+>HWI-M00234:263:000000000-ADM55:1:1101:14154:5990 1:N:0:ATCACG
+GTGGGATGTCAAGGTAAGCGGCGGCAGCCTTGGCTACAGCAAGAGATACGCCGAGGATGG
+CATTGGCACCCAGATTGGCTTTCGTTTTGGTTCCGTCCAGTGCAAGCATGGCATGGTCGA
+TACCCATCTGGTCGAGGGCGGACATACCGATGAGCTTGGGAGCAATGATATTATTGATAT
+TGTCCACGGCTTTCAGGAC
+>HWI-M00234:263:000000000-ADM55:1:1101:25022:6229 1:N:0:ATCACG
+CCCGAGAACGTATTCACCGCAACATTGCTGATTTGCGATTACTAGTGATTCCAACTTCAT
+GTACTCGAGTTGCAGAGTACAATCCGAACTACGAACAGCTTTCTGAGGTTTGCTCCTCCT
+CGCAGATTTGCTGATCGGAAGAGCACACGTCTGAACTCCAGTCACATC
+>HWI-M00234:263:000000000-ADM55:1:1101:21023:6286 1:N:0:ATCACG
+GTGTACAAGGCCCGGGAACGTATTCACCGCGCCGTGGCTGATGCGCGATTACTAGCGAAT
+CCAGCTTCATGGAGTCGGGTTGCAGACTCCAATCCGAACTGAGAGAGGCTTTAGGGATTA
+GCATCACGTCGCCGTGTAGCTGCCTTCTGTACCCCCCATTGTAACACGTGTGTAGCCCCG
+GACGTAAGGGCCGTGCTGATTTGCCGTCATCCCCACCTTCCTCAC
+>HWI-M00234:263:000000000-ADM55:1:1101:8138:6336 1:N:0:ATCACG
+TGTGTACAAGGCCCGGGAACGTATTCACCGCGACATTCTGATTCGCGATTACTAGCAACT
+CCAGCTTCATGTAGGCGAGTTGCAGCCTACAATCCGAACTGAGATAGGTTTTATAAGTTT
+TGCTCCACCTCACGGTCTT
+>HWI-M00234:263:000000000-ADM55:1:1101:11055:6543 1:N:0:ATCACG
+CCTGGACATTTTCGGCGCAGGACCTCCCGACCAGTGAGCTATTACGCACTCTTTGACTGT
+GTGGCTGCTTCTGAGCCAACATCCTGGTTGACTTTGAAATCTCACATACTTTTCCACTTA
+ACACGCACTTTGGGACCTTAGCTGGAGGTCTTGGCTCTTTCCTTTTTGCCTATCCAACTT
+ATCTCGTATAGTCTGACTCCCGG
+>HWI-M00234:263:000000000-ADM55:1:1101:24980:6575 1:N:0:ATCACG
+GCCATTTATCTACGCCTGTTGTCACCAACAGGCTCTAGCGGTCTACCCTCCGACGTGGGG
+CGAGCAACCCTCATA
+>HWI-M00234:263:000000000-ADM55:1:1101:7596:6682 1:N:0:ATCACG
+GCCCCCGTCAATTCCTTTGAGTTTCACCGTTGCCGGCGTACTCCCCAGGTGGAATACTTA
+ACGCTTTCGCTTGGCGGCTGACAATGTATCGCCAACCGCGAGTATTCATCAGATCGGAAG
+AGCACACGTCTGAACTCCAGTCACATCCCGATCTCGTATGCCGTCCTCGGCTTGAAAAAA
+AAAAATATAAACCATGATGAATTTCGAACACTCACGACCACACACTAAGCGTCGACGTA
+>HWI-M00234:263:000000000-ADM55:1:1101:24419:6736 1:N:0:ATCACG
+CGGGCGTTGGCAAGTACGTTATATCACTTACCCACGCTCGATTCAGAACCCCAGGAGTAA
+ATGCTCGTTTTAAGAGGTTGGGATACACAGGCATGGTGTGATTACTGTCGGTGGTTTTTA
+CGGTTCGCTTAAAAAAGCGGTAACCAATGATGCCATTAAAGCGAAGGATAGCGCGTAAAC
+GTTTGACACCAACTTTCACTCCACGGTGTTGCATCAAAGC
+>HWI-M00234:263:000000000-ADM55:1:1101:5068:6755 1:N:0:ATCACG
+GCAGCGGCAGAACCAAAGCCATCAACCGTTGCCTTATCCTCTAAATTTTCACCCGCGCCA
+CGAGGCTGACACGAACTATCCCCGATTTGACTGCACCACTTTATCGGAATGCTTCGGAGC
+AACAGCTTCCGAGTGATGTCACGTCCCAGCACCTGGTGCCGGGATTAAGCTTCAATCTAC
+TATACTTCGATTAAGCAGCGAGAGCGTAACGAGTTTCGCCAGATAAAATTTTGAGGACTG
+AGATTAAAGTGCAAATC
+>HWI-M00234:263:000000000-ADM55:1:1101:21477:6796 1:N:0:ATCACG
+CCCCACTGCTGCTTCCCGTAGGAGTTTGGACCGTGTCTCAGTTCCAATGTGGGGGACCTT
+CCTCTCAGAACCCCTATCCATCGTTGACTAGGTGGGCCGTTACCCCGCCTACTATCTAAT
+GGAACGCATCCCCATCGTCTACCGGAAAATACCTT
+>HWI-M00234:263:000000000-ADM55:1:1101:12483:6880 1:N:0:ATCACG
+CTCCTTGTCTGCCTTCGATTACGGCATTTGCAATCGTTCCTGTAAGTAGTTTTACAGCTC
+TAATGGCATCGTCATTCCCTGGTATTACGTAGTCTATTTCATCAGGATCACAGTTAGTAT
+CAACTATTGCTACAACTGGTATTCCTAATATCTTCGCTTCATTTACTGCAATTCTTTCTT
+TTCTTGGATCTACAACAAATAATACATCAGGAAGACCACCCATATCTTGAATGCCACCTA
+AAAACTTTTCAA
+>HWI-M00234:263:000000000-ADM55:1:1101:27958:6935 1:N:0:ATCACG
+CCATTCGGAAATCCGCGGATCAAAGGTCATTTGCACCTACCCGCAGCTTATCGCAGCTTA
+TCACGTCCTTCATCGCCTCCGAGAGCCAAGAGATCGGAAGAGCACACGTCTGAACTCCAG
+TCACATCACGATCTCGTATGCCGTCTTCTGCTTGAAAAAAAAAACCCACAAATTCACACT
+ACACACCCACCTCCCATCACGCATCTCTTTTGTCCGAGTCACGCTGCACGCTACCTGCAC
+ACTACCTGCCTCAGTTACATCTTTTTACTCAATGTCCCACCATTTATCAC
+>HWI-M00234:263:000000000-ADM55:1:1101:6151:7404 1:N:0:ATCACG
+GCACGTAGTTAGCCGGGGCTTCCTCCTAAGGTACCGTCATTATCGTCCCTTAGGACAGAG
+CTTTACGATCCGAAAACCTTCATCGCTCACGCGGCGTCGCTGCATCAGAGTTCCCTCCAT
+TGTGCAATATTCCCCACTGCTGCCTCCCGTAGGAGTCTGGACCGTGTCTCAGTTCCAGTG
+TGGCCGTTCACCCTCCCAGGCCGGCTACCCATCGTCGCCTTGGTTAGCTATTACCTCCCC
+AACTAGCTAATGGGACGCGAGTCCAGCTTATACCACTTAACCGCTTTTGCTTGAAAATCA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/information_lenght_fasta_output.txt	Tue Apr 26 08:17:42 2016 -0400
@@ -0,0 +1,37 @@
+length
+86
+141
+300
+300
+116
+63
+53
+194
+217
+254
+273
+242
+261
+95
+106
+192
+200
+148
+233
+242
+271
+284
+295
+199
+168
+225
+139
+203
+75
+239
+220
+257
+155
+252
+290
+300
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/input_sequence_file.fasta	Tue Apr 26 08:17:42 2016 -0400
@@ -0,0 +1,174 @@
+>HWI-M00234:263:000000000-ADM55:1:1101:21704:2233 1:N:0:ATCACG
+GTGTACAAGGCCCGGGAACGTATTCACCGCGGCATGCTGATCCGCGATTACTAGCGATTC
+CAACTTCATACAGGCGGGTTTCAGCC
+>HWI-M00234:263:000000000-ADM55:1:1101:21334:2699 1:N:0:ATCACG
+CTTTTGACGGCCTTTTTGTTGTCTTCTGAATTTTGTTTTTTTCGGTTGTAACATAATTCC
+TAAAAATCAAATTCGTTAGCGATTATTTTTCTTTCTTTTGAAGTTCTTTCCGCCATTGTT
+TCCGCTATTGCTTCCACGACC
+>HWI-M00234:263:000000000-ADM55:1:1101:13968:2885 1:N:0:ATCACG
+CCCACTGCTGCCTCCCGTAGGAGCCTGGACCGTGTCTCAGTTCCAATGTGGCCGATCACC
+CTCTCAGGTCGGCTACCCATCGTTGCCCTGGTAAGCCATTACCCTACCAACTAGCTAATG
+GGACGCGGGCACATCTCAAAGCGGATTACCCCTTTGGTTAAAGTTTAATGCGAAACTCTA
+ACTTTATGCGTTATTAACCCTCCTTTCGGAGGGCTATTCCCCTCTTTGATGCAGGTTGCC
+CACGTGTTACTCACCCGTCCGCCGCTAATCCACTTCCCGAAGGCAGATTCAACCCTCGAT
+>HWI-M00234:263:000000000-ADM55:1:1101:11873:2948 1:N:0:ATCACG
+CCCCGTTACATCTTCCGCGCAGGAAGACTCGATCAGTGAGCTATTACGCTTTCTTTGAAG
+GATGGCTGCTTCTAAGCCAACTTCCTGACTGTCTTAGCCTTCCCACTTCGTTTTCCACTT
+AGTCAATATTAGGGACCTTAGCCGGCGGTCTGGGTTGTTTCCCTCTTGAGTCCGGACGTT
+AGCACCCGGTGCTCTGTCCCCCGTGCCCAAACTTCCAAGTATTCGGAGTTTGCCATGGTT
+TGGTAAGACGCTATGTCCCCCTAACCATAACAGTGTTCTACCCTCTGAACACATACTCGA
+>HWI-M00234:263:000000000-ADM55:1:1101:7855:3066 1:N:0:ATCACG
+CGTCAATCTTCCAACGCCCACGGCAGATAGGGACAAAACTGTCTCACGACGTTTTAAACC
+CAGCTCACGTACCTCTTTAAATGGCGAACAGCCATACCCTTGGGACCGGCTACAGC
+>HWI-M00234:263:000000000-ADM55:1:1101:24817:3238 1:N:0:ATCACG
+CCCGTGACCAGATTCATGGCCGCCGGTTAGAACCCCAGTACTGTCAGGGTGGTATCCCAA
+GGA
+>HWI-M00234:263:000000000-ADM55:1:1101:17179:3527 1:N:0:ATCACG
+GTGCTTATTTCACTTCCTCAAAATCAGCATCCTGCACATTATCGCCATGCTTT
+>HWI-M00234:263:000000000-ADM55:1:1101:21254:3571 1:N:0:ATCACG
+GTCGCGGGGAAGATCAACTCCTGCAATTCGAGCCATACCAATTACCTCCTAGCGCCCTGA
+CGCTGTTTATGACGAGGATCGCGGCTGCAGATGACGCGAATGACGCCATTGCGCTTGATC
+ACTCGGCAATACTCACAAATGGGTTTAACAGATTATCTAACCTTCATAGTTTGCACACTC
+CTCATGGACATTCC
+>HWI-M00234:263:000000000-ADM55:1:1101:16569:3709 1:N:0:ATCACG
+CCCGTCAATTCCTTTGAGTTTCATTCTTGCGAACGTACTCCCCAGGTGGAATACTTATTG
+CGTTTGCTGCGGCACCGAATGGCTTTGCCACCCGACACCTAGTATTCATCGTTTACGGCG
+TGGACTACCAGGGTATCTAATCCTGTTTGCTCCCCACGCTTTCGAGCCTCAACGTCAGGA
+TCGGAAGAGCACACGTCTGAACTCCAGTCACATCCCG
+>HWI-M00234:263:000000000-ADM55:1:1101:22403:3828 1:N:0:ATCACG
+CCCGGACATCTTCGGCGCAGGATCTCTTGACTAGTGAGCTATTACGCACTCTTTAAATGA
+GTGGCTGCTTCTAAGCCAACATCCTAGTTGTCTTAGAAATCCCACATCCTTTTCCACTTA
+ACTTACACTTTGGGACCTTAGCTGATGAGATCGGAAGAGCACACGTCTGAACTCCAGTCA
+CATCACGATCTCGTATGCCGTCTTCTGCTTGAAAAAAAAAAAAATATCAATCAAACACAC
+ACACACCAGCTTAC
+>HWI-M00234:263:000000000-ADM55:1:1101:7508:4067 1:N:0:ATCACG
+GGTGCACTAGGATCGTAGTTGGCTACTTTCCCGTTTTCAATGTATACGCAAGGTACACGG
+TCAGCGGTAGCTGCCATAATGTAATGGTAGTCAAATCCTAAGTCTCCCAATGCACATGGC
+AGTGGAGCGTTCCAATCTTGTGTACCGGCTTTGTCTCCTAATCCCAAGTGCCATTTTCCG
+ATAGCTCCGGTAGCATAACCGGTACTTTTGAACATAACCGCCATGGTATATTGTTCGGGA
+CGGATAATCATTCCGGCATTTCCGGCAGCTACG
+>HWI-M00234:263:000000000-ADM55:1:1101:26232:4161 1:N:0:ATCACG
+CTCTTCTTAAGCTCGAACAGCTTCTTCAGTCTTACCTGCCATTTCATCTAAAATTTTTAA
+AGCTCGCTCTAAAACAGTAGTATCATCAATCATAACCAATCCACCATCTGGTCCAGGTTC
+CAAGTGAATCCCAACACTTTTCCCCTCCTTAAAATTGTGTCCACCGAAAAAATTTCTTAC
+AGTGTCAACATTCAGTCCAAGTTCATCGGCTATTCTATGCATACTACCACTAGGCAATGA
+GT
+>HWI-M00234:263:000000000-ADM55:1:1101:23151:4189 1:N:0:ATCACG
+GCGGATTTTCTCGGGAGTATGATTACCCACACTATTGGATTCTTCCGAAGAAGACTCCAT
+ACTACCAAGTTCAGCTCGGATGGTGGATTTGCCTGCCAAGATCAGAAGAGCACACGTCTG
+AACTCCAGTCACATCACGACTTCGTATGCCGTATTCTGCTTGAAAAAAACAATGAAAACT
+AGTCACCGATGACTCACGTTCGCTGAACATTATCTGACAACTAGCTTAACAATGGACATG
+CTTAGCACTGACAACCAGACG
+>HWI-M00234:263:000000000-ADM55:1:1101:17148:4803 1:N:0:ATCACG
+CCCTTTTCGGCAATGGCGATGTTACGGTACATAAGAGCGATTTCGGGGAAACCTTCTTCG
+TCTGCAATATCAGCAAACTTAGGATAATCCAATGA
+>HWI-M00234:263:000000000-ADM55:1:1101:8939:4808 1:N:0:ATCACG
+CCACAGTTCTGTCATATCGCAGTACAGGAATCTCAACCTGTTGTCCATCGGCTACGGCTC
+TCGCCCTCGCCTTAGGCCCCGACTTACCCAGGGCAGATCAGCTTTA
+>HWI-M00234:263:000000000-ADM55:1:1101:11727:5103 1:N:0:ATCACG
+CTCCCGTATAGGATGGATCGAAAGCAATCGTCAGGAATCCACGTTCTGCCAATGTCTGCG
+CATACAAGCCCGAAGCTTGTTCCTTCACGGCACCAAATGGGCCACTGATGGCAATGGCAG
+GCAATTTACCCGTCACATTCTTGGGTACATACAAATCGGCGGCAAGTGTAATGCCGTAAC
+GGTTGTGGAAAG
+>HWI-M00234:263:000000000-ADM55:1:1101:15029:5173 1:N:0:ATCACG
+GGCCTATTCTCTGCGGCCGCCTTTCGGCGGCACCCCTTCTCCCGAAGTTACGGGGTCATT
+TTGCCGAGTTCCTTAACAATGCTTCTTCCGTCGGCCTTAGGATTCTCTCCTCATCCACCT
+GTGTCGGTTTACGGTACGGGTACAATATAAACAATAGCGGCTTTTCTTGACGGCCGGCTC
+ATGGGCTTCCCTACTTTAGT
+>HWI-M00234:263:000000000-ADM55:1:1101:7330:5248 1:N:0:ATCACG
+TGTGTATGAATGAGCGGCTACAGGCTTAGTCGATTTCTTTACTGCGCAGAAGCGGGACTG
+TGACCGACAAAACAGCCGTCGCCTCTCTACGTTCCGGGACCATACGCCGCTCGCAGTGAT
+TGACCCTTACAACCTTGCGGGCGCTCTC
+>HWI-M00234:263:000000000-ADM55:1:1101:18630:5353 1:N:0:ATCACG
+GGCGTGTTCTGCCAAAATAGTGCTGGGCAATATACGACATAGAAGCGAAAGGCAATACTT
+TTTCTAAGGCCTGCCTGATTTCTACTGTTTTCACAATGGCTTGGGCTTCATTGATTGATT
+GCCTGGCACCATCTTGGAATGCTTGCGCAAACGCTTTTTTATCCTCCGGTGAAAGCGTCT
+GCAGAAAAGCCCTGAAACGTTTTTTATGGTCGGCCACTTCCTCAGGAGTATTG
+>HWI-M00234:263:000000000-ADM55:1:1101:11799:5476 1:N:0:ATCACG
+CCTAAATTTTCGAGTATAAGCAGGACCGAAGCCACCAACTTATACCTTATCCTCTAAATT
+TTCGTAAGAGACATGAAGCGGATCTCTAACTATTCCCGATTTTACTGCACCACTTGATCA
+AACGCTTCGGAACAAGAGCTTTTGAGTGATGTCTCGTTTCCACCACTTTGGCAGAAATAA
+AGCTAATCTACTATGATTCGATTAAGCAGCAAGAGCATAATTTTCGTTGCCAGATAAAAT
+TT
+>HWI-M00234:263:000000000-ADM55:1:1101:11348:5668 1:N:0:ATCACG
+GCCTAAATTTTCGTGCAGCGGCAGAACCAAAGCCATCAACCGTTGCCTTATCCTCTAAAT
+TTTCACCCGCGCCACGAGGCTGACACGAACTATCCCCGATTTGACTGCACCACTTTATCG
+GAATGCTTCGGAGCAACAGCTTCCGAGTGATGTCACGTCCCAGCACCTGGTGCCGGGATT
+AAGCTTCAATCTACTATACTTCGATTAAGCAGCGAGAGCGTAACGAGTTTCGCCAGATAA
+AATTTTGAGGACTGAGATTAAAGTGAAAATC
+>HWI-M00234:263:000000000-ADM55:1:1101:25874:5826 1:N:0:ATCACG
+CCTGCAGTGGATAGGGACCGAACTGTCTCACGACGTTCTGAACCCAGCTCACGTACCTCT
+TTAATGGGCGAACAGCCCAACCCTTGGGACCTTCTCCAGCCCCAGGATGAGATGAGCCGA
+CATCGAGGTGCCAAACTTTCCCGCCGATATGGACGCCCGGGCAAAATCAGCTTGTTATCC
+CCAGGGTAGCTTTTATCCGTTGAGCGACGACCCTTCCATTCGGAATCGCCGGAATACTAT
+GCCCTGCTTTCGCACCTGCCCAACCAGTCCGCCCAGCAGTTAAG
+>HWI-M00234:263:000000000-ADM55:1:1101:26932:5861 1:N:0:ATCACG
+AGCGTCAGTTACAGTCCAGAAAGCCGCCTTCGCCACTGGTGTTCTTCCTAATCTCTACGC
+ATTTCACCGCTACACTAGGAATTCCGCTTTCCTCTCCTGCACTCTAGATATCCAGTTTGG
+AATGCAGCCCCCAGGTTAAGCCCGGGGATTTCACATCCCACTTAAACATCCGCCTACGCA
+CCCTTTACCACCAGTAAATCCGGACAACGCTCGCCACCTACGTATTACCGCGGCTGCTGG
+CACGTAGTTAGCCGTGGCTTCCTCCTCTGGTACCTTCATTATCGTCCCCGAAACC
+>HWI-M00234:263:000000000-ADM55:1:1101:14154:5990 1:N:0:ATCACG
+GTGGGATGTCAAGGTAAGCGGCGGCAGCCTTGGCTACAGCAAGAGATACGCCGAGGATGG
+CATTGGCACCCAGATTGGCTTTCGTTTTGGTTCCGTCCAGTGCAAGCATGGCATGGTCGA
+TACCCATCTGGTCGAGGGCGGACATACCGATGAGCTTGGGAGCAATGATATTATTGATAT
+TGTCCACGGCTTTCAGGAC
+>HWI-M00234:263:000000000-ADM55:1:1101:25022:6229 1:N:0:ATCACG
+CCCGAGAACGTATTCACCGCAACATTGCTGATTTGCGATTACTAGTGATTCCAACTTCAT
+GTACTCGAGTTGCAGAGTACAATCCGAACTACGAACAGCTTTCTGAGGTTTGCTCCTCCT
+CGCAGATTTGCTGATCGGAAGAGCACACGTCTGAACTCCAGTCACATC
+>HWI-M00234:263:000000000-ADM55:1:1101:21023:6286 1:N:0:ATCACG
+GTGTACAAGGCCCGGGAACGTATTCACCGCGCCGTGGCTGATGCGCGATTACTAGCGAAT
+CCAGCTTCATGGAGTCGGGTTGCAGACTCCAATCCGAACTGAGAGAGGCTTTAGGGATTA
+GCATCACGTCGCCGTGTAGCTGCCTTCTGTACCCCCCATTGTAACACGTGTGTAGCCCCG
+GACGTAAGGGCCGTGCTGATTTGCCGTCATCCCCACCTTCCTCAC
+>HWI-M00234:263:000000000-ADM55:1:1101:8138:6336 1:N:0:ATCACG
+TGTGTACAAGGCCCGGGAACGTATTCACCGCGACATTCTGATTCGCGATTACTAGCAACT
+CCAGCTTCATGTAGGCGAGTTGCAGCCTACAATCCGAACTGAGATAGGTTTTATAAGTTT
+TGCTCCACCTCACGGTCTT
+>HWI-M00234:263:000000000-ADM55:1:1101:11055:6543 1:N:0:ATCACG
+CCTGGACATTTTCGGCGCAGGACCTCCCGACCAGTGAGCTATTACGCACTCTTTGACTGT
+GTGGCTGCTTCTGAGCCAACATCCTGGTTGACTTTGAAATCTCACATACTTTTCCACTTA
+ACACGCACTTTGGGACCTTAGCTGGAGGTCTTGGCTCTTTCCTTTTTGCCTATCCAACTT
+ATCTCGTATAGTCTGACTCCCGG
+>HWI-M00234:263:000000000-ADM55:1:1101:24980:6575 1:N:0:ATCACG
+GCCATTTATCTACGCCTGTTGTCACCAACAGGCTCTAGCGGTCTACCCTCCGACGTGGGG
+CGAGCAACCCTCATA
+>HWI-M00234:263:000000000-ADM55:1:1101:7596:6682 1:N:0:ATCACG
+GCCCCCGTCAATTCCTTTGAGTTTCACCGTTGCCGGCGTACTCCCCAGGTGGAATACTTA
+ACGCTTTCGCTTGGCGGCTGACAATGTATCGCCAACCGCGAGTATTCATCAGATCGGAAG
+AGCACACGTCTGAACTCCAGTCACATCCCGATCTCGTATGCCGTCCTCGGCTTGAAAAAA
+AAAAATATAAACCATGATGAATTTCGAACACTCACGACCACACACTAAGCGTCGACGTA
+>HWI-M00234:263:000000000-ADM55:1:1101:24419:6736 1:N:0:ATCACG
+CGGGCGTTGGCAAGTACGTTATATCACTTACCCACGCTCGATTCAGAACCCCAGGAGTAA
+ATGCTCGTTTTAAGAGGTTGGGATACACAGGCATGGTGTGATTACTGTCGGTGGTTTTTA
+CGGTTCGCTTAAAAAAGCGGTAACCAATGATGCCATTAAAGCGAAGGATAGCGCGTAAAC
+GTTTGACACCAACTTTCACTCCACGGTGTTGCATCAAAGC
+>HWI-M00234:263:000000000-ADM55:1:1101:5068:6755 1:N:0:ATCACG
+GCAGCGGCAGAACCAAAGCCATCAACCGTTGCCTTATCCTCTAAATTTTCACCCGCGCCA
+CGAGGCTGACACGAACTATCCCCGATTTGACTGCACCACTTTATCGGAATGCTTCGGAGC
+AACAGCTTCCGAGTGATGTCACGTCCCAGCACCTGGTGCCGGGATTAAGCTTCAATCTAC
+TATACTTCGATTAAGCAGCGAGAGCGTAACGAGTTTCGCCAGATAAAATTTTGAGGACTG
+AGATTAAAGTGCAAATC
+>HWI-M00234:263:000000000-ADM55:1:1101:21477:6796 1:N:0:ATCACG
+CCCCACTGCTGCTTCCCGTAGGAGTTTGGACCGTGTCTCAGTTCCAATGTGGGGGACCTT
+CCTCTCAGAACCCCTATCCATCGTTGACTAGGTGGGCCGTTACCCCGCCTACTATCTAAT
+GGAACGCATCCCCATCGTCTACCGGAAAATACCTT
+>HWI-M00234:263:000000000-ADM55:1:1101:12483:6880 1:N:0:ATCACG
+CTCCTTGTCTGCCTTCGATTACGGCATTTGCAATCGTTCCTGTAAGTAGTTTTACAGCTC
+TAATGGCATCGTCATTCCCTGGTATTACGTAGTCTATTTCATCAGGATCACAGTTAGTAT
+CAACTATTGCTACAACTGGTATTCCTAATATCTTCGCTTCATTTACTGCAATTCTTTCTT
+TTCTTGGATCTACAACAAATAATACATCAGGAAGACCACCCATATCTTGAATGCCACCTA
+AAAACTTTTCAA
+>HWI-M00234:263:000000000-ADM55:1:1101:27958:6935 1:N:0:ATCACG
+CCATTCGGAAATCCGCGGATCAAAGGTCATTTGCACCTACCCGCAGCTTATCGCAGCTTA
+TCACGTCCTTCATCGCCTCCGAGAGCCAAGAGATCGGAAGAGCACACGTCTGAACTCCAG
+TCACATCACGATCTCGTATGCCGTCTTCTGCTTGAAAAAAAAAACCCACAAATTCACACT
+ACACACCCACCTCCCATCACGCATCTCTTTTGTCCGAGTCACGCTGCACGCTACCTGCAC
+ACTACCTGCCTCAGTTACATCTTTTTACTCAATGTCCCACCATTTATCAC
+>HWI-M00234:263:000000000-ADM55:1:1101:6151:7404 1:N:0:ATCACG
+GCACGTAGTTAGCCGGGGCTTCCTCCTAAGGTACCGTCATTATCGTCCCTTAGGACAGAG
+CTTTACGATCCGAAAACCTTCATCGCTCACGCGGCGTCGCTGCATCAGAGTTCCCTCCAT
+TGTGCAATATTCCCCACTGCTGCCTCCCGTAGGAGTCTGGACCGTGTCTCAGTTCCAGTG
+TGGCCGTTCACCCTCCCAGGCCGGCTACCCATCGTCGCCTTGGTTAGCTATTACCTCCCC
+AACTAGCTAATGGGACGCGAGTCCAGCTTATACCACTTAACCGCTTTTGCTTGAAAATCA
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/input_sequence_file.fastq	Tue Apr 26 08:17:42 2016 -0400
@@ -0,0 +1,144 @@
+@HWI-M00234:263:000000000-ADM55:1:1101:21704:2233 1:N:0:ATCACG
+GTGTACAAGGCCCGGGAACGTATTCACCGCGGCATGCTGATCCGCGATTACTAGCGATTCCAACTTCATACAGGCGGGTTTCAGCC
++
+BCCCCGGED8DFGC::+@C@9@,,EGFAF@CC7@@@FGAF<@FGGEGD7:<6EDDECCFGGCFGGC<66,F<FFCGFC4BFF?5?<
+@HWI-M00234:263:000000000-ADM55:1:1101:21334:2699 1:N:0:ATCACG
+CTTTTGACGGCCTTTTTGTTGTCTTCTGAATTTTGTTTTTTTCGGTTGTAACATAATTCCTAAAAATCAAATTCGTTAGCGATTATTTTTCTTTCTTTTGAAGTTCTTTCCGCCATTGTTTCCGCTATTGCTTCCACGACC
++
+CCCCCGFGGGGGGGGGGGGGGGGGGGGGGGFGGGGGGGGGGGGG@FGGGGGGGGEADGGGGGGGGGGGGGFGGGGFF@CFFEGGDGGGGGFGGGGGGGGFGFCFGGGGGFGCE=FGFDGFGGCEEGGGGDFGGGFGGGGGC
+@HWI-M00234:263:000000000-ADM55:1:1101:13968:2885 1:N:0:ATCACG
+CCCACTGCTGCCTCCCGTAGGAGCCTGGACCGTGTCTCAGTTCCAATGTGGCCGATCACCCTCTCAGGTCGGCTACCCATCGTTGCCCTGGTAAGCCATTACCCTACCAACTAGCTAATGGGACGCGGGCACATCTCAAAGCGGATTACCCCTTTGGTTAAAGTTTAATGCGAAACTCTAACTTTATGCGTTATTAACCCTCCTTTCGGAGGGCTATTCCCCTCTTTGATGCAGGTTGCCCACGTGTTACTCACCCGTCCGCCGCTAATCCACTTCCCGAAGGCAGATTCAACCCTCGAT
++
+<CC8CEFDGGFDF<,6@F7FCGF,:FFCED@@@,;;,<CFFFA,6C@FC@,<E+87FFCFCGFF8,<<FG7+@F7FEFFGGGCFECF,=<B=EF99F@9<FAFFGDF?=E:=4:,9,,CF9A4,>8>C+>3BFGD;@,7>,==>6?=9,,@+@4<=699C9,@+@<+72;@5;0*9:?82BF85=@2=C###############################################################################################################
+@HWI-M00234:263:000000000-ADM55:1:1101:11873:2948 1:N:0:ATCACG
+CCCCGTTACATCTTCCGCGCAGGAAGACTCGATCAGTGAGCTATTACGCTTTCTTTGAAGGATGGCTGCTTCTAAGCCAACTTCCTGACTGTCTTAGCCTTCCCACTTCGTTTTCCACTTAGTCAATATTAGGGACCTTAGCCGGCGGTCTGGGTTGTTTCCCTCTTGAGTCCGGACGTTAGCACCCGGTGCTCTGTCCCCCGTGCCCAAACTTCCAAGTATTCGGAGTTTGCCATGGTTTGGTAAGACGCTATGTCCCCCTAACCATAACAGTGTTCTACCCTCTGAACACATACTCGA
++
+CCCCCCD;B6C,;<EAFECF@FGGGGAECEG@F@FGGGFAAF9FGGCF>F7<FCFF<6FEFFFCDCFGGGEC<F,<A<EFC@F9BFGE<9DFFGEEGG@FFGFFGF8FDEFC<F,94:EF9,C=EGGGCCFCCE>B+>E9FCGG6+@CC>EFC8D>CEF,E=@=E?C,6=AFG>>9?DCGC>FG>GGCDA5*;+=AFF*A;/?B)-)(;64:)>3<E<3))7<E3=;>FDF?E<<4)3;EF@FFA#######################################################
+@HWI-M00234:263:000000000-ADM55:1:1101:7855:3066 1:N:0:ATCACG
+CGTCAATCTTCCAACGCCCACGGCAGATAGGGACAAAACTGTCTCACGACGTTTTAAACCCAGCTCACGTACCTCTTTAAATGGCGAACAGCCATACCCTTGGGACCGGCTACAGC
++
+CCCCCGGGGGGGGFGGGCBCFGGGGGFGGGGGGGGGGGGGGGG,CEGGGGGGGGGGGGGG@F@FGGGGGGGG@@EGFGGGFGFGCGEGGGGGGGGGGCFGGGGEGEEE7FFGFFGD
+@HWI-M00234:263:000000000-ADM55:1:1101:24817:3238 1:N:0:ATCACG
+CCCGTGACCAGATTCATGGCCGCCGGTTAGAACCCCAGTACTGTCAGGGTGGTATCCCAAGGA
++
+CCCCC7FGFGEGGGGGGDFGGGGGGDGGGGGGGGGGGGGGGGGGGGGFEECGGGGGGFFGGGG
+@HWI-M00234:263:000000000-ADM55:1:1101:17179:3527 1:N:0:ATCACG
+GTGCTTATTTCACTTCCTCAAAATCAGCATCCTGCACATTATCGCCATGCTTT
++
+CCCCCG<FCCGGFGGFGGGGGGGGFGGGGGGDEG?<ECGCFEG<EGGGF,CFG
+@HWI-M00234:263:000000000-ADM55:1:1101:21254:3571 1:N:0:ATCACG
+GTCGCGGGGAAGATCAACTCCTGCAATTCGAGCCATACCAATTACCTCCTAGCGCCCTGACGCTGTTTATGACGAGGATCGCGGCTGCAGATGACGCGAATGACGCCATTGCGCTTGATCACTCGGCAATACTCACAAATGGGTTTAACAGATTATCTAACCTTCATAGTTTGCACACTCCTCATGGACATTCC
++
+CCCCCFEFGGGGGGGGGGGGGGGGGGGGGGGGGGGG<FCCGGFFGGDFGGGFGGCGG7FGGGGGCGGAFFEEGC:FGGGGGGGGGDFGGFAGFGGGG7FEGGGGGGE7FGGG>EGGGFFFCFGGFCEEGGFGCGGGFGFDGFFGGCFGGG7C;,5=EF,CG59DCCG@,5CFFFG=FC*CFFGGGDFGGAFFFF
+@HWI-M00234:263:000000000-ADM55:1:1101:16569:3709 1:N:0:ATCACG
+CCCGTCAATTCCTTTGAGTTTCATTCTTGCGAACGTACTCCCCAGGTGGAATACTTATTGCGTTTGCTGCGGCACCGAATGGCTTTGCCACCCGACACCTAGTATTCATCGTTTACGGCGTGGACTACCAGGGTATCTAATCCTGTTTGCTCCCCACGCTTTCGAGCCTCAACGTCAGGATCGGAAGAGCACACGTCTGAACTCCAGTCACATCCCG
++
+CCCCCGGGGGGGGGGGGGFGGGGGGGGGGGGGGGGGGGGGGGGGGGGFGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGFGGGGGGGGGGGG9FGGGGDGGGGGGGECGGGGGEGCGGGGGGGDGGGFGGGGGFGGGGGGFGGGGGGGGGGGACFGGGFGGGGGFGGGGGCFGGGGGGFFFFFFEF:65CFFF8FEF7AFEFEE(,6
+@HWI-M00234:263:000000000-ADM55:1:1101:22403:3828 1:N:0:ATCACG
+CCCGGACATCTTCGGCGCAGGATCTCTTGACTAGTGAGCTATTACGCACTCTTTAAATGAGTGGCTGCTTCTAAGCCAACATCCTAGTTGTCTTAGAAATCCCACATCCTTTTCCACTTAACTTACACTTTGGGACCTTAGCTGATGAGATCGGAAGAGCACACGTCTGAACTCCAGTCACATCACGATCTCGTATGCCGTCTTCTGCTTGAAAAAAAAAAAAATATCAATCAAACACACACACACCAGCTTAC
++
+CCCCCGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGFGGGGGGGGGEGGGGGGGGFGGGGGGGGGGGGGGGGFGGGGGGGGGGGGGGGCGGFGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGG>DGGGGGGGGFDFFEDGGGCEEECGGGFGGGGGGFGGGGGGGFFFDGGGGFFGGG=D?DFFFF?CFFF5*:<EFE>+*3886=AAA@##################################
+@HWI-M00234:263:000000000-ADM55:1:1101:7508:4067 1:N:0:ATCACG
+GGTGCACTAGGATCGTAGTTGGCTACTTTCCCGTTTTCAATGTATACGCAAGGTACACGGTCAGCGGTAGCTGCCATAATGTAATGGTAGTCAAATCCTAAGTCTCCCAATGCACATGGCAGTGGAGCGTTCCAATCTTGTGTACCGGCTTTGTCTCCTAATCCCAAGTGCCATTTTCCGATAGCTCCGGTAGCATAACCGGTACTTTTGAACATAACCGCCATGGTATATTGTTCGGGACGGATAATCATTCCGGCATTTCCGGCAGCTACG
++
+CCCCCGFGGF8FFECFFCGE9FFGGGG9CFAFFCC@@CFGFGGCGFGGGGGGFFGDGEFFEFG8FGGF@@FGCFGGCA@FCFFCFGGGGFFGFF9??FFFFGGGGGFFF=FGGGDEF:F8,4@ACEE8CCEEGGGCCFG9FFFAFG6CGGEGE,=3EGC2;=EFFFGFGFGG9@9EGGGGC>8=DCFGGDFEFF+=7<AFFE>>5AAEF8AFE589*)849>524=;8*198?CE?9>59@>6(66@C<.))/5;>(13=EFE60(334:AB?
+@HWI-M00234:263:000000000-ADM55:1:1101:26232:4161 1:N:0:ATCACG
+CTCTTCTTAAGCTCGAACAGCTTCTTCAGTCTTACCTGCCATTTCATCTAAAATTTTTAAAGCTCGCTCTAAAACAGTAGTATCATCAATCATAACCAATCCACCATCTGGTCCAGGTTCCAAGTGAATCCCAACACTTTTCCCCTCCTTAAAATTGTGTCCACCGAAAAAATTTCTTACAGTGTCAACATTCAGTCCAAGTTCATCGGCTATTCTATGCATACTACCACTAGGCAATGAGT
++
+CCCCCGGFGFFFGGGGGGCFGGGGGGGGGGGFGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGCFGGFGEGFGGGGFGFGFGGGFAFDGCFGGGGFGGGFGCGFGGGGCGGGFGGGG:FFGGF@F9FGGGGGFGGGGGGCEGGC?FGGGGGGGFGGDFFGF8DFGGCGGGGCDFGGGGGGGGDFGGCFGFDF7;EFFFFFFFB<FDFFAEDFFFFFF@CEFCCEEFFFFFBEFE@8=@657>
+@HWI-M00234:263:000000000-ADM55:1:1101:23151:4189 1:N:0:ATCACG
+GCGGATTTTCTCGGGAGTATGATTACCCACACTATTGGATTCTTCCGAAGAAGACTCCATACTACCAAGTTCAGCTCGGATGGTGGATTTGCCTGCCAAGATCAGAAGAGCACACGTCTGAACTCCAGTCACATCACGACTTCGTATGCCGTATTCTGCTTGAAAAAAACAATGAAAACTAGTCACCGATGACTCACGTTCGCTGAACATTATCTGACAACTAGCTTAACAATGGACATGCTTAGCACTGACAACCAGACG
++
+CCC8AF,6,FGGCFEEBFGCAFGGGFGGF7FB8,CF,<,;,CEE<,@,8+,,6,,,CFFGGGGG,F<EA@F,B<F6@FC6@CBE9F7F,5:F9AF84A,ABFF,=A,A,4,4AEFEGGGGGD8=EC,,4,C;EF9,9=+4++,+4=8DGG6@#############################################################################################################
+@HWI-M00234:263:000000000-ADM55:1:1101:17148:4803 1:N:0:ATCACG
+CCCTTTTCGGCAATGGCGATGTTACGGTACATAAGAGCGATTTCGGGGAAACCTTCTTCGTCTGCAATATCAGCAAACTTAGGATAATCCAATGA
++
+AACBCDFA@@:+:CCEF7@CC@@AFFDGD;FDA@@6E@FF<,CC;@@+7@FG@F<CCFF@F@F@,<,B@F,CDG<@FEF<@,@,CAF9E<FD<??
+@HWI-M00234:263:000000000-ADM55:1:1101:8939:4808 1:N:0:ATCACG
+CCACAGTTCTGTCATATCGCAGTACAGGAATCTCAACCTGTTGTCCATCGGCTACGGCTCTCGCCCTCGCCTTAGGCCCCGACTTACCCAGGGCAGATCAGCTTTA
++
+CC8C9C6<EFGFEEGGGGGGGDECGFDE@FFAFGFGFGGGGGGGGFGFEE@FFGFEGGCFECDGCCFGC+6@B@@FFG,8F@FFGGGGFEDFCF@FFFGGDFFDFF
+@HWI-M00234:263:000000000-ADM55:1:1101:11727:5103 1:N:0:ATCACG
+CTCCCGTATAGGATGGATCGAAAGCAATCGTCAGGAATCCACGTTCTGCCAATGTCTGCGCATACAAGCCCGAAGCTTGTTCCTTCACGGCACCAAATGGGCCACTGATGGCAATGGCAGGCAATTTACCCGTCACATTCTTGGGTACATACAAATCGGCGGCAAGTGTAATGCCGTAACGGTTGTGGAAAG
++
+CCCCCGGGGGGGGFGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGFGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGFFGGGGGGGGGFGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGFFGGGGGGGGGGGGGGFGGFDF@GGDGGGGGGGGG4*;CFFF
+@HWI-M00234:263:000000000-ADM55:1:1101:15029:5173 1:N:0:ATCACG
+GGCCTATTCTCTGCGGCCGCCTTTCGGCGGCACCCCTTCTCCCGAAGTTACGGGGTCATTTTGCCGAGTTCCTTAACAATGCTTCTTCCGTCGGCCTTAGGATTCTCTCCTCATCCACCTGTGTCGGTTTACGGTACGGGTACAATATAAACAATAGCGGCTTTTCTTGACGGCCGGCTCATGGGCTTCCCTACTTTAGT
++
+CCCCCGGGGGGGGGGGGGGGGGGGGEGG7FECGFGGGGGEGGGGGEEGGGGGGGGGGGGGGGFGGGGGGGGGGGGFGGGCGGGGGGGGGGGGGGGFFGGGGGGGGGGFFG9FCGGGFGGGGGFFFDGGEECGGGGGGGGGGGGGGGGGGGGECGGGGGD>CCG>=98E79=CDDDD4D5DGF=FGGGDGFFFFFFFF6AC
+@HWI-M00234:263:000000000-ADM55:1:1101:7330:5248 1:N:0:ATCACG
+TGTGTATGAATGAGCGGCTACAGGCTTAGTCGATTTCTTTACTGCGCAGAAGCGGGACTGTGACCGACAAAACAGCCGTCGCCTCTCTACGTTCCGGGACCATACGCCGCTCGCAGTGATTGACCCTTACAACCTTGCGGGCGCTCTC
++
+CCCCCGEGGGGGGFGGGGGEGGGGGGFGGGGGGGGGGGGGGGGGGGGGGGFFGGGGDEGGGGGFGGGGGGGGGGECGGGGEFGDGAFGGGGGGFFG>GGECFFGCF+@CC@FGG++@FFFF,>F,DFFGGFFGCGEFG6CEG54*=@D
+@HWI-M00234:263:000000000-ADM55:1:1101:18630:5353 1:N:0:ATCACG
+GGCGTGTTCTGCCAAAATAGTGCTGGGCAATATACGACATAGAAGCGAAAGGCAATACTTTTTCTAAGGCCTGCCTGATTTCTACTGTTTTCACAATGGCTTGGGCTTCATTGATTGATTGCCTGGCACCATCTTGGAATGCTTGCGCAAACGCTTTTTTATCCTCCGGTGAAAGCGTCTGCAGAAAAGCCCTGAAACGTTTTTTATGGTCGGCCACTTCCTCAGGAGTATTG
++
+CCCCCGGGGGGGGGCGGGGGGGGGGFGGFGFGGGGGGGEGGGGGGGGGGGGGDECDFGGGGGGGGGGFGGGGDGGGGGGGGGGGGFFFGGGGGGGGGGGGGGGGGD8<FGGGFGGGGGGGFAEGGFGC,8EFGGGGFDC9DG9E9DCEE>EGGDGGFGGGGFG?FCFDED6F6DG6C6==DD7=D=D6DFF?F**3;9@?699CDBFF5FEB>>D>:@00>=C*8:;25;59*
+@HWI-M00234:263:000000000-ADM55:1:1101:11799:5476 1:N:0:ATCACG
+CCTAAATTTTCGAGTATAAGCAGGACCGAAGCCACCAACTTATACCTTATCCTCTAAATTTTCGTAAGAGACATGAAGCGGATCTCTAACTATTCCCGATTTTACTGCACCACTTGATCAAACGCTTCGGAACAAGAGCTTTTGAGTGATGTCTCGTTTCCACCACTTTGGCAGAAATAAAGCTAATCTACTATGATTCGATTAAGCAGCAAGAGCATAATTTTCGTTGCCAGATAAAATTT
++
+CCCC<FFFGGF@FFFGFFGCGCCFGGGEFGGD;CFFGFGGGGGGCFF@FFGGC<EEGGGCEFGGGF@E@@,BFFGFGGGGG7+@AFEAEFFGGGGGGGFFEGGFGGGCEGEFDGFGGFGG:=>@EC@@77@E>4DEC8C>DGGG>FGGGGF=DAECDDFDEG8==++=,6=FGDGFGGGGGGGGGGFFGFFFFFFFFFFDFFADFFFEAF@F@C5@EEF5=E;EE4477AFBEFBF;*A4>C
+@HWI-M00234:263:000000000-ADM55:1:1101:11348:5668 1:N:0:ATCACG
+GCCTAAATTTTCGTGCAGCGGCAGAACCAAAGCCATCAACCGTTGCCTTATCCTCTAAATTTTCACCCGCGCCACGAGGCTGACACGAACTATCCCCGATTTGACTGCACCACTTTATCGGAATGCTTCGGAGCAACAGCTTCCGAGTGATGTCACGTCCCAGCACCTGGTGCCGGGATTAAGCTTCAATCTACTATACTTCGATTAAGCAGCGAGAGCGTAACGAGTTTCGCCAGATAAAATTTTGAGGACTGAGATTAAAGTGAAAATC
++
+CCCCCGGGGGGGGGCGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGCFGFGGGGGDGGCGGGGGGGGGGGGGGFGGGGGGGGGGGGGGGFGGGGGGDGGGGGGGGGDGGG6>E9CCGGGGGGGGGGGGGGGGGGFGFGFFFFFFFFFFFFFFAFFFFFFFFFFFB199@F=9@DF@?;@FDFFFFFF>274A>B<?FABFF7?F???FB94:<<F26)-69>0
+@HWI-M00234:263:000000000-ADM55:1:1101:25874:5826 1:N:0:ATCACG
+CCTGCAGTGGATAGGGACCGAACTGTCTCACGACGTTCTGAACCCAGCTCACGTACCTCTTTAATGGGCGAACAGCCCAACCCTTGGGACCTTCTCCAGCCCCAGGATGAGATGAGCCGACATCGAGGTGCCAAACTTTCCCGCCGATATGGACGCCCGGGCAAAATCAGCTTGTTATCCCCAGGGTAGCTTTTATCCGTTGAGCGACGACCCTTCCATTCGGAATCGCCGGAATACTATGCCCTGCTTTCGCACCTGCCCAACCAGTCCGCCCAGCAGTTAAG
++
+CCCCCDFGGGG<@F,CE<FGGEGDDFG9EEEF7CGFGGG9<E@D@@EC,@FFFEGGG,C<9C<FGGFGF+@CGEECGEFFGGGG<F<A,,4?F?,?5EDF,,=BEF+,A<A,C,,AE84+F=+F>FFGGFFGD8D>DE,,373++++++6,,3@+++@9*@9>5@C*<::7,*0;CC7+:*39CF*045?8AC=A:BB:5)05/;6:6)86::8@F####################################################################
+@HWI-M00234:263:000000000-ADM55:1:1101:26932:5861 1:N:0:ATCACG
+AGCGTCAGTTACAGTCCAGAAAGCCGCCTTCGCCACTGGTGTTCTTCCTAATCTCTACGCATTTCACCGCTACACTAGGAATTCCGCTTTCCTCTCCTGCACTCTAGATATCCAGTTTGGAATGCAGCCCCCAGGTTAAGCCCGGGGATTTCACATCCCACTTAAACATCCGCCTACGCACCCTTTACCACCAGTAAATCCGGACAACGCTCGCCACCTACGTATTACCGCGGCTGCTGGCACGTAGTTAGCCGTGGCTTCCTCCTCTGGTACCTTCATTATCGTCCCCGAAACC
++
+96BCCFGGEGGGFGGGGG?EFFGGGGGCFG9FDFGGFG8FGGCFGGGGGGGGGFDGGDFEBFGFFGGGGGEEEFGGG<FFFCFCFFGDCFGFGG<8FGEFGGGCCFFAEGGFFGFFFFGG8EEFCEGG@EDEGGFGFFFFGGFCBEE8CF8=CFFAF,=D8F8FGG+@DC86?=CGFDGC9D6FC:FC*+;9*331?+=;ABB49>FDEB=45@@FFFBFF;8@E@FC)/6690(-1)),82?B??B################################################
+@HWI-M00234:263:000000000-ADM55:1:1101:14154:5990 1:N:0:ATCACG
+GTGGGATGTCAAGGTAAGCGGCGGCAGCCTTGGCTACAGCAAGAGATACGCCGAGGATGGCATTGGCACCCAGATTGGCTTTCGTTTTGGTTCCGTCCAGTGCAAGCATGGCATGGTCGATACCCATCTGGTCGAGGGCGGACATACCGATGAGCTTGGGAGCAATGATATTATTGATATTGTCCACGGCTTTCAGGAC
++
+CCCCCGGC<F9DE@EG9FF@@FGFGGFEFGF@E@FAFGGGFGFEE8FFEGGGGD>>=F8FG8?EEDFGGGGGG<FFD?FF@FFGE8F=,>FFEBCEFGGGFGGGGGGCEG8D?FFGGEGGFFEGEE8FFGGGG8++>8E>E5@BDA?FGGGGGGCFF6E==57??86ECFCF@CCCCBFCGDGGGG=*>3)868:7=FF
+@HWI-M00234:263:000000000-ADM55:1:1101:25022:6229 1:N:0:ATCACG
+CCCGAGAACGTATTCACCGCAACATTGCTGATTTGCGATTACTAGTGATTCCAACTTCATGTACTCGAGTTGCAGAGTACAATCCGAACTACGAACAGCTTTCTGAGGTTTGCTCCTCCTCGCAGATTTGCTGATCGGAAGAGCACACGTCTGAACTCCAGTCACATC
++
+CCCCCGGGGGGFGGGFGGGGEGGCFGFGGAEGGGDGGEGGGFGFFGG9FFGEFGGGGGGGGGAEGGG8FFGGG?EFGGGGCFGGGCCFGFFGCFGGGCGGGGGG9EF,EGGCFFGFFGGEEGGGDEGGGAFGGGCEFEEBE8EDFGGGGGGGGCGGGGGGGGFGCFDD
+@HWI-M00234:263:000000000-ADM55:1:1101:21023:6286 1:N:0:ATCACG
+GTGTACAAGGCCCGGGAACGTATTCACCGCGCCGTGGCTGATGCGCGATTACTAGCGAATCCAGCTTCATGGAGTCGGGTTGCAGACTCCAATCCGAACTGAGAGAGGCTTTAGGGATTAGCATCACGTCGCCGTGTAGCTGCCTTCTGTACCCCCCATTGTAACACGTGTGTAGCCCCGGACGTAAGGGCCGTGCTGATTTGCCGTCATCCCCACCTTCCTCAC
++
+CCCCCGGGCFFGGDEGGGGGGFGGGGGGGGGGGGGEGGGGGFEGGGGGGGDFFG9FCGGGGGGGGGGGFFFGGGGGEGCFGDGGGAG8EF<FFGGGGGGGFGGCDGDEGFGGGGGGGFGF?GGDFDFGDDEGD+B=DFFFD9DGFGGGGGEGCFCEGEGGGGFCF>FGGCGGGGCGGFDDG<55CF4CFF;5555>FFFFFA6+0(2,08)00(36,,)5:AB2:
+@HWI-M00234:263:000000000-ADM55:1:1101:8138:6336 1:N:0:ATCACG
+TGTGTACAAGGCCCGGGAACGTATTCACCGCGACATTCTGATTCGCGATTACTAGCAACTCCAGCTTCATGTAGGCGAGTTGCAGCCTACAATCCGAACTGAGATAGGTTTTATAAGTTTTGCTCCACCTCACGGTCTT
++
+CCCCCGGGF<FGGGGED@FGGGFGGGGGGDGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGCGFGGGCGGGGGGGGGGGGGFGGFEGGGGDGGEFCCGEFFGGGGAFGGGGGFGFFFGGFGGFGDFGGGGGG
+@HWI-M00234:263:000000000-ADM55:1:1101:11055:6543 1:N:0:ATCACG
+CCTGGACATTTTCGGCGCAGGACCTCCCGACCAGTGAGCTATTACGCACTCTTTGACTGTGTGGCTGCTTCTGAGCCAACATCCTGGTTGACTTTGAAATCTCACATACTTTTCCACTTAACACGCACTTTGGGACCTTAGCTGGAGGTCTTGGCTCTTTCCTTTTTGCCTATCCAACTTATCTCGTATAGTCTGACTCCCGG
++
+@B,8BF8EFGFGG77@7+8@@6,FFF<,+@C+6FF99@A@EC,CC,BFFDFGA<@D,C9F@CF7,B7CFGG,C@,B@<F?7FF8<,:,C@,?<EE,C?A,E,ACEFG9,C;@,,A;EEA,,?E9884B8=,9,4,@+7>@,B;=,66+@D,,@,3=EF=:@F,C=886,+6@D8D+6+0==C9+6+5+0;+1+3BC1<A?9>9
+@HWI-M00234:263:000000000-ADM55:1:1101:24980:6575 1:N:0:ATCACG
+GCCATTTATCTACGCCTGTTGTCACCAACAGGCTCTAGCGGTCTACCCTCCGACGTGGGGCGAGCAACCCTCATA
++
+CCCCCGGGGGFGGGGGGGGGGGFGGGGGGGG@G<FFFGGGEEGGGGGGFGGCECFGGGGGD:@FGGGGG7ADGGG
+@HWI-M00234:263:000000000-ADM55:1:1101:7596:6682 1:N:0:ATCACG
+GCCCCCGTCAATTCCTTTGAGTTTCACCGTTGCCGGCGTACTCCCCAGGTGGAATACTTAACGCTTTCGCTTGGCGGCTGACAATGTATCGCCAACCGCGAGTATTCATCAGATCGGAAGAGCACACGTCTGAACTCCAGTCACATCCCGATCTCGTATGCCGTCCTCGGCTTGAAAAAAAAAAATATAAACCATGATGAATTTCGAACACTCACGACCACACACTAAGCGTCGACGTA
++
+CCCCCGGGGGGACFGGGGGFFEEGGGGGGFFEGGGGGGGGGGEGFGGGGEFG@FGDFFGGGGGGGEGGGDGFFCC>FGCDFGFGGGCE,E:FCCCC7CGGGGGGFE;FFEFCCGFGG@CEFGGGG@F@>@8DGGG=;@FFFGGC;E6,@@+4:,318;9,@FG@###########################################################################
+@HWI-M00234:263:000000000-ADM55:1:1101:24419:6736 1:N:0:ATCACG
+CGGGCGTTGGCAAGTACGTTATATCACTTACCCACGCTCGATTCAGAACCCCAGGAGTAAATGCTCGTTTTAAGAGGTTGGGATACACAGGCATGGTGTGATTACTGTCGGTGGTTTTTACGGTTCGCTTAAAAAAGCGGTAACCAATGATGCCATTAAAGCGAAGGATAGCGCGTAAACGTTTGACACCAACTTTCACTCCACGGTGTTGCATCAAAGC
++
+CCCCCGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGDGGGGGFGGGGGGGDGGGGGGGGGGGGGGGGDFGGGGGGGGGGGGGGGGGGGGGGGGFGGGFGGGGGGGGD9FFCFEGGGFGGGGG7=+4>@EFEEFFG7>EEDEEEFDDDG@8DCFEFDFGGC8=CDCGGFGGDC6>DDGDCFDGDGDGFGG@AFBA?FFFFFFFFABBF95B@AFFFFFFFF
+@HWI-M00234:263:000000000-ADM55:1:1101:5068:6755 1:N:0:ATCACG
+GCAGCGGCAGAACCAAAGCCATCAACCGTTGCCTTATCCTCTAAATTTTCACCCGCGCCACGAGGCTGACACGAACTATCCCCGATTTGACTGCACCACTTTATCGGAATGCTTCGGAGCAACAGCTTCCGAGTGATGTCACGTCCCAGCACCTGGTGCCGGGATTAAGCTTCAATCTACTATACTTCGATTAAGCAGCGAGAGCGTAACGAGTTTCGCCAGATAAAATTTTGAGGACTGAGATTAAAGTGCAAATC
++
+CCCCCGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGDFF?FGGGGGDFGGGGGGGGGGFFFFGGGGGFGGFGGGGGGDGGGGGGGFGGGEEDGGG9C9EEGGGGGD8@FGGGGGGGGGGGGG>CFGGGGGCFGDGDFGFGGF7CFGDF>FFFAF=;A>EDDBFBBFFF@D@D<E?@F01;@<?C<471.2)48<??2(549<B>FDF24)66<))
+@HWI-M00234:263:000000000-ADM55:1:1101:21477:6796 1:N:0:ATCACG
+CCCCACTGCTGCTTCCCGTAGGAGTTTGGACCGTGTCTCAGTTCCAATGTGGGGGACCTTCCTCTCAGAACCCCTATCCATCGTTGACTAGGTGGGCCGTTACCCCGCCTACTATCTAATGGAACGCATCCCCATCGTCTACCGGAAAATACCTT
++
+CC,AC:F8<F@CCEDGGCEGGGGGFAG<FGG8@FEFEFFCEGGCFF<<<F@<C+@FF:AFCEFE,ECF9AFGC@DE<FE,,5@9B8BFFCE8F,=FF@CG7FCFGD:FFF7EAFDG9F;FFF@:FEEG@4=@DEFG6=EGCADC6@ECCA,@DDF
+@HWI-M00234:263:000000000-ADM55:1:1101:12483:6880 1:N:0:ATCACG
+CTCCTTGTCTGCCTTCGATTACGGCATTTGCAATCGTTCCTGTAAGTAGTTTTACAGCTCTAATGGCATCGTCATTCCCTGGTATTACGTAGTCTATTTCATCAGGATCACAGTTAGTATCAACTATTGCTACAACTGGTATTCCTAATATCTTCGCTTCATTTACTGCAATTCTTTCTTTTCTTGGATCTACAACAAATAATACATCAGGAAGACCACCCATATCTTGAATGCCACCTAAAAACTTTTCAA
++
+CCCCCGGGGGGGFGGFGGGGGFGDFEGGGGGFFFGGFGGGGGGGGFGGGFGGGGGGGGCEGGGGCFGGGGGGGGGGGGFGGGFEGGDGGGGFFFGGGGGGGGFGGGGGGGGGGFGFGCF@FEFFGDAGFGFGGGGFGGGGDGGGFFGGGD;EEFGGGGGGGFGGGGGGGGGGFDGDGGGGGGGGGGGDGFFFFFFF9;;DFFFFFBFFBDBFFBFD=DDFDFFFEFEFEFEECE<@E@CFF@EBAFFEEEFF
+@HWI-M00234:263:000000000-ADM55:1:1101:27958:6935 1:N:0:ATCACG
+CCATTCGGAAATCCGCGGATCAAAGGTCATTTGCACCTACCCGCAGCTTATCGCAGCTTATCACGTCCTTCATCGCCTCCGAGAGCCAAGAGATCGGAAGAGCACACGTCTGAACTCCAGTCACATCACGATCTCGTATGCCGTCTTCTGCTTGAAAAAAAAAACCCACAAATTCACACTACACACCCACCTCCCATCACGCATCTCTTTTGTCCGAGTCACGCTGCACGCTACCTGCACACTACCTGCCTCAGTTACATCTTTTTACTCAATGTCCCACCATTTATCAC
++
+CCCCCGGGGGGGGGGGDGGCFGGGGGGGFEGGGGGGGGGGGGGGGGGGGGGGGGGGG8DC<FGGGFFGGGGGGGGGGCGF:FDGGGGGG@FEEEGGGEGDGGGFGGGGGG:FFGG=EGFFFCEFG9EEFGD+@@EEDED8DA>EEC@EFGFAFFGF=F?+44;C##############################################################################################################################
+@HWI-M00234:263:000000000-ADM55:1:1101:6151:7404 1:N:0:ATCACG
+GCACGTAGTTAGCCGGGGCTTCCTCCTAAGGTACCGTCATTATCGTCCCTTAGGACAGAGCTTTACGATCCGAAAACCTTCATCGCTCACGCGGCGTCGCTGCATCAGAGTTCCCTCCATTGTGCAATATTCCCCACTGCTGCCTCCCGTAGGAGTCTGGACCGTGTCTCAGTTCCAGTGTGGCCGTTCACCCTCCCAGGCCGGCTACCCATCGTCGCCTTGGTTAGCTATTACCTCCCCAACTAGCTAATGGGACGCGAGTCCAGCTTATACCACTTAACCGCTTTTGCTTGAAAATCA
++
+CCCCCGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGGFGFGGGGGGGGGGFGGGGGGGGGGGGGGGGGGDF8FGGGFGGGGEGGG7+CGGFGGGGGGGGC:8FGGGDFGFEGGGFGGGFGCGGGGGGGGDG?EGGGGGFF,<FGGGGFDGGGG,5,EFGGGD++*5:DGFCDD?6>AFFF4?6)5?EB?D0>DFFFAF0(/.6<D03;3().646<A)).))(4:0<BFBD?F<2<AFF<B############################################
\ No newline at end of file
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/report_illumina_1_3_fastq_output.txt	Tue Apr 26 08:17:42 2016 -0400
@@ -0,0 +1,4 @@
+Information to extract:
+	sequences
+Number of similarity records: 36
+Number of extracted similarity records: 36
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/report_length_fasta_output.txt	Tue Apr 26 08:17:42 2016 -0400
@@ -0,0 +1,4 @@
+Information to extract:
+	length
+Number of similarity records: 36
+Number of extracted similarity records: 36