changeset 0:614a12d56e58 draft default tip

planemo upload for repository https://github.com/sanbi-sa/tools-sanbi-uwc/tree/master/tools/fasttree commit 4db125fcd73327813d7bd511852bbe9ffc68a25c
author sanbi-uwc
date Mon, 09 Jan 2017 08:07:45 -0500
parents
children
files fasttree.xml test-data/sample_aln1.fasta test-data/sample_aln2.fasta
diffstat 3 files changed, 937 insertions(+), 0 deletions(-) [+]
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/fasttree.xml	Mon Jan 09 08:07:45 2017 -0500
@@ -0,0 +1,137 @@
+<tool id="fasttree" name="FastTree" version="0.1">
+  <description>infers approximately-maximum-likelihood phylogenetic trees from alignments of nucleotide or protein sequences.</description>
+
+  <requirements> <!-- Package dependency declared for this tool: fasttree, pinned to version 2.1.9. -->
+    <requirement type="package" version="2.1.9">fasttree</requirement>
+  </requirements>
+
+  <command detect_errors="aggressive"> <!-- Builds the FastTreeMP command line: exports OMP_NUM_THREADS from GALAXY_SLOTS (falling back to 1), adds -nt when the alignment-type select of the active branch (alignment_type1 or alignment_type2) is 'nucl', appends the advanced flags and the chosen model option only when advanced options are enabled, then reads the input alignment and redirects stdout to the output tree. -->
+  <![CDATA[
+    OMP_NUM_THREADS=\${GALAXY_SLOTS:-1} &&
+    export OMP_NUM_THREADS &&
+    FastTreeMP
+    #if ( ( str( $advanced_options.advanced_options_selector ) == 'false'
+           and str( $advanced_options.alignment_type1 ) == 'nucl' ) or
+          ( str( $advanced_options.advanced_options_selector ) == 'true'
+             and str( $advanced_options.alignment_type_selection.alignment_type2 ) == 'nucl' ) ):
+      -nt
+    #end if
+    #if str( $advanced_options.advanced_options_selector ) == 'true':
+      $advanced_options.fastest
+      $advanced_options.gamma
+      $advanced_options.noml
+      $advanced_options.nosupport
+      $advanced_options.log
+      #if str( $advanced_options.alignment_type_selection.alignment_type2 ) == 'nucl':
+        $advanced_options.alignment_type_selection.nucl_alignment_model
+      #else
+        $advanced_options.alignment_type_selection.prot_alignment_model
+      #end if
+    #end if
+    '${input_alignment}' > '${output_tree}'
+  ]]>
+  </command>
+
+  <inputs>
+    <param name="input_alignment" type="data" format="fasta,phylip"
+      label="Multiple sequence alignment" />
+    <conditional name="advanced_options"> <!-- Both branches expose an alignment-type select, under different names: alignment_type1 (basic) and alignment_type2 (advanced, nested). -->
+      <param name="advanced_options_selector" type="select" label="Advanced options">
+        <option value="true">Yes</option>
+        <option value="false" selected="True">No</option>
+      </param>
+      <when value="true">
+        <param argument="-fastest" type="boolean" truevalue="-fastest" falsevalue=""
+          label="Fastest mode (recommended for > 50,000 sequences)" />
+        <param argument="-gamma" type="boolean" truevalue="-gamma" falsevalue=""
+          label="Rescale likelihoods using Gamma20 model" />
+        <param argument="-noml" type="boolean" truevalue="-noml" falsevalue=""
+          label="Disable Maximum-Likelihood topology refinement step" />
+        <param argument="-nosupport" type="boolean" truevalue="-nosupport" falsevalue=""
+          label="Disable computation of support values for tree splits" />
+        <param argument="-log" type="boolean" truevalue="-log output_log.txt" falsevalue=""
+          label="Save log file" />
+        <conditional name="alignment_type_selection">
+          <param name="alignment_type2" type="select" label="Alignment type">
+            <option value="nucl">Nucleotide</option>
+            <option value="prot" selected="True">Protein</option>
+          </param>
+          <when value="nucl">
+            <param name="nucl_alignment_model" type="select" label="Alignment model">
+              <option value="" selected="True">Jukes-Cantor+CAT</option>
+              <option value="-gtr">GTR+CAT</option>
+            </param>
+          </when>
+          <when value="prot">
+            <param name="prot_alignment_model" type="select" label="Alignment model">
+              <option value="">JTT+CAT</option>
+              <option value="-wag">WAG+CAT</option>
+              <option value="-lg">LG+CAT</option>
+            </param>
+          </when>
+        </conditional>
+      </when>
+      <when value="false">
+        <param name="alignment_type1" type="select" label="Alignment type">
+          <option value="nucl">Nucleotide</option>
+          <option value="prot" selected="True">Protein</option>
+        </param>
+      </when>
+    </conditional>
+
+  </inputs>
+
+  <outputs>
+    <data name="output_tree" format="nhx" /> <!-- Receives FastTreeMP's stdout through the redirect at the end of the command. -->
+    <data name="output_log" format="txt" from_work_dir="output_log.txt" label="Log from ${tool.name} on ${on_string}"> <!-- Kept only when advanced options are on and "Save log file" is set; output_log.txt is the file name passed to -log. -->
+      <filter>advanced_options['advanced_options_selector'] == 'true' and advanced_options['log'] is True</filter>
+    </data>
+  </outputs>
+
+  <tests>
+    <test> <!-- Basic mode on a nucleotide alignment: the tree must begin with the expected nested clades. -->
+      <param name="input_alignment" value="sample_aln1.fasta" ftype="fasta" />
+      <param name="advanced_options_selector" value="false" />
+      <param name="alignment_type1" value="nucl" />
+      <output name="output_tree">
+        <assert_contents>
+          <has_text_matching expression="^\(\(\(471528:[^,]+,\(\(484305:[^,]+,\(471785:[^,]+,\(484347:[^,]+,484343:" />
+        </assert_contents>
+      </output>
+    </test>
+    <test> <!-- Basic mode with alignment_type1 left at its default: checks the leading structure of the tree. -->
+      <param name="input_alignment" value="sample_aln2.fasta" ftype="fasta" />
+      <param name="advanced_options_selector" value="false" />
+      <output name="output_tree">
+        <assert_contents>
+          <has_text_matching expression="^\(\(N3970:\d\.\d+,N3339:\d\.\d+\)\d+\.\d+:\d\.\d+,\(\(\(\(N3243:\d\.\d+,\(\(N3234:\d\.\d+,\(N500:" />
+        </assert_contents>
+      </output>
+    </test>
+    <test> <!-- Advanced mode with the log enabled: the log output must contain the expected settings line. -->
+      <param name="input_alignment" value="sample_aln2.fasta" ftype="fasta" />
+      <param name="advanced_options_selector" value="true" />
+      <param name="log" value="True" />
+      <output name="output_log">
+        <assert_contents>
+          <has_text text="Amino acid distances: BLOSUM45 Joins: balanced Support: SH-like 1000" />
+        </assert_contents>
+      </output>
+    </test>
+  </tests>
+
+  <help> <!-- Help text uses reStructuredText link syntax: `FastTree`_ is a named reference resolved by the ".. _FastTree:" target line below it. -->
+  <![CDATA[
+    FastTree infers approximately-maximum-likelihood phylogenetic trees from
+    alignments of nucleotide or protein sequences. For more information see
+    the `FastTree`_ website.
+
+    .. _FastTree: http://www.microbesonline.org/fasttree
+  ]]>
+  </help>
+
+  <citations> <!-- Works cited for this tool, given as DOIs; presumably the FastTree publications (TODO confirm against the DOI records). -->
+    <citation type="doi">10.1093/molbev/msp077</citation>
+    <citation type="doi">10.1371/journal.pone.0009490</citation>
+  </citations>
+</tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/sample_aln1.fasta	Mon Jan 09 08:07:45 2017 -0500
@@ -0,0 +1,100 @@
+>484463 study_id=38100 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTGACAGAATGCTTAACACATGCAAGTCT-TTGGCAAGGCGGACGGGTGAGTAACGCGTAAAGAACTTGCCCTGCAGACAGGGATAACAGACGGAAACGACTGACAACACCTGATACTGCGGGAGAGCTTTGCGTCCTATTAGCTTGTTGGCGGGGTAACGGCCCACCAAGGCGATGATAGGTAGCCGGCCTGAGAGGGTGAACGGCCACAAGGGGACTGAGATACGGCCCTTACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGGGCAACCCTGATCCAGCAATTCTGTGTGCACGATGAAGGTTTTCGGATTGTAAAGTGCTTTCAGCAGGGAAGCGGTACCTGCAGAAGAAGCGACGGCTAAA-TACGTGCCAGCAGCCGCGGTAATACGTATGTCGCAAGCGTTATCCGGAATTATTGGGCATAAAGGGCATCTAGGCGGCCAGGCAAGTCTGGGGTGAAAACTTGCGGCTCAACCGCAAGCCTGCCCTGGAAACTGCCTGGCTAGAGTGCTGGAGAGGTGGACGGAACTGCACGAGTAGAGGTGAAATTCGTAGATATGTGCAGGAATGCCGATGATGAAGATAGTTCACTGGACGGCAACTGACGCTGAAGTGCGAAAGCTGGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCCAGCCGTAAACGATGATTACTGGGTGTGGGCCCGTGCCGAAGCAAATGCGATAAGTAATCCGCCTGGGGAGTACGGCCGCAAGGCTGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGACGCAACGCGAGGAACCTTACCAGATCTTGACATCCAGGTGGTGCATGGCTGTCGACAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTATCGCCAGTTGCGACTCTGGCGAGACTGCCTGCGAAGAGCAGGAGGAAGGTGGGGATGACGTCAAGTCATCATGCCCCTTATGATCTGGGCTACACACGTGCTACAATGGCCGGTACAGAGAGCTGCGAAGCGGCAACGCCCAGCGAATCTTC-AAAGCCGGTCCAAGTTCGGATTGAAGTCTGCAACTCGACTTCATGAAGCTGGAATCGCTAGTAATCGCAGATCAGCATGCTGCGGTGAATACGTT-TCGGGTCTTGTACACACCGCCCGTCACACCACGAGAGTTGTCTGCACCTGAAGCTGCCATCTAAGGTGTGGACAGTGATTGGGGTGAAGTCGTAACAAGGTATCCGT
+>484462 study_id=38100 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTGACAGAATGCTTAACACATGCAAGTCT-TTGGCAAGGCGGACGGGTGAGTAACGCGTAAAGAACTTGCCCTGCAGACAGGGATAACAGACGGAAACGACTGACAACACCTGATACTGCGGGAGAGCTTTGCGTCCTATTAGCTTGTTGGCGGGGTAACGGCCCACCAAGGCGATGATAGGTAGCCGGCCTGAGAGGGTGAACGGCCACAAGGGGACTGAGATACGGCCCTTACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGGGCAACCCTGATCCAGCAATTCTGTGTGCACGAGGAAGGTTTTCGGATTGTAAAGTGCTTTCAGCAGGGAAGCGGTACCTGCAGAAGAAGCGACGGCTAAA-TACGTGCCAGCAGCCGCGGTAATACGTATGTCGCAAGCGTTATCCGGAATTATTGGGCATAAAGGGCATCTAGGCGGCCAGGCAAGTCTGGGGTGAAAACTTGCGGCTCAACCGCAAGCCTGCCCTGGAAACTGCCTGGCTAGAGTGCTGGAGAGGTGGACGGAACTGCACGAGTAGAGGTGAAATTCGTAGATATGTGCAGGAATGCCGATGATGAAGATAGTTCACTGGACGGCAACTGACGCTGAAGTGCGAAAGCTGGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCCAGCCGTAAACGATGATTACTGGGTGTGGGCCCGTGCCGAAGCAAATGCGATAAGTAATCCGCCTGGGGAGTACGGCCGCAAGGCTGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGACGCAACGCGAGGAACCTTACCAGATCTTGACATCCAGGTGGTGCATGGCTGTCGACAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTATCGCCAGTTGCGACTCTGGCGAGACTGCCTGCGAAGAGCAGGAGGAAGGTGGGGATGACGTCAAGTCATCATGCCCCTTATGATCTGGGCTACACACGTGCTACAATGGCCGGTACAGAGAGCTGCGAAGCGGCAACGCCCAGCGAATCTTC-AAAGCCGGTCCAAGTTCGGATTGAAGTCTGCAACTCGACTTCATGAAGCTGGAATCGCTAGTAATCGCAGATCAGCATGCTGCGGTGAATACGTT-TCGGGTCTTGTACACACCGCCCGTCACACCACGAGAGTTGTCTGCACCTGAAGCTGCCATCTAAGGTGTGGACAGTGATTGGGGTGAAGTCGTAACAAGGTATCCGT
+>484461 div_ratio=1.127 study_id=40698 non_ACGT_percent=0.0000 decision=named_isolate
+GACGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGACAG-GCACGCGGATGGGTGAGTAACGCGTGGGTAACCTGCCCTTAAGTCTGGGATACCATTTGGAAACAGATGCTAATACCGGATACTAAAGGATGGACCTGCGATGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCGATGATGCATAGCCGAGTTGAGAGACTGATCGGCCACATTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCACAATGGACGCAAGTCTGATGGAGCAACGCCGCGTGAGTGAAGAAGGTTTTCGGATCGTAAAGCTCTGTTGTTGGTGAAGCGGTAATCAACCAGAAAGTCACGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGATTTATTGGGCGTAAAGCGAGCGCAGGCGGATTGATAAGTCTGATGTGAAAGCCTTCGGCTCAACCGAAGAA-CGCATCAGAAACTGTCAATCTTGAGTGCAGAAGAGGAGAGTGGAACTCCATGTGTAGCGGTGGAATGCGTAGATATATGGAAGAACACCAGTGGCGAAGGCGGCTCTCTGGTCTGTAACTGACGCTGAGGCTCGAAAGCATGGGTAGCGAACAGGATTAGATACCCTGGTAGTCCATGCCGTAAACGATGAGTGCTAAGTGTGGGACAGTGCTGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATCCAGGTGGTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTTAATAGTTGCCACTCTATTGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGCCCCTTATGACCTGGGCTACACACGTGCTACAATGGGCAGTACAACGAGAAGCGAACCTGTGAAGGCAAGCGGATCTCTTAAAGCTGTTCTCAGTTCGGACTGTAGGCTGCAACTCGCCTACACGAAGCTGGAATCGCTAGTAATCGCGGATCAGCACGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGAGAGTTTGTAACACCCAAAGTCGGCGCCTAAGGTGGGACAGATGATTAGGGTGAAGTCGTAACAAGGTAGCCGT
+>484454 study_id=40697 non_ACGT_percent=0.0000 decision=named_isolate
+GACGAACGCTGGCGGCGTGCC-AATACATGCAAGTCGAGCGAAGCGGCGGATGGGTGAGTAACACGTGGGGAACCTGCCCCATAGTCTGGGATACCACTTGGAAACAGGTGCTAATACCGGATACTATGGGATGGCCCCGCGGTGCATTAGCTAGTTGGTAAGGTAAAGGCTTACCAAGGCGATGATGCATAGCCGAGTTGAGAGACTGATCGGCCACATTGGGACTGAGACACGGCCCAAACT-CTACGGGAGGCAGCAGTAGGGAATCTTCCACAATGGACGCAAGTCTGATGGAGCAACGCCGCGTGAGTGAAGAAGGTTTTCGGATCGTAAAGCTCTGTTGTTGGTGAAGCGGTAATCAACCAGAAAGTCACGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGATTTATTGGGCGTAAAGCGAGCGCAGGCGGAAGAATAAGTCTGATGTGAAAGCCCTCGGCTTAACCGAGGAACTGCATCGGAAACTGTTTTTCTTGAGTGCAGAAGAGGAGAGTGGAACTCCATGTGTAGCGGTGGAATGCGTAGATATATGGAAGAACACCAGTGGCGAAGGCGGCTCTCTGGTCTGCAACTGACGCTGAGGCTCGAAAGCATGGGTAGTGAACAGGATTAGATACCCTGGTAGTCCATGCCGTAAACGATGAGTGCTAAGTGTTGGGCAGTGCTGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGC-GTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATCCAGGTGGTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTTATTAGTTGCCACTCTAATGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGCCCCTTATGACCTGGGCTACACACGTGCTACAATGGGCAGTACAACGAGAAGCGAGCCTGCGAAGGCAAGCGAATCTCTGAAAGCTGTTCTCAGTTCGGACTGCAGTCTGCAACTCGACTGCACGAAGCTGGAATCGCTAGTAATCGCGGATCAG-ACGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTCTGCAATGCCCAAAGCCGGCGTCTAAGGCAGGGCAGATGACTGGGGTGAAGTCGTAACAAGGTAGCCGT
+>484444 div_ratio=1.151 study_id=40696 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCCGGCGGTGTGCC-AATACATGCAAGTCGAACGCAGTGGCGGACGGGTGAGTAACACGTAGGCAACCTGCCCAGAAGCGGGGGACAACATTTGGAAACAAGTGCTAATACCGCATACTTCTGGATGGGCCTGCGGCGCATTAGCTAGTTGGTAAGGCAACGGCTTACCAAGGCAGTGATGCGTAGCCGAGTTGAGAGACTGATCGGCCACAATGGAACTGAGACACGGTCCATACT-CTACGGGAGGCAGCAGTAGGGAATCTTCCACAATGGGCGCAAGCCTGATGGAGCAACACCGCGTGAGTGAAGAAGGGTTTCGGCTCGTAAAACTCTGTTGTTGAAGAAGCGGTATTCAACCAGAAAGTCACGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTATCCGGATTTATTGGGCGTAAAGCGAGCGCAGGCGGTTTTCTAAGTCTGATGTGAAAGCCTTCGGCTTAACCGGAGAAGGGCATCGGAAACTGGATAACTTGAGTGCAAGAGAGGACAGTGGAACTCCATGTGTAGCGGTGGAATGCGTAGATATATGGAAGAACACCAGTGGCGAAGGCGGCTGTCTAGCTTGCAACTGACGCTGAGGCTCGAAAGCATGGGTAGCGAACAGGATTAGATACCCTGGTAGTCCATGCCGTAAACGATGAGTGCTAGGTGTTGGACAGTGCCGGAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGC-GTGGAGCATGTGGTTTAATTCGAAGCTACGCGAAGAACCTTACCAGGTCTTGACATCCAGGTGGTGCATGGTCGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTTACTAGTTGCCACTCTAGTGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGACGACGTCAGATCATCATGCCCCTTATGACCTGGGCTACACACGTGCTACAATGGACGGTACAACGAGCAGCGAACTCGCAAGGGCCAGCTAATCTCTTAAAACCGTTCTCAGTTCGGACTGCAGTCTGCAACTCGACTGCACGAAGTCGGAATCGCTAGTAATCGCGGATCAG-ATGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTTTGCAATGCCCAAAGCCGGCGTCTAAGGCAGGGCAGATGACTGGGGTGAAGTCGTAACAAGGTAGCCGT
+>484443 study_id=38100 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAGCGAAGCGGCGGACGGGTGAGTAACGCGTAGGCAACCTGCCCTTCACAGAGGTATAGCCTCGGGAAACCGGGATTAAAACCACATAGTGAAGGATGGGCCTGCGTCTGATTAGCTGGTTGGTAGGGTAAAAGCCTACCAAGGCGACGATCAGTAGCCGACCTGAGAGGGTGATCGGCCACATTGGAACTGAGACACGGTCCAAACTCCTACGGGAGGCAGCAGTGGGGGATATTGCACAATGGGGGAAACCCTGATGCAGCAACGCCGCGTGAGGTATGAAGGCCTTTGGGTTGTAAGCCTCTGTCCTAGGGGAAGCGGTACCCGAGGAGGAAGCCCCGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCAAGCGTTATCCGGAATTATTGGGCGTAAAGAGTGCGTAGGTGGTCTACTAAGCGCGAGGTGAAAGGCAATGGCTCAACCATTGTT-AGCCTTGCGAACTGGCAGACTTGAGTGCAAGAGAGGAAAGCGGAATTCCTAGTGTAGCGGTGAAATGCGCAGATATTAGGAGGAACACCGGCGGCGAAGGCGGCTTTCTGGATTGTAACTGACACTGAGGCACGAAAGCGTGGGTAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGCACTAGGTGTC-GGCGGTGCCGCAGTTAACGCAATAAGTGCTCCGCCTGGGGAGTACGCACGCAAGTGTAAAACTCAAAGGAATTGACGGGGACCCGCACAAGCAGCGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAAGACTTGACATCCAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTCTTTAGTTGCCACTCTAAAGAGACTGCCGGGGA-AACTCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGTCTTGGGCTACACACGTGCTACAATGGCCGGTACAAAGAGAAGCGATACCGCAAGGGGGAGCAAATCTTA-AAAACCGGTCCCAGTTCGGATTGCAGGCTGCAACTCGCCTGCATGAAGTCGGAGTTGCTAGTAATCGCAGATCAG-ATGCTGCGGTGAATGCGTTCCCGGGTCTTGTACACACCGCCCGTCACACCATGGAAGTTGGGGGCGCCCGAAGTTGGTACCTAAGGCGAAATCAATGACTGGGGTGAAGTCGTAACAAGGTAGCCGT
+>484442 study_id=38100 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAGCGAAGCGGCGGACGGGTGAGTAACGCGTAGGCAACCTGCCCTTCACAGAGGTATAGCCTCGGGAAACCGGGATTAAAACCACATAGTGAAGGATGGGCCTGCGTCTGATTAGCTGGTTGGTAGGGTAAAAGCCTACCAAGGCGACGATCAGTAGCCGACCTGAGAGGGTGATCGGCCACATTGGAACTGAGACACGGTCCAAACTCCTACGGGAGGCAGCAGTGGGGGATATTGCACAATGGGGGAAACCCTGATGCAGCAACGCCGCGTGAGGTATGAAGGCCTTTGGGTTGTAAGCCTCTGTCCTAGGGGAAGCGGTACCCGAGGAGGAAGCCCCGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCAAGCGTTATCCGGAATTATTGGGCGTAAAGAGTGCGTAGGTGGTCTACTAAGCGCGAGGTGAAAGGCAATGGCTCAACCATTGTT-AGCCTTGCGAACTGGCAGACTTGAGTGCAAGAGAGGAAAGCGGAATTCCTAGTGTAGCGGTGAAATGCGCAGATATTAGGAGGAACACCGGCGGCGAAGGCGGCTTTCTGGATTGTAACTGACACTGAGGCACGAAAGCGTGGGTAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGCACTAGGTGTC-GGCGGTGCCGCAGTTAACGCAATAAGTGCTCCGCCTGGGGAGTACGCACGCAAGTGTAAAACTCAAAGGAATTGACGGGGACCCGCACAAGCAGCGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAAGACTTGACATCCAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTCTTTAGTTGCCACTCTAAAGAGACTGCCGGGGA-AACTCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGTCTTGGGCTACACACGTGCTACAATGGCCGGTACAAAGAGAAGCGATACCGCAAGGGGGAGCAAATCTTA-AAAACCGGTCCCAGTTCGGATTGCAGGCTGCAACTCGCCTGCATGAAGTCGGAGTTGCTAGTAATCGCAGATCAG-ATGCTGCGGTGAATGCGTTCCCGGGTCTTGTACACACCGCCCGTCACACCATGGAAGTTGGGGGCGCCCGAAGTTGGTACCTAAGGCGAAATCAATGACTGGGGTGAAGTCGTAACAAGGTAGCCGT
+>484439 study_id=38100 non_ACGT_percent=0.0000 decision=named_isolate
+GATAAACGCTGGCGGCGTGCTTAACACATGCAAGTTGGACGGAGTAGCGGACGGGTGAGTAATGCATAAGA-ATCTATCCATCAGAGGGGGACAACTGCGGGAAACCGGAGCTAATACCCCGTACTGATGGAGGAGCTTGTGTCCTATCAGGTAGTTGGTGAGGTAAGAGCTCACCAAGCCGAAGACGGGTAGCCGGGCTGAGAGGTTGTACGGCCACATTGGAACTGAGAGACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGGCAATGGGCGAAAGCCTGACCCAGCGACGCCGCGTGAGGGAAGACGGCCTTCGGGTTGTAAACCTCTGTTGCAGGGGAAGCGGTACCCTGCGAGGAAGCTCCGGCAAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGGAGCGAGCGTTATCCGGAATTACTGGGCGTAAAGGGCGCGTAGGCGGAATGACAAGTCAGAAGTGAAAGCGTGGGGCTCAACCCCATGA-TGCGGCTGAAACTGTTATTCTAGAGGCATGGAGAGGCAAACGGAATTCCCGGTGTAGCGGTGAAATGCGTAGATATCGGGAAGAACACCAGTGGCGAAGGCGGTTTGCTGGCCA-TGACTGACGCTCAAGCGCGAAAGCTAGGGTAGCAAACGGGATTAGATACCCCGGTAGTCCTAGCAGTAAACGATGTATGCTGGGTGTGGGTCCGTGCCGAAGTTAACGCGATAAGCATACCGCCTGGGGAGTACGGTCGCAAGATTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCACGTGGTTTAATTCGATGCAAACCGAAGAACCTTACCTGGGCTTGACATGCAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTATTGCCAGTTGCCACTCAGGCGAGACTGCCGCCGACAAGGTGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTATGCCCAGGGCCACACACATGCTACAATGGCCGGTACAAAGGGAAGCGAGGCTGCGAAGCGGAGCGAACCCCA-AAAGCCGGTCCCAGTTCGGATTGCAGTCTGCAACTCGACTGCATGAAGTTGGAATCGCTAGTAATCGCGAATCAG-AAGTCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATCCGAGTTGGATGCACTCCAAGTCGGCGCCCAAAGTGTGTCTGGTGAGGAGGGTGAAGTCGTAACAAGGTAGCCGT
+>484437 study_id=40682 non_ACGT_percent=0.0000 decision=named_isolate
+AACGAACGCTGGCGGCGCGTCTTAAGCATGCAAGTCGAACGGAGTGGCGGACTGGTGAGGAACACGTGGGTAATCTACCCTTAAGATGGGGATAGCTGCTAGAAATAGCAGGTAATACCGAATACTTGAGGATGAGCTTGCGTCCCATTAGCTAGTTGGTGAGGTAAAGGCCCACCAAGGCGACGATGGGTATCCGGCCTGAGAGGGTGATCGGACACATTGGGACTGAGATACGGCCCAAACTCCTACGGGAGGCAGCAGCTAAGAATATTCCGCAATGGACGGAAGTCTGACGGAGCGACGCCGCGTGGATGAAGAAGGCTGAAAAGTTGTAAAATCCTTTTGTTGATGAAGCGGTAATCG-CGAATAAGCCCCGGCTAAT-TACGTGCCAGCAGCCGCGGTAACACGTAAGGGGCGAGCGTTGTTCGGAATTATTGGGCGTAAAGGGCATGTAGGCGGTTATGTAAGCCTGGTGTGAAATCCTGGGGCTTAACCCTAGAATAGCATTGGGTACTGTATAACTTGAATTACGGAAGGGAAACTGGAATTCCAAGTGTAGGGGTGGAATCTGTAGATATTTGGAAGAACACCGGTGGCGAAGGCGGGTTTCTGGCCGATAATTGACGCTGAGATGCGAAAGTGTGGGGATCGAACAGGATTAGATACCCTGGTAGTCCACACTGTAAACGATGTACACTAGGTGTTGGGCAGTGCCAAAGCAAACGCGATAAGTGTACCGCCTGGGGAGTATGCCCGCAAGGGTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGGTACGCGAGGAACCTTACCTGGGTTTGACATCCAGGTGCTGCATGGCTGTCGTCAGCTCGTGCCGTGAGGTGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTACTGCCAGTTACGACTCTGGCGGAACTGCCGATGACAAATCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTATGTCCAGGGCTACACACGTGCTACAATGGTTGCTACAAAGCGAAGCGAGACCGTAAGG-GGAGCAAACCGCAAAAAAGCAATCGTAGTTCGGATTGAAGTCTGAAACTCGACTTCATGAAGTTGGAATCGCTAGTAATCGCGCATCAGCACGGCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATCCGAGTTGGGGGTACCCGAAGTCGCTGCCGAAGGTACGCTTGGTGAGGAGGGTGAAGTCGTAACAAGGTAGCCGT
+>484436 study_id=40695 non_ACGT_percent=0.0000 decision=named_isolate
+ATTGAACGCTGGCGGCAGGCTTAACACATGCAAGTCGAACGAAGTGGCGGACGGGTGAGTAACATTTAGGA-ATCTGCCTAGTAGTGGGGGATAGCTCGGGGAAACTCGAATTAATACCGCATACTATTAGATGAGCCTAAATCAGATTAGCTAGTTGGTGGGGTAAAGGCCC-CCAAGGCGACGATCTGTAACTGGTCTGAGAGGATGATCAGTCACACCGGAACTGAGACACGGTCCGGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGGGCAACCCTGATCCAGCCATGCCGCGTGTGTGAAGAAGGCCTTTTGGTTGTAAAGCACTTTAAGCAGGGAGGCGTTACCTGCAGAATAAGCACCGGCTAAC-TCTGTGCCAGCAGCCGCGGTAATACAGAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGAGTGTAGGTGGCTCATTAAGTCACATGTGAAATCCCCGGGCTTAACCTGGGAACTGCATGTGATACTGGTGGGCTAGAATATGTGAGAGGGAAGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGATGGCGAAGGCAGCTTCCTGGCATAATATTGACACTGAGATTCGAAAGCGTGGGTAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGTCTACTAGCCGTTGGGTAGTGGCGCAGTTAACGCGATAAGTAGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTGGTCTTGACATACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTTTCCTTATTTGCAACTTTAAGGATACTGCCAGTGACAAACTGGAGGAAGGCGGGGACGACGTCAAGTCATCATGGCCCTTACGACCAGGGCTACACACGTGCTACAATGGTAGGTACAGAGGGTTGCTACACAGCGATGTGATGCTAATCTCAAAAAGCCTATCGTAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGTCGGAATCGCTAGTAATCGCAGATCAG-ATGCTGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTCTATTGCACCAGAAGTAGGTTACCACGGTGTGGTCGATGACTGGGGTGAAGTCGTAACAAGGTAGCCGT
+>484430 study_id=40682 non_ACGT_percent=0.0000 decision=named_isolate
+AGTGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAACGGAGTGGCGCACGGGTGAGTAATATATAGCTAATCTGCCCCTTGCTGGAGGACAACAGTTAGAAATGACTGCTAATACTCCATAGCAAGGGATGAGACTATATCGTATCAGCTAGTCGGTGGGGTAACGGCCTACCGAGGCTATGACGCGTAACTGGTCTGAGAGGATGATCAGTCACATTGGAACTGAGACACGGTCCAAACTCCTACGGGAGGCAGCAGTAGGGAATATTGCGCAATGGGGGAAACCCTGACGCAGCAACGCCGCGTGGAGGATGACACTTTTCGGAGCGTAAACTCCTTTTGTTAGGGAAGCGGTACCTAACGAATAAGCACCGGCTAAC-TCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTACTCGGAATCACTGGGCGTAAAGGACGCGTAGGCGGATTATCAAGTCTCTTGTGAAATCTAACGGCTTAACCGTTAAACTGCTTGGGAAACTGATAATCTAGAGTAAGGGAGAGGCAGATGGAATTCTTGGTGTAGGGGTAAAATCCGTAGATATCAAGAAGAATACCTATTGCGAAGGCGATCTGCTGGAACTTAACTGACGCTAATGCGTGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCCTAAACGATGTATACCGGTTGTTGCTCAGTAATCCACCTAACGGATTAAGTATACCGCCTGGGGAGTACGGTCGCAAGATTAAAACTCAAAGGAATAGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGATACGCGAAGAACCTTACCCGGACTTGATATCCAGGTGCTGCACGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCACGTCATTAGTTGCCACTCTAATGAGACTGCCTTCG-TAAGGAGGAGGAAGGTGTGGACGACGTCAAGTCATCATGGCCCTTATGTCCGGGGCGACACACGTGCTACAATGGCATATACAATAAGACGCAATATCGTAAGATGGAGCAAATCTAA-AAAATATGTCCCAGTTCGGATTGGAGTCTGCAACTCGACTCCATGAAGCCGGAATCGCTAGTAATCGTAGATCAGCATGCTACGGTGAATACGTTCCCGGGTCTTGTACTCACCGCCCGTCACACCATGGGAGTTGATTTCACTCGAAGCGGGCCTCCACAGTGGAATCAGCGACTGGGGTGAAGTCGTAACAAGGTAACCGT
+>484425 div_ratio=1.104 study_id=37832 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTAGCGACAGGCTTAACACATGCAAGTCGAGGG-ACCGGCGCACGGGTGAGTAACGCGTATGCAACTTGCCTATCAGAGGGGGATAACCCGGCGAAAGTCGGACTAATACCGCATGCTGATAGATAGGCATGCGTTCCATTAGGCAGTTGGCGGGGTAACGGCCCACCAAACCGACGATGGATAGGGGTTCTGAGAGGAAGGTCCCCCACATTGGTACTGAGACACGGACCAAACTCCTACGGGAGGCAGCAGTGAGGAATATTGGTCAATGGCCGAGAGGCTGAACCAGCCAAGTCGCGTGAGGGATGAAGGTTTATGGATCGTAAACCTCTTTTATAAGGGAATATGTACCTTATGAATAAGGATCGGCTAAC-TCCGTGCCAGCAGCCGCGGTAATACGGAGGATCCGAGCGTTATCCGGATTTATTGGGTTTAAAGGGTGCGTAGGCGGCCTTTTAAGTCAGCGGTGAAAGTCTGTGGCTCAACCATAGAATTGCCGTTGAAACTGGGGGGCTTGAGTATGTTTGAGGCAGGCGGAATGCGTGGTGTAGCGGTGAAATGCATAGATATCACGCAGAACCCCGATTGCGAAGGCAGCCTGCCAAGCCATGACTGACGCTGATGCACGAAAGCGTGGGGATCAAACAGGATTAGATACCCTGGTAGTCCACGCAGTAAACGATGATCACTAGCTGTTTGCAAGCGGCACAGCGAAAGCGTTAAGTGATCCACCTGGGGAGTACGCCGGCAACGGTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGAGGAACATGTGGTTTAATTCGATGATACGCGAGGAACCTTACCCGGGTTTGAACGCGAGGTGCTGCATGGTTGTCGTCAGCTCGTGCCGTGAGGTGTCGGCTTAAGTGCCATAACGAGCGCAACCCTTGCCACTAGTTACGACTCTGGTGGGACTGCCAGCG-TAAGCTGGAGGAAGGCGGGGATGACGTCAAATCAGCACGGCCCTTACATCCGGGGCGACACACGTGTTACAATGGCGTGGACAAAGGGAGGCCACCTGGCGACAGGGAGCGAATCCCC-AAACCACGTCTCAGTTCGGATCGGAGTCTGCAACCCGACTCCGTGAAGCTGGATTCGCTAGTAATCGCGCATCAGCATGGCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCAAGCCATGGGAGCCGGGGGTACCTGAAGTCCGGGCCTAGGGTAAAACTGGTGACTGGGGCTAAGTCGTAACAAGGTAGCCGT
+>484424 study_id=37831 non_ACGT_percent=0.0000 decision=named_isolate
+GACGAACGCTGGCGGCGTGCC-AATACATGCAAGTCGAGCGAAGCGGCGGATGGGTGAGTAACACGTGGGGAACCTGCCCCATAGTCTGGGATACCACTTGGAAACAGGTGCTAATACCGGATACTATGGGATGGCCCCGCGGTGCATTAGCTAGTTGGTAAGGTAAAGGCTTACCAAGGCGATGATGCATAGCCGAGTTGAGAGACTGATCGGCCACATTGGGACTGAGACACGGCCCAAACT-CTACGGGAGGCAGCAGTAGGGAATCTTCCACAATGGACGCAAGTCTGATGGAGCAACGCCGCGTGAGTGAAGAAGGTTTTCGGATCGTAAAGCTCTGTTGTTGGTGAAGCGGTAATCAACCAGAAAGTCACGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTGTCCGGATTTATTGGGCGTAAAGCGAGCGCAGGCGGAAGAATAAGTCTGATGTGAAAGCCCTCGGCTTAACCGAGGAACTGCATCGGAAACTGTTTTTCTTGAGTGCAGAAGAGGAGAGTGGAACTCCATGTGTAGCGGTGGAATGCGTAGATATATGGAAGAACACCAGTGGCGAAGGCGGCTCTCTGGTCTGCAACTGACGCTGAGGCTCGAAAGCATGGGTAGTGAACAGGATTAGATACCCTGGTAGTCCATGCCGTAAACGATGAGTGCTAAGTGTTGGGCAGTGCTGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGC-GTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATCCAGGTGGTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTTATTAGTTGCCACTCTAATGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGCCCCTTATGACCTGGGCTACACACGTGCTACAATGGGCAGTACAACGAGAAGCGAGCCTGCGAAGGCAAGCGAATCTCTGAAAGCTGTTCTCAGTTCGGACTGCAGTCTGCAACTCGACTGCACGAAGCTGGAATCGCTAGTAATCGCGGATCAG-ACGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTCTGCAATGCCCAAAGCCGGCGTCTAAGGCAGGGCAGATGACTGGGGTGAAGTCGTAACAAGGTAGCCGT
+>484408 study_id=37830 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTGACAGAATGCTTAACACATGCAAGTCAACTTGGGTGGCGGACGGGTGAGTAACGCGTAAAGAACTTGCCTCACAGCTAGGGACAACATTTGGAAACGAATGCTAATACCTAATACTGTGAGAGAGCTTTGCGTCCCATTAGCTAGTTGGAGAGGTAACGGCTCACCAAGGCGATGATGGGTAGCCGGCCTGAGAGGGTGATCGGCCACAAGGGGACTGAGACACGGCCCTTACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGACCAAAGTCTGATCCAGCAATTCTGTGTGCACGATGAAGTTTTTCGGAATGTAAAGTGCTTTCAGTTGGGAAGCGGTACCAACAGAAGAAGTGACGGCTAAA-TACGTGCCAGCAGCCGCGGTAATACGTATGTCACGAGCGTTATCCGGATTTATTGGGCGTAAAGCGCGTCTAGGTGGTTATGTAAGTCTGATGTGAAAATGCAGGGCTCAACTC--GTATTGCGTTGGAAACTGTATAACTAGAGTACTGGAGAGGTAAGCGGAACTACAAGTGTAGAGGTGAAATTCGTAGATATTTGTAGGAATGCCGATGGGGAAGCCAGCTTACTGGACAGATACTGACGCTGAAGCGCGAAAGCGTGGGTAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGATTACTAGGTGTTGGGCAGCGCCCAAGCAAACGCGATAAGTAATCCGCCTGGGGAGTACGTACGCAAGTATGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGACGCAACGCGAGGAACCTTACCAGCGTTTGACATCCAGGTGGTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTTTCGTATGTTACGACTCATGCGATACTGCCTACGATGAGTAGGAGGAAGGTGGGGATGACGTCAAGTCATCATGCCCCTTATACGCTGGGCTACACACGTGCTACAATGG-GTAGACAGAGAGTCGCAAAGCTGTGAAGTGGAGCTAATCTCA-GAAAACTATCTTAGTTCGGATTGTACTCTGCAACTCGAGTACATGAAGTTGGAATCGCTAGTAATCGCGAATCAGCATGTCGCGGTGAATACGTTCTCGGGTCTTGTACACACCGCCCGTCACACCACGAGAGTTGGTTGCACCTGAAGTAGCCTCCGAGGGTGTGATTAGCGATTGGGGTGAAGTCGTAACAAGGTATCCGT
+>484407 study_id=38100 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTGGCGGCGCGCCTAACACATGCAAGTCGAACG-AGTGGCGAACGGGTGAGTAACACGTGACCAACCCGCCCCCCC-ACCGGGACAACCTCGGGAAACCGAGGCTAATACCGGATAGGAGGGGACGGGGTCGCGGCCCATCAGGTAGACGGCGGGGCGAAGGCCCGCCGTGCCGACGACGGGTAGCCGGGCTGAGAGGCCGATCGGCCACATTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCGCAATGGGCGAAAGCCTGACGCAGCGACGCCGCGTGCGGGAAGGAGGCCTTCGGGTCGTAAACCGCTTTCAGCAGGGAAGCGGTACCTGCAGAAGAAGCCCCGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCGAGCGTTATCCGGATTCATTGGGCGTAAAGCGCGCGCAGGCGGCCCGCCAAGCGGCCTCTCGAAGCCGGGGGCTCAACCCCCGGAAGCGACCCGA-ACTGGC-GGCTCGAGTGGGGCAGGGGAGGATGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCGACGGCGAAGGCAGCCCTCTGGGCCTTCACTGACGCTGAGGCGCGAAAGCTGGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCCAGCCGTAAACGATGGGCGCTAGGTGCGGGGCCGTGCCGCAGCCAACGCATTAAGCGCCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCAGCGGAGCATGTGGCTTAATTCGAAGCAACGCGAAGAACCTTACCAGGGCTTGACATGCAGGTGGTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCCGCCGCATGTTGCCACTCATGCGGGACCGCCGGCGCCAAGCCGGAGGAAGGCGGGGACGACGTCAAGTCATCATGCCCCCCATGCCCTGGGCCGCACACGTGCTACAATGGCCGGCACAGCGGGCAGCGGACCCGCGAGGGCGAGCGAATCCCTTAAAGCCGG-CCCAGTTCGGATCGGAGGCTGCAACCCGCCTCCGTGAAGCCGGAGTTG..................................................................................................................................................
+>484406 study_id=38100 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTGGCGGCGCGCCTAACACATGCAAGTCGAAGGTAGTGGCGAACGGGTGAGTAACACGTGACCAACCCGCCCCCCCCACCGGGACAACCTCGGGAAACCGAGGCTAATACCGGATAGGAGGGGACGGGGTCGCGGCCCATCAGGTAGACGGCGGGGCGAAGGCCCGCCGTGCCGACGACGGGTAGCCGGGCTGAGAGGCCGATCGGCCACATTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCGCAATGGGGGGAACCCTGACGCAGCGACGCCGCGTGCGGGAAGGAGGCCTTCGGGTCGTAAACCGCTTTCAGCAGGGAAGCGGTACCTGCAGAAGAAGCCCCGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCGAGCGTTATCCGGATTCATTGGGCGTAAAGCGCGCGCAGGCGGCCCGCCAAGCGGCCTCTCGAAGCCGGGGGCTCAACCCCCGGAAGCGACCCGA-ACTGGCGGGCTCGAGTGGGGCAGGGGAGGATGGAATTCCCGGTGTAGCGGTGAAATGCGCAGATATCGGGAGGAACACCGACGGCGAAGGCAGCCCTCTGGGCCTTCACTGACGCTGAGGCGCGAAAGCTGGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCCAGCCGTAAACGATGGGCGCTAGGTGCGGGGCCGTGCCGCAGCCAACGCATTAAGCGCCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCAGCGGAGCATGTGGCTTAATTCGAAGCAACGCGAAGAACCTTACCAGGGCTTGACAT-CAGGTGGTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCCGCCGCATGTTGCCACTCATGCGGGACCGCCGGCGCCAAGCCGGAGGAAGGCGGGGACGACGTCAAGTCATCATGCCCC--ATGCCCTGGGCCGCACACGTGCTACAATGGCCGGCACAGCGGGCAGCGGACCCGCGAGGGCGAGCGAATCCCTTAAAGCCGGCCCCAGTTCGGATCGGAGGCTGCAACCCGCCTCCGTGAAGCCGGAGTTGCTAGTAATCGCGGATCAGCACGCCGCGGTGAATGCGTTCCCGGGCCTTGTACACACCGCCCGTCACACCACCCGAGTCGTCTGCACCCGAAGCCGCCGTCGAAGGTGTGGAGGGTGAGGGGGGTGAAGTCGTAACAAGGTAGCCGT
+>484401 study_id=38100 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTGGCTACAGGCTTAACACATGCAAGTCGAGGG-ACCGGCGCACGGGTGAGTAACGCGTATCCAACCTGCCTCTGACTGAGGGATAACCCGTCGAAAGTCGGCCTAATACCTCATGGTCAGGGATGGGGATGCGTCTGATTAGCTTGTTGGCGGGGTAACGGCCCACCAAGGCTACGATCAGTAGGGGTTCTGAGAGGAAGGTCCCCCACATTGGAACTGAGACACGGTCCAAACTCCTACGGGAGGCAGCAGTGAGGAATATTGGTCAATGGGCGAGAGCCTGAACCAGCCAAGTAGCGTGCAGGAAGACGGCCTATGGGTTGTAAACTGCTTTTATGCGGGGATAGGTACCGCATGAATAAGGACCGGCTAAT-TCCGTGCCAGCAGCCGCGGTAATACGGAAGGTCCGGGCGTTATCCGGATTTATTGGGTTTAAAGGGAGCGTAGGCCGTGGATTAAGCGTGTTGTGAAATGCAGGTGCTCAACGTCTGCACTGCAGCGCGAACTGGTCCACTTGAGTGTGCGCAACGCAGGCGGAATTCGTCGTGTAGCGGTGAAATGCTTAGATATGACGAAGAACTCCGATTGCGAAGGCAGCTTGCGGGAGCACAACTGACGCTGAAGCTCGAAAGTGCGGGTATCGAACAGGATTAGATACCCTGGTAGTCCGCACGGTAAACGATGGATGCCC-GTTTCAGGGGT-GACCAAGCGAAAGCATTAAGCATCCCACCTGGGGAGTACGCCGGCAACGGTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGAGGAACATGTGGTTTAATTCGATGATACGCGAGGAACCTTACCCGGGCTTGAATTGAAGGTGCTGCATGGTTGTCGTCAGCTCGTGCCGTGAGGTGTCGGCTTAAGTGCCATAACGAGCGCAACCCCTTTCTTCAGTTGCCACTCTGTAGATACTGCCACCG-CAAGGTGGAGGAAGGTGGGGATGACGTCAAATCAGCACGGCCCTTACGTCCGGGGCTACACACGTGTTACAATGGCCGGTACAGAGAGTTGATTTTGTGCAAACACGATCTAATCCTT-AAATCCGGTCCCAGTTCGGACTGGGGTCTGCAACCCGACCCCACGAAGCTGGATTCGCTAGTAATCGCGCATCAGCATGGCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCAAGCCATGAAAGCCGGGGGTGCCTGAAGTCTGGGCCTAGGGCAAAACCGGTGATTGGGGCTAAGTCGTAACAAGGTAGCCGT
+>484394 div_ratio=1.098 study_id=38100 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTGGCGGCGTGCCTAACACATGCAAGTCGAACGGAGTGGCGGACGGGTGAGTAACACGTGGGCAACCTGGCTCATAGAGGGGGATAACAGAGAGAAATTTCTGCTAATACCGCATACTATGAGATGGACCCGCGTCTGATTAGCCAGTTGGCAGGGTAAGAGCCTACCAAAGCGACGATCAGTAGCCGATCTGAGAGGATGAACGGCCACATTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCAGCAGTGGGGGATATTGCACAATGGGGGGAACCCTGATGCAGCGACGCCGCGTGAGTGAAGAAGTATTTCGGTATGTAAAGCTCTATCAGCAGGGAAGCAGTACCTGAATAAGAAGCCCCGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCAAGCGTTATCCGGATTTACTGGGTGTAAAGGGAGCGTAGACGGAATGGCAAGTCTGAAGTGAAATGCCCGGGCTCAACCCGGGAACTGCTTTGGAAACTGTCGATCTGGAGTGTTGGAGAGGTAAGTGGAATTCCTGGTGTAGCGGTGAAATGCGTAGAGATCAGGAAGAACACCGGAGGCGAAGGCGGCTTACTGGACAAAGACTGACGTTGAGGCTCGAAAGCGTGGGAAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAATACTAGGTGTCGGTCGGTGCCGACGCAAACGCAATAAGTATTCCACCTGGGGAGTACGTTCGCAAGAATGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGAGATCCAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATCGTCAGTAGCCACTCTGATGAGACTGCCGGGGATAACCCGGAGGAAGGCGGGGATGACGTCAAATCATCATGCCCCTTATGACCTGGGCGACACACGTGCTACAATGGCGGAAACAGAGGGAAGCGAGGGGGCGACCCGGAGCAAATCTCAAAAATACCGTCTCAGTTCGGACTGCAGTCTGCAACTCGACTGCACGAAGCCGGAATCGCTAGTAATCGCGGATCAG-ATGCCGCGGTGAATCCGTTCCCGGGTCTTGTACACACCGCCCGTCACACCATGGGAGTCGGTAATGCCCGAAGTCAGTGCCGAAGG-AGGACAGATAACTGGGGTGAAGTCGTAACAAGGTAGCCGT
+>484391 study_id=39086 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTGGCGGCGTGCC-AATACATGCAAGTCGAACGCAGTGGCGAACGGGTGAGTAACACGTGGGTAACCTACCTCTTAGCAGGGGATAACATTTGGAAACAAGTGCTAATACCGTATACTAAGAGATGGACCCGCGGTGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCAATGATGCATAGCCGAGTTGAGAGACTGATCGGCCACAATGGGACTGAGACACGGCCCATACT-CTACGGGAGGCAGCAGTAGGGAATCTTCCACAATGGGCGCAAGCCTGATGGAGCAACGCCGCGTGTGTGATGAAGGGTTTCGGCTCGTAAAACACTGTTATAAGAGAAGCGGTATCTTACCAGAAAGGAACGGCTAAA-TACGTGCCAGCAGCCGCGGTAATACGTATGTTCCAAGCGTTATCCGGATTTATTGGGCGTAAAGCGAGCGCAGACGGTTATTTAAGTCTGAAGTGAAAGCCCTCAGCTCAACTGAGGAATGGCTTTGGAAACTGGATGACTTGAGTGCAGTAGAGGAAAGTGGAACTCCATGTGTAGCGGTGAAATGCGTAGATATATGGAAGAACACCAGTGGCGAAGGCGGCTTTCTGGACTGTAACTGACGTTGAGGCTCGAAAGTGTGGGTAGCAAACAGGATTAGATACCCTGGTAGTCCACACCGTAAACGATGAGTGCTAGATGTTCGAGAGTGTCGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGACCCGCACAAGC-GTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATCCAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATTATTAGTTGCCACTCTAGTGAGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGACCTGGGCTACACACGTGCTACAATGGCATATACAACGAGTCGCCAACCCGCGAGGGTGCGCTAATCTCTTAAAGTATGTCTCAGTTCGGATTGTAGGCTGCAACTCGCCTACATGAAGTCGGAATCGCTAGTAATCGCGGATCAG-ACGCCGCGGTGAATACGTTCCCGGGTCTTGTACACACCGCCCGTCACACCATGAGAGTTTGTAACACCCAAAGCCGGCGTCTAAGGTGGGACAGATGATTAGGGTGAAGTCGTAACAAGGTAGCCGT
+>484379 study_id=39086 non_ACGT_percent=0.0000 decision=named_isolate
+GACGAACGCTGGCGGCGTGCCTAATACATGCAAGTAGAACGCAGTTGCGAACGGGTGAGTAACGCGTAGGTAAC-TGCCTGGTAGCGGGGGATAACTATTGGAAACGATAGCTAATACCGCATACTACCAGATGGACCTGCGTTGTATTAGCTAGTTGGTGGGGTAAGGGCTCACCAAGGCGACGATACATAGCCGACCTGAGAGGGTGATCGGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCGGCAATGGACGGAAGTCTGACCGAGCAACGCCGCGTGAGTGAAGAAGGTTTTCGGATCGTAAAGCTCTGTTGTAAGAGAAGCGGTATCTTACCAGAAAGGGACGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGTCCCGAGCGTTGTCCGGATTTATTGGGCGTAAAGCGAGCGCAGGCGGTTAGATAAGTCTGAAGTTAAAGGCTGTGGCTTAACCATAGTA-GGCTTTGGAAACTGTTTAACTTGAGTGCAAGAGGGGAGAGTGGAATTCCATGTGTAGCGGTGAAATGCGTAGATATATGGAGGAACACCGGTGGCGAAAGCGGCTCTCTGGCTTGTAACTGACGCTGAGGCTCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCTGTAAACGATGAGTGCTAGGTGTTAG-TAGTGCCGTAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATCCAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTATTGTTAGTTGCCACTCTAGCGAGACTGCCGGTAATAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGACCTGGGCTACACACGTGCTACAATGGCTGGTACAACGAGTCGCAAGCCGGTGACGGCAAGCTAATCTCTTAAAGCCAGTCTCAGTTCGGATTGTAGGCTGCAACTCGCCTACATGAAGTCGGAATCGCTAGTAATCGCGGATCAGCACGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCACGAGAGTTTGTAACACCCGAAGTCGGCGCCTAAGGTGGGATAGATGATTGGGGTGAAGTCGTAACAAGGTAGCCGT
+>484376 study_id=39086 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGAAGCGGGG-ACGGGTGAGTAACACGTGGATAACCTCCT-ATAAGACTGGGATAACTTCGGGAAACCGGAGCTAAACCGG-ATACTTATAGATGGATCCGCGCCGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCAACGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGGCGAAAGCCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTCTTCGGATCGTAAAACTCTGTTATTAGGGAAGCGGTACCTAATCAGAAAGCCACGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTATCCGGAATTATTGGGCGTAAAGCGCGCGTAGGCGGTTTTTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAG-GGCATTGGAAACTGGAAAACTTGAGTGCAGAAGAGGAAAGTGGAATTCCATGTGTAGCGGTGAAATGCGCAGAGATATGGAGGAACACCAGTGGCGAAGGCGACTTTCTGGTCTGTAACTGACGCTGATGTGCGAAAGCGTGGGGATCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAAGTGTTAGGTAGTGCTGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAAATCTTGACATCCAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTAAGCTTAGTTGCCACTCTAAGTTGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGATTTGGGCTACACACGTGCTACAATGGACAATACAAAGGGCAGCGAA-CCGCGAGGTCAAGCAAATCCCATAAAGTTGTTCTCAGTTCGGATTGTAGTCTGCAACTCGACTATATGAAGCTGGAATCGCTAGTAATCGTAGATCAGCATGCTACGGTGAATACGTTCCCGGGTCTTGTACACACCGCCCGTCACACCACGAGAGTTTGTAACACCCGAAGCCGGCGTCGAAGGTGGGACAAATGATTGGGGTGAAGTCGTAACAAGGTAGCCGT
+>484369 study_id=39086 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTGGCGGCGTGCCTAATACATGCAAGTCGAGCGAAGCGGGG-ACGGGTGAGTAACACGTGGATAACCTCCT-ATAAGACTGGGATAACTTCGGGAAACCGGAGCTAAACCGG-ATACTTATAGATGGATCCGCGCCGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCAACGATGCGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGGCGAAAGCCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTCTTCGGATCGTAAAACTCTGTTATTAGGGAAGCGGTACCTAATCAGAAAGCCACGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTATCCGGAATTATTGGGCGTAAAGCGCGCGTAGGCGGTTTTTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAG-GGCATTGGAAACTGGAAAACTTGAGTGCAGAAGAGGAAAGTGGAATTCCATGTGTAGCGGTGAAATGCGCAGAGATATGGAGGAACACCAGTGGCGAAGGCGACTTTCTGGTCTGTAACTGACGCTGATGTGCGAAAGCGTGGGGATCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAAGTGTTAGGTAGTGCTGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAAATCTTGACATCCAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTAAGCTTAGTTGCCACTCTAAGTTGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGATTTGGGCTACACACGTGCTACAATGGACAATACAAAGGGTGGCGAA-CCGCGAGGTCAAGCAAATCCCATAAAGTTGTTCTCAGTTCGGATTGTAGTCTGCAACTCGACTACATGAAGCTGGAATCGCTAGTAATCGTGGATCAGCATGCCACGGTGAATACGTTCCCGGGTCTTGTACACACCGCCCGTCACACCACGAGAGTTTGTAACACCCGAAGCCGGCGTCGAAGGTGGGACAAATGATTGGGGTGAAGTCGTAACAAGGTAGCCGT
+>484365 study_id=39086 non_ACGT_percent=0.0000 decision=named_isolate
+..........................................AGCGGGG-ACGGGTGAGTAACACGTGGATAACCTCCT-ATAAGACTGGGATAACTTCGGGAAACCGGAGCTAAACCGG-ATACTTATAGATGGATCCGCGCTGCATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCAACGATGCATAGCCGACCTGAGAGGGTGATCGGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGGCGAAAGCCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTCTTCGGATCGTAAAACTCTGTTATTAGGGAAGCGGTACCTAATCAGAAAGCCACGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTATCCGGAATTATTGGGCGTAAAGCGCGCGTAGGCGGTTTTTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAG-GGCATTGGAAACTGGAAAACTTGAGTGCAGAAGAGGAAAGTGGAATTCCATGTGTAGCGGTGAAATGCGCAGAGATATGGAGGAACACCAGTGGCGAAGGCGACTTTCTGGTCTGTAACTGACGCTGATGTGCGAAAGCGTGGGGATCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAAGTGTTAGGTAGTGCTGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAAATCTTGACATCCAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTAAGCTTAGTTGCCACTCTAAGTTGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGATTTGGGCTACACACGTGCTACAATGGACAATACAAAGGGCAGCGAA-CCGCGAGGTCAAGCAAATCCCATAAAGTTGTTCTCAGTTCGGATTGTAGTCTGCAACTCGACTACATGAAGCTGGAATCGCTAGTAATCGTAGATCAGCATGCTACGGTGAATACGTTCCCGGGTCTTGTACACACCGCCCGTCACACCACGAGAGTTTGTAACACCCGAAGCCGGCGTCGAAGGTGGGACAAATGATTGGGGTGAAGTCGTAACAAGGTAGCCGT
+>484357 study_id=38100 non_ACGT_percent=0.0000 decision=named_isolate
+GACGAACGCTGGCGGCGCGCTTAACACATGCAAGTCGTGCGAAGCGGCGGACGGGTGAGTAACACGTGAGT-AGCTGTCCTAAGGAGGGGGATAACGCCTGGAAACGGGTGCTAAAACCCCATACTAACCTGTGTGCTCGCGGCCTATCAGCTAGTTGGTGAGGTAACGGCTCACCAAGGCTAAGACGGGTAGCCGGCCTGAGAGGGTGTACGGCCACACTGGAATTGAGATACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATCTTGGGCAATGGGCGAAAGCCTGACCCAGCGACGCCGCGTTGGGGATGAAGCCCTTCGGGGTGTAAACCCATGTTGTAGGGGACGCGGTACCCTACGAGGAAGCCCCGGCTAAC-TACGTGCCAGCAGCCGCGGTAAGACGTAGGGGGCAAGCGTTGTCCGGAATTACTGGGCGTAAAGGGCACGCAGGCGGTGCGCCAAGTCGAGGGTGTAAAGTTACGGCTCAACCGTGACATTGCAATCGATACTGGCGCGCTGGAGTGCGGGAGAGGGAAGTGGAATTCCCGGTGTAGCGGTGAAATGCGTAGATATCGGGAGGAACGCCAGTGGCGAAGGCGGCTTCCTGGCCCGCGACTGACGCTCATGTGCGAAAGCCAGGGGAGCGAACCGGATTAGATACCCGGGTAGTCCTGGCCGTAAACGATGGGTGCTAGGTGTAGGCCTGTGCCGCAGTTAACGCGATAAGCACCTCGCCTGGGGAGTACGGTCGCAAGGCTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCACGTGGTTTAATTCGATGCAAACCGAAGAACCTTACCTGGGTTTGACATGCAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTGCGCCTAGTTGCCAC-TCTAGGCGGACGCCGGCGACAAGTCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCTTTAAGCCCAGGGCGACACACGTGCTACAATGGCCAGCACAGAGGGCGGCAAGTCCGCGAGGGCAAGCGAATCCCTTAAAGCTGGTCTTAGTTCGGATCGCAGTCTGCAACCCGACTGCGTGAAGCCGGAATCGCTAGTAATCGCCGGTCAGCATACGGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCACCCGAGTTGGGTGCTCCCGAAGCCGCCGTCGAAGGAGTGTCTGATAAGGGGGGTGAAGTCGTAACAAGGTAGCCGT
+>484347 div_ratio=1.058 study_id=38595 non_ACGT_percent=0.0000 decision=named_isolate
+................................................................................................................................................................GGGTAAGTGGCTCACCAAGGCGACGATCCCTAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGCCTTAGGGTTGTAAAGTACTTTCAGTTGGGAGGCGTTACCAACAGAAGAAGCACCGGCTAAC-TCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTTGATTAAGTTAGATGTGAAATCCCCGGGCTTAACCTGGGAATGGCATCTAAGACTGGTCAGCTAGAGTCTTGTAGAGGGGGGTAGAATTCCATGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACAAAGACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCTGTAAACGATGTCGATTTGGAGGTTGTGGCTTCCGGAGCTAACGCGTTAAATCGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTACTCTTGACATCCAGGTGCTGCATGGCTGTCGTCAGCTCGTGTTGTGAAATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATCCTTTGTTGCAACTCAAAGGAGACTGCCGGTGATAAACCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTACGAGTAGGGCTACACACGTGCTACAATGGCGTATACAAAGAGAAGCGACCTCGCGAGAGCAAGCGGAACTCATAAAGTACGTCGTAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGTCGGAATCGCTAGTAATCGTAGATCAG-ATGCTACGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTGGGTTGCAAAAGAAGTAGGTTACCACTTTGTGATTCATGACTGGGGTGAAGTCGTAACAAGGTAACCGT
+>484343 study_id=38595 non_ACGT_percent=0.0000 decision=named_isolate
+...............................................................GTATGGGG-ATCTGCCCGATAGAGGGGGATAACTACTGGAAACGGTAGCTAATACCGCATACTATCGGATGAACCCATATGGGATTAGCTAGTAGGTGAGGTAATGGCTCACCTAGGCGACGATCCCTAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGCCCTAGGGTTGTAAAGTACTTTCAGTCGGGAGGCGTTACCGACAGAAGAAGCACCGGCTAAC-TCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTTGATTAAGTTAGATGTGAAATCCCCGGGCTTAACCTGGGAATGGCATCTAAGACTGGTCAGCTAGAGTCTTGTAGAGGGGGGTAGAATTCCATGTGTAGCGGTGAAATGCGTAGAGATGTGGAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACAAAGACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCTGTAAACGATGTCGATTTGAAGGTTGTGGCTTTCGGAGCTAACGCGTTAAATCGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTACTCTTGACATCCAGGTGCTGCATGGCTGTCGTCAGCTCGTGTTGTGAAATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATCCTTTGTTGCAACTCAAAGGAGACTGCCGGTGATAAACCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTACGAGTAGGGCTACACACGTGCTACAATGGCGTATACAAAGAGAAGCGACCTCGCGAGAGCAAGCGGAACTCATAAAGTACGTCGTAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGTCGGAATCGCTAGTAATCGTAGATCAG-ATGCTACGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTGGGTTGCAAAAGAAGTAGGTTACCACTTTGTGATTCATGACTGGGGTGAAGTCGTAACAAGGTAACCGT
+>484338 study_id=38100 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTGGCTACAGGCTTAACACATGCAAGTCGTGGG-ACCGGCGCACGGGTGAGTAACGCGTACCGAACCTGCCCATCACACAGGGATAGGCTTGCGAAAGCAAGATTAATACT-GATGGTGATGGATGGCGGTGCGTCCCATTAGGACGTTGGCGGGGTAACGGCCCACCAATCCTTCGATGGGTAGGGGTTCTGAGAGGAAGGTCCCCCACATTGGAACTGAGATACGGTCCAAACTC-TACGGGAGGCAGCAGTGAGGAATATTGGTCAATGGGCGAGAGCCTGAACCAGCCAAGTAGCGTGCGGGATGAAGGCCTTGTGGTCGTAAACCGCTTTTATCAGTGAATAGGTAGCTGAAGAAAAAGGACCGGCTAAT-TCCGTGCCAGCAGCCGCGGTAATACGGAAGGTCCGGGCGTTATCCGGAATTATTGGGTTTAAAGGGAGCGCAGGCGG-GAGTTAAGTCAGCTGTTAAATATCAGAGCCCAACTCTGTTAT-GCAGTTGAAACTATATTTCTTGAGTACGCACAGGGATGGCGGAATTCAGGGTGTAGCGGTGAAATGCTTAGATATCCTGAAGAACTCCGATCGCGAAGGCAGCCATCCGGAGCGTAACTGACGCTGAGGCTCGAAGGTGCGGGTATCGAACAGGATTAGATACCCTGGTAGTCCGCACGGTAAACGATGAATACTCGCAGTTCGCGAGTTGTCCAGCGAAAGCGTTAAGTATTCCACCTGGGGAGTACGCCGGCAA-GGTGAAACTCAAAGGAATTGACGGGGG-CCCCACAAGCGGAGGAACATGTGGTTTAATTCGATGATACGCGAGGAACCTTACCCGGGCTTGAAC--GAGGTGCTGCATGGTTGTCGTCAGCTCGTGCCGTGAGGTGTCGGCTTAAGTGCCATAACGAGCGCAACCCTTTTCTACGTTTGCAACTCCGTGGATACTGCCGCCG-CAAGGCGGAGGAAGGTGGGGATGACGTCAAATCAGCACGGCCCTTACGTCCGGGGCTACACACGTGTTACAATGGTCGGAGCAGCAGGAAGCTACCTGGCGACAGGATGCTGATCCCA-AAACCCGGCCTCAGTTCGGACTGGAGTCTGCAACCCGACTCCACGAAGCCGGATTCGCTAGTAATCGCGCATCAGCATGGCGCGGTGAATACGT-CCCGGGCCTTGTACACACCGCCCGTCAAGCCATGAAAGCCGGGGGTGCCTGAAAGCCGGGCCTAGGGTAAAACCGGTGATTGGGGCTAAGTCGTAACAAGGTAGCCGT
+>484333 div_ratio=1.149 study_id=38595 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTAGCTACAGGCTTAACACATGCAAGTCGAGGG-ACCGGCGCACGGGTGAGTAACGCGTATCCAACCTGCCCACCACTTGGGGATAACCTTGCGAAAGTAAGACTAATACCCAATGGTGATGGATGGGGATGCGTCTGATTACCTTGTTGGCGGGGTAACGGCCCACCAAGGCGACGATCAGTAGGGGTTCTGAGAGGAAGGTCCCCCACATTGGAACTGAGACACGGTCCAAACTCCTACGGGAGGCAGCAGTGAGGAATATTGGTCAATGGACGAGAGTCTGAACCAGCCAAGTAGCGTGCAGGATGACGGCCTATGGGTTGTAAACTGCTTTTATAAGGGAATATGTACCTTATGAATAAGGACCGGCTAAT-TCCGTGCCAGCAGCCGCGGTAATACGGAAGGTCCGGGCGTTATCCGGATTTATTGGGTTTAAAGGGAGCGTAGGCCGGAGATTAAGCGTGTTGTGAAATGTAGACGCTCAACGTCTGCACTGCAGCGCGAACTGGTTTCCTTGAGTACGCACAAAGTGGGCGGAATTCGTGGTGTAGCGGTGAAATGCTTAGATATCACGAAGAACTCCGATTGCGAAGGCAGCTCACTGGAGCGCAACTGACGCTGAAGCTCGAAAGTGCGGGTATCGAACAGGATTAGATACCCTGGTAGTCCGCACGGTAAACGATGGATGCCC-GCTTTGGTAGC-GGCCAAGCGAAAGCATTAAGCATCCCACCTGGGGAGTACGCCGGCAACGGTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGAGGAACATGTGGTTTAATTCGATGATACGCGAGGAACCTTACCCGGGCTTGAATTGAAGGTGCTGCATGGTTGTCGTCAGCTCGTGCCGTGAGGTGTCGGCTTAAGTGCCATAACGAGCGCAACCCCTCTCCTTAGTTGCCACTCTGGGGACACTGCCACCG-TAAGGTGGAGGAAGGTGGGGATGACGTCAAATCAGCACGGCCCTTACGTCCGGGGCTACACACGTGTTACAATGGCAGGTACAGAGAGACGGTTGTACGTAAGTACGATCAAATCCTT-AAAGCCTGTCTCAGTTCGGACTGGGGTCTGCAACCCGACCCCACGAAGCTGGATTCGCTAGTAATCGCGCATCAGCATGGCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCAAGCCATGAAAGCCGGGGGCGCCTAAAGTCCGGGCCTAGGGCGAAACTGGTAATTGGGGCTAAGTCGTAACAAGGTAGCCGT
+>484332 div_ratio=1.148 study_id=38595 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTAGCTACAGGCTTAACACATGCAAGTCGAGGG-ACCGGCGCACGGGTGAGTAACGCGTATCCAACCTGCCCACCACTTGGGGATAACCTTGCGAAAGTAAGACTAATACCCAATGGTGATGGATGGGGATGCGTCTGATTAGCTTGTTGGCGGGGTAACGGCCCACCAAGGCGACGATCAGTAGGGGTTCTGAGAGGAAGGTCCCCCACATTGGAACTGAGACACGGTCCAAACTCCTACGGGAGGCAGCAGTGAGGAATATTGGTCAATGGGCGAGAGCCTGAACCAGCCAAGTAGCGTGCAGGATGACGGCCTATGGGTTGTAAACTGCTTTTATAAGGGAATATGTACCTTATGAATAAGGACCGGCTAAT-TCCGTGCCAGCAGCCGCGGTAATACGGAAGGTCCGGGCGTTATCCGGATTTATTGGGTTTAAAGGGAGCGTAGGCCGGAGATTAAGCGTGTTGTGAAATGTAGGCGCTCAACGTCTGCACTGCAGCGCGAACTGGTTTCCTTGAGTACGCACAAAGTGGGTGGAATTCGTGGTGTAGCGGTGAAATGCTTAGATATCACGAAGAACTCCGATTGCGAAGGCAGCTCACTGGAGCGCAACTGACGCTGAAGCTCGAAAGTGCGGGTATCGAACAGGATTAGATACCCTGGTAGTCCGCACGGTAAACGATGGATGCCC-GCTTTGGTAGC-GGCCAAGCGAAAGCATTAAGCATCCCACCTGGGGAGTACGCCGGCAACGGTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGAGGAACATGTGGTTTAATTCGATGATACGCGAGGAACCTTACCCGGGCTTGAATTGAAGGTGCTGCATGGTTGTCGTCAGCTCGTGCCGTGAGGTGTCGGCTTAAGTGCCATAACGAGCGCAACCCCTCTCCTTAGTTGCCACTCTGGGGACACTGCCACCG-TAAGGTGGAGGAAGGTGGGGATGACGTCAAATCAGCACGGCCCTTACGTCCGGGGCTACACACGTGTTACAATGGCAGGTACAGAGAGACGGTTGTACGTAAGTACGATCAAATCCTT-AAAGCCTGTCTCAGTTCGGATTGGGGTCTGCAACCCGACCCCACGAAGCTGGATTCGCTAGTAATCGCGCATCAGCATGGCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCAAGCCATGAAAGCCGGGGGCGCCTAAAGTCCGGGCCTAGGGCGAAACTGGTAATTGGGGCTAAGTCGTAACAAGGTAGCCGT
+>484331 study_id=38944 non_ACGT_percent=0.0000 decision=named_isolate
+ATTGAACGCTGGCGGCATGCTTTACACATGCAAGTCGGACG-AGTGGCGAACGGGTGAGTAATATATCGGA-ACGTACCGAGTAATGGGGGATAACTAATCGAAAGATTAGCTAATACCGCATATTATTCGAGCGGCCGATATCTGATTAGCTAGTTGGTGGGGTAAAGGCCTACCAAGGCGACGATCAGTAGCGGGTCTGAGAGGATGATCCGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGTCTGAAGAAGGCCTTCGGGTTGTAAAGGACTTTTGTCAGGGAAGCGGTACCTGAAGAATAAGCACCGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGAGCGCAGACGGTTACTTAAGCAGGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCGTTCTGAACTGGGTGACTAGAGTGTGTCAGAGGGAGGTAGAATTCCACGTGTAGCAGTGAAATGCGTAGAGATGTGGAGGAATACCGATGGCGAAGGCAGCCTCCTGGGATAACACTGACGTTCATGCTCGAAAGCGTGGGTAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCCTAAACGATGTCAATTAGCTGTTGGCTAGTAGCGTAGCTAACGCGTGAAATTGACCGCCTGGGGAGTACGGTCGCAAGATTAAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGATGATGTGGATTAATTCGATGCAACGCGAAGAACCTTACCTGGTCTTGACATGCAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTCATTAGTTGCCACTCTAATGAGACTGCCGGTGACAAGCCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTATGACCAGGGCTTCACACGTCATACAATGGTCGGTACAGAGGGTAGCCAAGCCGCGAGGTGGAGCCAATCTCACAAAACCGATCGTAGTCCGGATTGCACTCTGCAACTCGAGTGCATGAAGTCGGAATCGCTAGTAATCGCAGGTCAGCATACTGCGGTGAATACGTTCCCGGGTCTTGTACACACCGCCCGTCACACCATGGGAGTGGGGGATACCAGAAGTAGGTTACCACGGTATGCTTCATGACTGGGGTGAAGTCGTAACAAGGTAGCCGT
+>484326 study_id=38944 non_ACGT_percent=0.0000 decision=named_isolate
+ATTGAACGCTGGCGGCATGCTTTACACATGCAAGTCGGACG-AGTGGCGAACGGGTGAGTAACATATCGGA-ACGTACCGAGCAGTGGGGGATAACTAATCGAAAGATTAGCTAATACCGCATACTGTTTGAGCGGCCGATATCTGATTAGCTAGTTGGTGGGGTAAAGGCCTACCAAGGCGACGATCAGTAGCGGGTCTGAGAGGATGATCCGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGTCTGAAGAAGGCCTTCGGGTTGTAAAGGACTTTTGTCAGGGAAGCGGTACCTGAAGAATAAGCACCGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGGGCGCAGACGGTTACTTAAGCAGGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCGTTCTGAACTGGGTGACTAGAGTGTGTCAGAGGGAGGTAGAATTCCACGTGTAGCAGTGAAATGCGTAGAGATGTGGAGGAATACCGATGGCGAAGGCAGCCTCCTGGGATAACACTGACGTTCATGCCCGAAAGCGTGGGTAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCCTAAACGATGTCGATTAGCTGTTGGCTAGTAGCGAAGCTAACGCGTGAAATCGACCGCCTGGGGAGTACGGTCGCAAGATTAAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGATGATGTGGATTAATTCGATGCAACGCGAAGAACCTTACCTGGTCTTGACATGCAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTCATTAGTTGCCACTCTAATGAGACTGCCGGTGACAAGCCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTATGACCAGGGCTTCACACGTCATACAATGGTCGGTACAGAGGGTAGCCAAGCCGCGAGGTGGAGCCAATCTCACAAAACCGATCGTAGTCCGGATTGCACTCTGCAACTCGAGTGCATGAAGTCGGAATCGCTAGTAATCGCAGGTCAGCATACTGCGGTGAATACGTTCCCGGGTCTTGTACACACCGCCCGTCACACCATGGGAGTGGGGGATACCAGAAGTAGGTTACCACGGTATGCTTCATGACTGGGGTGAAGTCGTAACAAGGTAGCCGT
+>484325 study_id=38944 non_ACGT_percent=0.0000 decision=named_isolate
+ATTGAACGCTGGCGGCATGCTTTACACATGCAAGTCGGACG-AGTGGCGAACGGGTGAGTAACATATCGGA-ACGTACCGAGTAGTGGGGGATAACTGATCGAAAGATCAGCTAATACCGCATACTATTCGAGCGGCCGATATCTGATTAGCTAGTTGGTGGGGTAAAGGCCTACCAAGGCGACGATCAGTAGCGGGTCTGAGAGGATGATCCGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATTTTGGACAATGGGCGCAAGCCTGATCCAGCCATGCCGCGTGTCTGAAGAAGGCCTTCGGGTTGTAAAGGACTTTTGTCAGGGAAGCGGTACCTGAAGAATAAGCACCGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGAGCGCAGACGGTTACTTAAGCAGGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCGTTCTGAACTGGGTGACTAGAGTGTGTCAGAGGGAGGTAGAATTCCACGTGTAGCAGTGAAATGCGTAGAGATGTGGAGGAATACCGATGGCGAAGGCAGCCTCCTGGGATAACACTGACGTTCATGCTCGAAAGCGTGGGTAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCCTAAACGATGTCAATTAGCTGTTGGCCAGTAGCGTAGCTAACGCGTGAAATTGACCGCCTGGGGAGTACGGTCGCAAGATTAAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGATGATGTGGATTAATTCGATGCAACGCGAAGAACCTTACCTGGTCTTGACATGCAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTCATTAGTTGCCACTCTAATGAGACTGCCGGTGACAAGCCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTATGACCAGGGCTTCACACGTCATACAATGGTCGGTACAGAGGGTAGCCAAGCCGCGAGGTGGAGCCAATCTCACAAAACCGATCGTAGTCCGGATTGCACTCTGCAACTCGAGTGCATGAAGTCGGAATCGCTAGTAATCGCAGGTCAGCATACTGCGGTGAATACGTTCCCGGGTCTTGTACACACCGCCCGTCACACCATGGGAGTGGGGGATACCAGAAGTAGGTTACCACGGTATGCTTCATGACTGGGGTGAAGTCGTAACAAGGTAGCCGT
+>484322 study_id=38595 non_ACGT_percent=0.0000 decision=named_isolate
+GCT-ACTGCTATTGGGATCGTTAAGCCATGCAAGTCGAACGACGTGGCGTACGGCTCAGTAACACGTGGATAACCTACCCTTAGGACTGGGATAACCCTGGGAAACTGGGGATAATACTGGATACCTAAGGATGGGTCTGCGGCCGATTAGGTAGTTGGTTAGGTAATGGCTTACCAAGCCTTTGATCGGTACGGGTTGTGAGAGCAAGAGCCCGGAGATGGAACCTGAGACAAGGTTCCAGGCCCTACGGGGTGCAGCAGGCGCGAAACCTCCGCAATGTGAGAAATCGCGACGGGGGGATCCCAAGTGCCAT----TCT--TAAC--GGG--A-TGGCTTTTCATTAGT-------GCTTTTGGAATAAGAGCTGGC-AAGACCGGTGCCAGCCGCCGCGGTAACACCGGCAGCTCTAGTGGTAGCAGTTTTTATTGGGCCTAAAGCGTCCGTAGCCGGTTTAATAAGTCTCTGGTGAAATCCTGCAGCTTAACTGTGGGAATGCTGGAGATACTATTAGACTTGAGATCGGGAGAGGTTAGAGGTACTCCCAGGGTAGAGGTGAAATTCTGTAATCCTGGGAGGACCGCCTGTTGCGAAGGCGTCTGACTGGAAC-GATCTGACGGTGAGGGACGAAAGCTAGGGGCGCGAACCGGATTAGATACCCGGGTAGTCCTAGCTGTAAACGATGCGGACTTGGTGTTGGGCAGTGCCGAAGGGAAGCTGTTAAGTCCGCCGCCTGGGAAGTACGGTCGCAAGACTGAAACTTAAAGGAATTGGCGGGGGAGCACACAACGCGTGGAGCCTGCGGTTTAATTGGATTCAACGCCGGACATCTCACCAGAGG--------GAGGAGGTGCATGGCCGCCGTCAGCTCGTACCGTGAGGCGTCCTGTTAAGTCAGGCAACGAGCGAGACCCACGCTCTTAGTTACCACACTAAGGGGACCGCCTATGATAAATAGGAGGAAGGAGTGGACGACGGTAGGTCCGTATGCCCCGAATCCTCTGGGCAACACGCGGGCTACAATGGCTGAGACAATGGGTTCCGACGCCGAAAGGCGGAGGTAATCCTCTAAACTTAGTCGTAGTTCGGATTGAGGACTGTAACTCGTTCTCATGAAGCTGGAATGCGTAGTAATCGCGTGTCAC-ATCGCGCGGTGAATACGTCCCTGCTCCTTGCACACACCGCCCGTCACGCCACCCAAAAAGGGATTGGATGA-GGATGATTCGAATCTAGTTTTTTTAAGGAGGGCGAAGTCGTAACAAGGTAGCCGT
+>484320 study_id=38100 non_ACGT_percent=0.0000 decision=named_isolate
+GACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAAC-GAGTGGCGAACGGGTGAGTAATACGCGGGCAACCTGCCCCTCTCTTCGGGATAAGCTTTGGAAACGGGGTCTAATACCGGATGGCGGGGGATGGGCTCGCGGCCTATCAGCTTGTTGGTGGGGTGACGGCT-ACCAAGGC-GCGACGGGTAGCCGGCCTGAGAGGGTGGTCGGCCACACTGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGGATATTGCACAATGGGCGCAAGCCTGATGCAGCGACGCCGCGTGGGGGATGGAGGCTTTCGGGTTGTAAACCCCTTTCGGCGCGGGAAGGGTACGCGTCAAAGAAGCGCCGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGGCGCGAGCGTTGTCCGGAATTATTGGGCGTAAAGGGCTCGTAGGCGGCTTGTCGCGTCTGCTGTGAAAC-GCGGGGCTCAACTCCGCGCGTGCAGTGGGTACGGGCAGGCTGGAGTGCGGCAGGGGTGGCTGGAATTCCTGGTGTAGCGGTGGAATGCGCAGATATCAGGAAGAACACCGATGGCGAAGGCAGGCCACTGGGCCGC-ACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCACGCTGTAAACGTTGGGAACTAGGTGTGGGGCTGCGCCGGAGCTAACGCGTTAAGTTCCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGCGGAGCATGCGGATTAATTCGATGCAACGCGAAGAACCTTACCAAGGCTTGACATGCAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTCCCGTGTTGCGACTCACGGGGGACTGCCGGGGTCAACTCGGAGGAAGGTGGGGACGACGTCAAATCATCATG-CCCTTATGCCTTGGGCTTCACGCATGCTACAATGGCCGGTACAGAGGGTGGCGATGCCGTGAGGCGGAGCGAATCTTGTAAAGCCGGTCTCAGTTCGGATCGGGGTCTGCAACTCGGGCCCGTGAAGTCGGAGTCGCTAGTAATCGCAGATCAGCACGCTGCGGTGAATACGTTCTCGGGCCTTGTACACACCGCCCGTCACGTCACGAAAGTCGGCGACGCCCGAAGCCCGGGTCGAAGGCGGGGTTGGCGATTGGGACGAAGTCGTAACAAGGTAGCCGT
+>484315 study_id=39086 non_ACGT_percent=0.0000 decision=named_isolate
+GACGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAAC-GAGTGGCGAACGGGTGAGTAACACGTGGGTGATCTGCCCTGCACTTCGGGATAAGCTTGGGAAACTGGGTCTAATACCGGATAGTGTAGGATGAGCTCGCGGCCTATCAGCTTGTTGGTGGGGTAATGGCT-ACCAAGGC-GCGACGGGTAGCCGGCCTGAGAGGGTGTACGGCCACATTGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCGACGCCGCGTGGGGGATGAAGGCCTTCGGGTTGTAAACTCCTTTCGCTAGGGACGCGGTACCTAGATAAGAAGCACCGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCGAGCGTTGTCCGGAATTACTGGGCGTAAAGGGCTCGTAGGTGGTTTGTCGCGTCGTCTGTGAATT-CTGGGGCTTAACTCCGGGCGTGCAGGCGATACGGGCAAACTTGAGTGCTGTAGGGGTAACTGGAATTCCTGGTGTAGCGGTGAAATGCGCAGATATCAGGAGGAACACCGATGGCGAAGGCAGGTTACTGGGCAGT-ACTGACGCTGAGGAGCGAAAGCATGGGTAGCGAACAGGATTAGATACCCTGGTAGTCCATGCCGTAAACGGTGGGCGCTAGGTGTGAGGTCGTGCCGTAGCTAACGCATTAAGCGCCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGCGGAGCATGTGGATTAATTCGATGCAACGCGAAGAACCTTACCTGGGCTTGACATACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTGTCTTATGTTGCGACTCATGAGAGACTGCCGGGGTTAACTCGGAGGAAGGTGGGGATGACGTCAAATCATCATG-CCCTTATGTCCAGGGCTTCACACATGCTACAATGGTCGGTACAACGCGCTGCGACACTGTGAGGTGGAGCGAATCGCTGAAAGCCGGCCTTAGTTCGGATTGGGGTCTGCAACTCGACCCCATGAAGTCGGAGTCGCTAGTAATCGCAGATCAGCATGCTGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACGTCATGAAAGTTGGTAACACCCGAAGCCGGCGTCGAAGGTGGGATCGGCGATTGGGACGAAGTCGTAACAAGGTACCCGT
+>484309 div_ratio=1.043 study_id=38595 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTGGCGGCGTGCCTAACACATGCAAGTCGAACGAAGTGGCGGACGGGTGAGTAACGCGTGGGTAACCTGCCTCACACTGGGGGACAACAGCTGGAAACGGCTGCTAATACCGCATAGTGTGAGATGGACCCGCGTCTGATTAGCTAGTTGG-TAGGTAACGGCTTACCAAGGCGACGATCAGTAGCCGACCTGAGAGGGTGACCGGCCACATTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGGGAAACCCTGATGCAGCGACGCCGCGTGAGTGAAGAAGTATTTCGGTATGTAAAGCTCTATCAGCAGGGAAGCGGTACCTGACTAAGAAGCCCCGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCAAGCGTTATCCGGATTTACTGGGTGTAAAGGGAGCGTAGACGGCAA-G-AAGTCTGAAGTGAAAGCCCGGGGCTCAACCGCGGGACTGCTTTGGAAACTGTTTTGCTAGAGTGCTGGAGAGGTAAGTGGAATTCCTAGTGTAGCGGTGAAATGCGTAGATATTAGGAGGAACACCAGTGGCGAAGGCGGCTTACTGGACAGTAACTGACGTTGAGGCTCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAATACTAGGTGTTGGTCGGTGCCGTCGCAAACGCAATAAGTATTCCACCTGGGGAGTACGTTCGCAAGAATGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAAGTCTTGACATCCAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATCCTAAGTAGCCACTCTTGGGAGACTGCCAGGGATAACCTGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGATTTGGGCTACACACGTGCTACAATGGCG-TAACAAAGGGAAGCGAGCT-GTGAAGCTGAGCAAATCTCAAAAATACG-TCTCAGTTCGGATTGTAGTCTGCAACTCGACTACATGAAGCTGGAATCGCTAGTAATCGCGGATCAG-ATGCCGCGGTGAATACGTTCCCGGGTCTTGTACACACCGCCCGTCACACCATGGGAGTCAGTAACGCCCGAAGTCAGTGCCGAAGGCGGGACCGATAACTGGGGTGAAGTCGTAACAAGGTAGCCGT
+>484305 study_id=38646 non_ACGT_percent=0.0000 decision=named_isolate
+ATTGAACGCTGGCGGCAGGCCTAACACATGCAAGTCGAACG-AGTGGCGGACGGGTGAGTAATGTCTGGGA-AACTGCCCGATGGAGGGGGATAACTACTGGAAACGGTAGCTAATACCGCATACCATCGGATGTGCCCAGATGGGATTAGCTTGTTGGTGGGGTAACGGCTCACCAAGGCGACGATCCCTAGCTGGTCTGAGAGGATGACCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCCATGCCGCGTGTATGAAGAAGGCCTTCGGGTTGTAAAGTACTTTCAGCGAGGAGGCGTTACTCGCAGAAGAAGCACCGGCTAAC-TCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGCACGCAGGCGGTCTGTTAAGTCAGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATTTGAAACTGGCAGGCTTGAGTCTCGTAGAGGGGGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACGAAGACTGACGCTCAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACG-CCTAAACGATGTCTATTTGGAGGTTGTGGCTTCCGGAGCTAACGCGTTAAATAGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGAC-GGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTGGTCTTGACATCCAGGTGCTGCATGGCTGTCGTCAGCTCGTGTTGTGAAATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATCCTTTGTTGCAACTCAAAGGAGACTGCCAGTGATAAACTGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTACGACCAGGGCTACACACGTGCTACAATGGCATATACAAAGAGAAGCGACCTCG...............................................................................................................................................................................................................................
+>484304 study_id=38646 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAAC-GAGTGGCGAACGGGTGAGTAATGCGTGACCAACCTGCCTTGTGCACCGGAATAGCTCCTGGAAACGGGTGGTAATACCGGATGGCATGGGATGGGGTCGCGTCCTATCAGCTTGTTGGCGGGGTGACGGCC-ACCAAGGC-TTGACGGGTAGCCGGCCTGAGAGGGTGACCGGCCACATTGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCGACGCCGCGTGCGGGATGGAGGCCTTCGGGTTGTAAACCGCTTTTGATTGTCAGCGTGTAGCTTTCGAATAAGCACCGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCAAGCGTTATCCGGAATTATTGGGCGTAAAGGGCTCGTAGGCGGTTCGTCGCGTCCGGTGTGAAGT-CCATCGCTTAACGGTGGATCTGCGCCGGGTACGGGCGGGCTGGAGTGCGGTAGGGGAGACTGGAATTCCCGGTGTAACGGTGGAATGTGTAGATATCGGGAAGAACACCAATGGCGAAGGCAGGTCTCTGGGCCGT-ACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGGTGGATGCTGGATGTGGGGCTGTGTCGGAGCTAACGCGTTAAGCATCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGAAATTGACGGGGGCCCGCACAAGCGGCGGAGCATGCGGATTAATTCGATGCAACGCGAAGAACCTTACCTGGGCTTGACATGCAGGTGGTGCATGGTCGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTCGCCGCGTGTTGCAACTCACGTGGGACCGCCGGGGTCAACTCGGAGGAAGGTGGGGATGACGTCAGATCATCATG-CCCTTACGTCCAGGGCTTCACGCATGCTACAATGGCCGGTACAACGGGATGCGACACCGTGAGGTGGGGCGGATCCCTGAAAACCGGTCTCAGTTCGGATCGCAGTCTGCAACCCGACTGCGTGAAGGCGGAGTCGCTAGTAATCGCAGATCAGCACGCTGCGGTGAATGCGTTCCCGGGCCTTGTACACACCGCCCGTCAAGTCATGAAAGTGGGTAGCACCCGAAGCCGGCGTCTAAGGTGAGACTCGTGATTGGGACTAAGTCGTAACAAGGTAGCCGT
+>484303 study_id=38595 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAAC-GAGGGGCGAACGGGTGAGTAATGCGTGACCGACCTGCCCCATGCACCGGAATAGCTCCTGGAAACGGGTGGTAATGCCGGATGGCATGGGATGGGGTCGCGTCCTATCAGCTTGATGGCGGGGTAACGGCC-ACCATGGC-TCGACGGGTAGCCGGCCTGAGAGGGCGACCGGCCACATTGGGACTGAGATACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGCGCAAGCCTGATGCAGCGACGCCGCGTGAGGGATGGAGGCCTTCGGGTTGTAAACCTCTTTTGTTAGGGAGCGTGTACCTTTCGAATAAGCACCGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGGTGCAAGCGTTATCCGGAATTATTGGGCGTAAAGGGCTCGTAGGCGGTTCGTCGCGTCCGGTGTGAAGT-CCATCGCTTAACGGTGGATCCGCGCCGGGTACGGGCGGGCTTGAGTGCGGTAGGGGAGACTGGAATTCCCGGTGTAACGGTGGAATGTGTAGATATCGGGAAGAACACCAATGGCGAAGGCAGGTCTCTGGGCCGT-ACTGACGCTGAGGAGCGAAAGCGTGGGGAGCGAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGGTGGATGCTGGATGTGGGGCCGTGTCGGAGCTAACGCGTTAAGCATCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGAAATTGACGGGGGCCCGCACAAGCGGCGGAGCATGCGGATTAATTCGATGCAACGCGAAGAACCTTACCTGGGCTTGACATGCAGGTGGTGCATGGTCGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTCGCCCCGTGTTGCAACTCACGGGGGACCGCCGGGGTTAACTCGGAGGAAGGTGGGGATGACGTCAGATCATCATG-CCCTTACGTCCAGGGCTTCACGCATGCTACAATGGCCGGTACAACGGGATGCGACAGTGCGAGCTGGAGCGGATCCCTGAAAACCGGTCTCAGTTCGGATCGCAGTCTGCAACTCGACTGCGTGAAGGCGGAGTCGCTAGTAATCGCGAATCAGCACGTCGCGGTGAATGCGTTCCCGGGCCTTGTACACACCGCCCGTCAAGTCATGAAAGTGGGCAGCACCCGAAGCCGGCGTCTAAGGTGAGGCTCGTGATTGGGACTAAGTCGTAACAAGGTAGCCGT
+>484296 study_id=40682 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTGGCGGCGCGCCTAACACATGCAAGTCGAAC-GAGTGGCGAACGGCTGAGTAACACGTGGGCAACCTGCCCTCCTCTTGGGGATAGCCTCGGGAAACCGAGGATAATACCCGATAGAGAAGGATGGGCCCGCGGCCTGTTAGCTTGTTGGTGGGGTAGAGGCT-ACCAAGGC-ATGATGGGTAGCTGGGTTGAGAGACCGACCAGCCAGATTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATCTTGCACAATGGGCGAAAGCCTGATGCAGCGACGCCGCGTGCGGGACGAAGGCCTTCGGGTTGTAAACCGCTTTCAGCAGGGACGCGGTACCTGCAGAAGAAGCCCCGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCAAGCGTTATCCGGATTCATTGGGCGTAAAGCGCTCGTAGGCGGTCTGTTAGGTCGGGAGTTAATC-CGGAGGCTCAACCTCCG-CCCGCTCCCGATACCGGCAGACTTGAGTTTGGTAGGGGAAGGTGGAATTCCTAGTGTAGCGGTGGAATGCGCAGATATTAGGAAGAACACCAGTGGCGAAGGCGGCCTTCTGGGCCAA-ACTGACGCTGAGGAGCGAAAGCTAGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCTAGCTGTAAACGATGGACACTAGGTGTGGGACCGTGCCGCAGCTAACGCATTAAGTGTCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGACCCGCACAAGCAGCGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAGGGCTTGACATGCAGGTGGTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTAGGTTAAGTCCTGCAACGAGCGCAACCCTCGTCGTATATTGCCACCTATACGAGACCGCCGGCGTCAAGCCGGAGGAAGGTGGGGACGACGTCAAGTCATCATG-CCCTTATGTCCTGGGCTACACACGTGCTACAATGGCCGGCACAATGAGCTGCCAACCCGCAAGGGCGAGCGAATCTC-TAAAGCCGGTCCCAGTTCGGATTGGAGGCTGCAACCCGCCTCCATGAAGTCGGAGTTGCTAGTAATCGCGGATCAGCACGCCGCGGTGAATGCGTTCCCGGGTCTTGTACACACCGCCCGTCACACCACCCGAGTCGATTGCACCCGAAGTCGTCGCCGAAGGTGTGGTTGGTAAGGGGGGTGAAGTCGTAACAAGGTAGCCGT
+>484294 study_id=33866 non_ACGT_percent=0.0000 decision=named_isolate
+GATGAACGCTGGCGGCGTGCTTAACACATGCAAGTCGAACGAAGTGGCGGACGGGTGAGTAACGCGTGGGGAACCTGCCCTATACAGGGGGATAACAGCTGGAAACGGCTGCTAATACCGCATAGTATAGGATGGTCCCGCGTCTGATTAGCTGGTTGGTGAGGTAACGGCTCACCAAGGCGACGATCAGTAGCCGGCTTGAGAGAGTGAACGGCCACATTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGGGAAACCCTGATGCAGCGACGCCGCGTGAGTGAAGAAGTATTTCGGTATGTAAAGCTCTATCAGCAGGGAAGCGGTACCTGACTAAGAAGCCCCGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGGGGCAAGCGTTATCCGGAATTACTGGGTGTAAAGGGTGCGTAGGTGGCATGGTAAGTCAGAAGTGAAAGCCCGGGGCTTAACCCCGGGACTGCTTTTGAAACTGTCATGCTGGAGTGCAGGAGAGGTAAGCGGAATTCCTAGTGTAGCGGTGAAATGCGTAGATATTAGGAGGAACACCAGTGGCGAAGGCGGCTTACTGGACTGTCACTGACACTGATGCACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAATACTAGGTGTCGGGCGGTGCCGCAGCAAACGCAGTAAGTATTCCACCTGGGGAGTACGTTCGCAAGAATGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCTGGTCTTGACATCCAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTATCTTTAGTAGCCACTCTAGAGAGACTGCCAGGGATAACCTGGAGGAAGGTGGGGACGACGTCAAATCATCATGCCCCTTATGGCCAGGGCTACACACGTGCTACAATGGCGTAAACAAAGGGAAGCGAAGTCGTGAGGCGAAGCAAATCCCAGAAATAACGTCTCAGTTCGGATTGTAGTCTGCAACTCGACTACATGAAGCTGGAATCGCTAGTAATCGTGAATCAG-ATGTCACGGTGAATACGTTCCCGGGTCTTGTACACACCGCCCGTCACACCATGGGAGTCAGTAACGCCCGAAGTCAG..................................................
+>471785 study_id=37997 non_ACGT_percent=0.0000 decision=symbiont
+..........GGCGGCAGGCCTAACACATGCAAGTCGAGCG-AGCGGCGGACGGGTGAGTAATGTCTGGGG-ATCTGCCCGATGGAGGGGGATAACTACTGGAAACGGTAGCTAATACCGCATACCATCGGATGAACCCAGATGGGATTAGCTAGTAGGTGGGGTAATGGCTCACCTAGGCGACGATCCCTAGCTGGTCTGAGAGGATGACCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGCACAATGGGGGAAACCCTGATGCAGCCATGCCGCGTGTGTGAAGAAGGCCTTCGGGTTGTAAAGCACTTTCAGCGGGGAGGCGTTACCCGCAGAAGAAGCACCGGCTAAC-TCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCGAGCGTTAATCGGAATTACTGGGCGTAAAGCGTACGCAGGCGGTCTGTTAAGTCAGATGTGAAATCCCCGGGCTCAACCTGGGAACTGCATTTGAAACTGGCAGGCTAGAGTCTCGTAGAGGGGGGTAGAATTCCAGGTGTAGCGGTGAAATGCGTAGAGATCTGGAGGAATACCGGTGGCGAAGGCGGCCCCCTGGACGAAGACTGACGCTCAGGTACGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCTGTAAACGATGTCGATTTGAAGGTTGTGGCTTTCGGAGCTAACGCGTTAAATCGACCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAATGAATTGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTACTCTTGACATCCAGGTGCTGCATGGCTGTCGTCAGCTCGTGTTGTGAAATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTATCCTTTGTTGCAACTCAAAGGAGACTGCCGGTGATAAACCGGAGGAAGGTGGGGATGACGTCAAGTCATCATGGCCCTTACGAGTAGGGCTACACACGTGCTACAATGGCGCATACAAAGAGAAGCGATCTCGCGAGAGTCAGCGGACCTCATAAAGTGCGTCGTAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGTCGGAATCGCTAGTAATCGTGGATCAG-ATGCCACGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTGGGTTGCAAAAGAAGTAGGTTACCACTTTGTGATTCATGACTGGGGTG.....................
+>471528 study_id=37895 non_ACGT_percent=0.0000 decision=named_isolate
+.........................ACATGCAAGTCGAGCGCAGCGGCAGACGGGTGAGTAACGCGTGGGA-ATCTACCCATCTCTACGGAACAACTCCGGGAAACTGGAGCTAATACCGTATAGAGATGGATGAGCCCGCGTTGGATTAGCTAGTTGGTGGGGTAATGGCCTACCAAGGCGACGATCCATAGCTGGTCTGAGAGGATGATCAGCCACACTGGGACTGAGACACGGCCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGAAAGCCTGATCCAGCCATGCCGCGTGAGTGATGAAGGCCCTAGGGTTGTAAAGCTCTTTCAACGGTGAAGCGGTAACCGTAGAAGAAGCCCCGGCTAAC-TTCGTGCCAGCAGCCGCGGTAATACGAAGGGGGCTAGCGTTGTTCGGAATTACTGGGCGTAAAGCGCACGTAGGCGGATACTTAAGTCAGGGGTGAAATCCCGGGGCTCAACCCCGGAACTGCCTTTGATACTGGGTATCTCGAGTCCGGAAGAGGTGAGTGGAATTCCGAGTGTAGAGGTGAAATTCGTAGATATTCGGAGGAACACCAGTGGCGAAGGCGGCTCACTGGTCCGGTACTGACGCTGAGGTGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGGAAGCTAGCCGTTGGCCGGTGGCGCAGCTAACGCATTAAGCTTCCCGCCTGGGGAGTACGGTCGCAAGATTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGCAGAACCTTACCAGCCCTTGACATCCAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTCGCCCTTAGTTGCCACTCTAAGGGGACTGCCGGTGATAAGCCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTACGGGCTGGGCTACACACGTGCTACAATGGTGGTGACAGTGGGCAGCGAGACCGCGAGGTCGAGCTAATCTCC-AAAAGCCATCTCAGTTCGGATTGCACTCTGCAACTCGAGTGCATGAAGTTGGAATCGCTAGTAATCGCGGATCAGCATGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTTGGTTTTACCCGAAGGCGC..................................................
+>471521 study_id=37891 non_ACGT_percent=0.0000 decision=named_isolate
+..........................................AGCGGGG-ACGGGTGAGTAACACGTGGGTAACCTCCT-ATAAGACTGGGATAACTCCGGGAAACCGGGGCTAAACCGG-ATACTTATAGATGGACCCGCGCCGTATTAGCTAGTTGGTAAGGTAACGGCTTACCAAGGCGACGATACGTAGCCGACCTGAGAGGGTGATCGGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTAGGGAATCTTCCGCAATGGGCGAAAGCCTGACGGAGCAACGCCGCGTGAGTGATGAAGGTCTTCGGATCGTAAAACTCTGTTGTTAGGGAAGCGGTACCTAACCAGAAAGCCACGGCTAAC-TACGTGCCAGCAGCCGCGGTAATACGTAGGTGGCAAGCGTTATCCGGAATTATTGGGCGTAAAGCGCGCGTAGGCGGTTTCTTAAGTCTGATGTGAAAGCCCACGGCTCAACCGTGGAG-GGCATTGGAAACTGGGAAACTTGAGTGCAGAAGAGGAGAGTGGAATTCCATGTGTAGCGGTGAAATGCGCAGAGATATGGAGGAACACCAGTGGCGAAGGCGGCTCTCTGGTCTGTAACTGACGCTGATGTGCGAAAGCGTGGGGATCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAAGTGTTAGGTAGTGCTGCAGCTAACGCATTAAGCACTCCGCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGAAGCAACGCGAAGAACCTTACCAAATCTTGACATCCAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCTTAAGCTTAGTTGCCACTCTAGGTTGACTGCCGGTGACAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGATTTGGGCTACACACGTGCTACAATGGATAATACAAAGGGCAGCGAT-CCGCGAGGCCAAGCAAATCCCATAAAATTATTCTCAGTTCGGATTGTAGTCTGCAACTCGACTACATGAAGCTGGAATCGCTAGTAATCGTAGATCAGCATGCTACGGTGAATACGTTCCCGGGTCTTGTACACACCGCCCGTCACACCACGAGAGTTTGTAACACCCGAAGCCGG..................................................
+>471518 study_id=37888 non_ACGT_percent=0.0696 decision=clone
+................GTGCCTAATACATGCAAGTTGAGCGCAGCAGCGAACGGGTGAGTAACGCGTGGGGAAC-TGCCTTTGAGCGGGGGACAACATTTGGAAACGAATGCTAATACCGCATACTCAAAGATGATCCCGCGTTGTATTAGCTAGTTGGTGAGGTAAAGGCTCACCAAGGCGATGATACATAGCCGACCTGAGAGGGTGATCGGCCACATTGGGACTGAGACACGGCCCAAACTCCTACGGGAGGCAGCAGTAGGGAATCTTCGGCAATGGACGAAAGTCTGACCGAGCAACGCCGCGTGAGTGAAGAAGGTTTTCGGATCGTAAAACTCTGTTGGTAGAGAAGCGGTAACTACCCAGAAAGGGACGGCTAAC-TACGTGCCAGCAGCCCGGGTAATACGTAGGTCCCGAGCGTTGTCCGGATTTATTGGGCGTAAAGCGAGCGCAGGTGGTTTATTAAGTCTGGTGTAAAAGGCAGTGGCTCAACCATTGTA-TGCATTGGAAACTGGTAGACTTGAGTGCAGGAGAGGAGAGTGGAATTCCATGTGTAGCGGTGAAATGCGTAGATATATGGAGGAACACCGGTGGCGAAAGCGGCTCTCTGGCCTGTAACTGACACTGAGGCTCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGAGTGCTAGATGTAGG-CTGTATCGCAGCTAACGCAATAAGCACTCGCCCTGGGGAGTACGACCGCAAGGTTGAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTTAATTGGAAGCAACGCGAAGAACCTTACCAGGTCTTGACATACAGGTGGTGCATGGTTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTATTGTTAGTTGCCACTCTAACGAGACTGCCGGTGATAAACCGGAGGAAGGTGGGGATGACGTCAAATCATCATGCCCCTTATGACCTGGGCTACACACGTGCTACAATGGATGGTACAACGAGTCGCGAGACAGTGATGTTTAGCTAATCTCTTAAAACCATTCTCAGTTCGGATTGTAGGCTGCAACTCGCCTACATGAAGTCGGAATCGCTAGTAATCGCGGATCAGCACGCCGCGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCACGGAAGTTGGGAGTACCCGAAGTAGGTTCCTAAGGTAA......................................
+>471517 study_id=37887 non_ACGT_percent=0.0000 decision=clone
+ATTGAACGCTGGCGGTATGCTTAACACATGCAAGTCGAACG-AGTGGCGGACGGGTGAGTAACGCGTAGGA-ATCTGCCTGATAGTGGGGGATAGCCCGAAGAAATTCGGATTAATACCGCATACTATCAGATGAGCCTGCGTAAGATTAGCTTGTTGGTAGGGTAAAAGCCTACCAAGGCGACGATCTTTAGCTGGTCTGAGAGGATGATCAGCCACATCGGGACTGAGACACGGCCCGAACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGGGCAACCCTGATCCAGCAATACCGCGTGTGTGAAGAAGGCCTGAGGGTTGTAAAGCACTTTCAATTGTGAAGCGTTAACTTTAGAAGAAGCACCGGCTAAC-TCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGTAGGCGGTTTATTAAGTCAGATGTGAAAGCCCCGGGCTTAACCTGGGAACTGCATTTGAAACTGGTCAACTAGAGTATGGTAGAGGAAAGTGGAATTTCTGGTGTAGCGGTGAAATGCGTAGATATCAGAAGGAACATCAATGGCGAAGGCAGCTTTCT-GACCAATACTGACGCTGAGGTACGAAAGCGTGGGTAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGATAACTAGCCGTTGGGTAGTGGCGAAGCTAACGCGTTAAGTTATCCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTGGTCTTGACATCCAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGTAACGAGCGCAACCCCTATCCTTATTTGCAACTATAAGGAGACTGCCGGTGATAAACCGGAGGAAGGCGGGGACGACGTCAAGTCATCATGGCCCTTACGACCAGGGCTACACACGTGCTACAATGGGAAGGACAAAGAGCCGC-AAGCCGCGAGGTGTAGCTAATCTCATAAACCTTTTCGTAGTCCGGATTGGAGTCTGCAACTCGACTCCATGAAGTCGGAATCGCTAGTAATCGTAGATCAGA--GCTACGGTGAATACGTTCCCGGGTCTTGTACACACCGCC......................................................................................
+>471516 study_id=37887 non_ACGT_percent=0.0000 decision=clone
+.TTGAACGCTGGCGGTATGCTTAACACATGCAAGTCGAACG-AGTGGCGGACGGGTGAGTAACGCGTAGGA-ATCTACCTAATAGTGGGGGATAGCCCAGAGAAATCTGGATTAATACCGCATACTATCAGATGAGCCTGCGTAAGATTAGCTAGTTGGTGAGGTAAAAGCTCACCAAGGCGACGATCTTTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATATTGGACAATGGGCGCAAGCCTGATCCAGCAATACCGCGTGTGTGAAGAAGGCCTGAGGGTTGTAAAGCACTTTCAATTGTGAAGCGTTAACTTTAGAAGAAGCACCGGCTAAC-TCCGTGCCAGCAGCCGCGGTAATACGGAGGGTGCAAGCGTTAATCGGAATTACTGGGCGTAAAGCGTGCGTAGGTGGTTTGTTAAGTTAGATGTGAAAGCCCTGGGCTCAACCTAGGAACTGCATTTAAAACTGGCAAACTAGAGTATAGGAGAGGAAAGTGGAATTTCAGGTGTAGCGGTGAAATGCGTAGATATCTGAAGGAACATCAATGGCGAAGGCAGCTTTCTGGACTAATACTGACACTGAGGTACGAAAGCGTGGGTAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGACAACTAGCCGTTGGGTAGTGGCGAAGCTAACGCGTTAAGTTGTCCGCCTGGGGAGTACGGCCGCAAGGTTAAAACTCAAAGGAATTGACGGGGACCCGCACAAGCGGTGGAGCATGTGGTTTAATTCGATGCAACGCGAAGAACCTTACCTGGTCTTGACATACAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGTAACGAGCGCAACCCTTATCCTTATTTGCAACTATAAGGAGACTGCCGGTGATAAACCGGAGGAAGGCGGGGACGACGTCAAGTCATCATGGCCCTTACGACCAGGGCTACACACGTGCTACAATGGGAAGGACAAAGGGTTGCTAAGCCGCGAGGTGGTGCTAATCTCATAAACCTTTTCGTAGTCCGGATCGGAGTCTGCAACTCGACTCCGTGAAGTCGGAATCGCTAGTAATCGTGGATCAG-ACGCCACGGTGAATACGTTCCCGGGTCTTGTACACACCGCCCGTC..................................................................................
+>471515 study_id=37886 non_ACGT_percent=0.0000 decision=named_isolate
+AACGAACGTTAGCGGCGCGCTTAACACATGCAAGTCGAGCGAAGCGGCGCACGGGTGAGTAACACGTAGGTAATCTGCCCCCAGGTGGTGGATAACGTTCCGAAAGGAGCGCTAATACAGCATGCCGGGG-ATGAGCCTGCGGCCCATCAGCTAGTTGGTAGGGTAATGGCCTACCAAGGCGAAGACGGGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATCTTGCGCAATGGGCGAAAGCCTGACGCAGCGACGCCGCGTGAGTGATGAAGGCCTTCGGGTTGTAAAGCTCTGTGGAGGGGGACGCGGTACCCCTTTAGCAAGCACCGGCTAAC-TCTGTGCCAGCAGCCGCGGTAAGACAGAGGGTGCAAACGTTGTTCGGAATTACTGGGCGTAAAGCGCGTGTAGGCGGTTCTAAA-GTC-AGTGTGAAAGCCCTGGGCTTAACCCAGGAAGTGCA-CTGAAACTACGAA-CTTGAGTCCCGGAGAGGAAGGCGGAATTCTCGGTGTAGAGGTGAAATTCGTAGATATCGAGAGGAACATCGGTGGCGAAGGCGGCCTTCTGGACGGTGACTGACGCTGAGACGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGGGTGCTAGGTGC-GCGCGGTGCCGTAGCTAACGCATTAAGCACCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTCAATTCGACGCAACGCGCAGAACCTTACCTGGGCTAGAAAATTAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTATCGTTAGTTGCCACTCTAGCGAGACTGCCGATTTTAAATCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTATGTCCAGGGCTACACACGTGCTACAATGGGCGGTACAGACGGTCGCGAACCCGCGAGGGAA-GCCAATCCGAAAAAACCGTCCTCAGTACGGATAAGAGTCTGCAACTCGACTCTTTGAAGTTGGAATCGCTAGTAATCCCTGATCAGCAGGCAGGGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTCGATTGCTCCAGAAGTGGCCCCCCAAGGAGTGGTTGGTAACTGGGGTGAAGTCGTAACAAGGTAGCCGT
+>471514 study_id=37886 non_ACGT_percent=0.0000 decision=named_isolate
+AACGAACGTTAGCGGCGCGCTTAACACATGCAAGTCGAGCGAAGCGGCGCACGGGTGAGTAACACGTAGGTAATCTGCCCCCAGGTGGTGGATAACGTTCCGAAAGGAGCGCTAATACAGCATGCCGGGG-ATGAGCCTGCGGCCCATCAGCTAGTTGGTAGGGTAATGGCCTACCAAGGCGAAGACGGGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATCTTGCGCAATGGGCGAAAGCCTGACGCAGCGACGCCGCGTGAGTGATGAAGGCCTTCGGGTTGTAAAGCTCTGTGGAGGGGGACGCGGTACCCCTTTAGCAAGCACCGGCTAAC-TCTGTGCCAGCAGCCGCGGTAAGACAGAGGGTGCAAACGTTGTTCGGAATTACTGGGCGTAAAGCGCGTGTAGGCGGTTCTAAA-GTC-AGTGTGAAAGCCCTGGGCTTAACCCAGGAAGTGCA-CTGAAACTACGAA-CTTGAGTCCCGGAGAGGAAGGCGGAATTCTCGGTGTAGAGGTGAAATTCGTAGATATCGAGAGGAACATCGGTGGCGAAGGCGGCCTTCTGGACGGTGACTGACGCTGAGACGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGGGTGCTAGGTGC-GCGCGGTGCCGTAGCTAACGCATTAAGCACCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGGCCCGCACAACCGGTGGAGCATGTGGTTCAATTCGACGCAACGCGCAGAACCTTACCTGGGCTAGAAAATTAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTATCGTTAGTTGCCACTCTAGCGAGACTGCCGATTTTAAATCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTATGTCCAGGGCTACACACGTGCTACAATGGGCGGTACAGACGGTCGCGAACCCGCGAGGGAA-GCCAATCCGAAAAAACCGTCCTCAGTACGGATAAGAGTCTGCAACTCGACTCTTTGAAGTTGGAATCGCTAGTAATCCCTGATCAGCAGGCAGGGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTCGATTGCTCCAGAAGTGGCCCCCCAAGGAGTGGTTGGTAACTGGGGTGAAGTCGTAACAAGGTAGCCGT
+>471513 study_id=37886 non_ACGT_percent=0.0000 decision=named_isolate
+AACGAACGTTAGCGGCGCGCTTAACACATGCAAGTCGAGCGAAGCGGCGCACGGGTGAGTAACACGTAGGTAATCTGCCCCCAGGTGGTGGATAACGTTCCGAAAGGAGCGCTAATACAGCATGCCGGGG-ATGAGCCTGCGGCCCATCAGCTAGTTGGTAGGGTAATGGCCTACCAAGGCGAAGACGGGTAGCTGGTCTGAGAGGATGATCAGCCACACTGGAACTGAGACACGGTCCAGACTCCTACGGGAGGCAGCAGTGGGGAATCTTGCGCAATGGGCGAAAGCCTGACGCAGCGACGCCGCGTGAGTGATGAAGGCCTTCGGGTTGTAAAGCTCTGTGGAGGGGGACGCGGTACCCCTTTAGCAAGCACCGGCTAAC-TCTGTGCCAGCAGCCGCGGTAAGACAGAGGGTGCAAACGTTGTTCGGAATTACTGGGCGTAAAGCGCGTGTAGGCGGTTCTAAA-GTC-AGTGTGAAAGCCCTGGGCTTAACCCAGGAAGTGCA-CTGAAACTACGAA-CTTGAGTCCCGGAGAGGAAGGCGGAATTCTCGGTGTAGAGGTGAAATTCGTAGATATCGAGAGGAACATCGGTGGCGAAGGCGGCCTTCTGGACGGTGACTGACGCTGAGACGCGAAAGCGTGGGGAGCAAACAGGATTAGATACCCTGGTAGTCCACGCCGTAAACGATGGGTGCTAGGTGC-GCGCGGTGCCGTAGCTAACGCATTAAGCACCCCGCCTGGGGAGTACGGCCGCAAGGCTAAAACTCAAAGGAATTGACGGGGGCCCGCACAAGCGGTGGAGCATGTGGTTCAATTCGACGCAACGCGCAGAACCTTACCTGGGCTAGAAAATTAGGTGCTGCATGGCTGTCGTCAGCTCGTGTCGTGAGATGTTGGGTTAAGTCCCGCAACGAGCGCAACCCCTATCGTTAGTTGCCACTCTAGCGAGACTGCCGATTTTAAATCGGAGGAAGGTGGGGATGACGTCAAGTCCTCATGGCCCTTATGTCCAGGGCTACACACGTGCTACAATGGGCGGTACAGACGGTCGCGAACCCGCGAGGGAA-GCCAATCCGAAAAAACCGTCCTCAGTACGGATAAGAGTCTGCAACTCGACTCTTTGAAGTTGGAATCGCTAGTAATCCCTGATCAGCAGGCAGGGGTGAATACGTTCCCGGGCCTTGTACACACCGCCCGTCACACCATGGGAGTCGATTGCTCCAGAAGTGGCCCCCCAAGGAGTGGTTGGTAACTGGGGTGAAGTCGTAACAAGGTAGCCGT
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/sample_aln2.fasta	Mon Jan 09 08:07:45 2017 -0500
@@ -0,0 +1,700 @@
+>N2726
+LLLAYHVLIPAIHLDLLIGALRDLSLLALLSCLVLLLAVMLLALLQGKGLFRALANLSRT
+NESVADGAHKGTLELVPDLLRILATPRDPMDERLRDQDQRLAVELLTNVRHLIRAPLPGI
+YGYAQTHNTSQDDESRDFLERVRYQGHNFLRLINELLHTSRLPTTENLGEDKEPTDLQSL
+LLEIHGHVGRAKQTRGPEKDPEFPKHTPYAGEPKRLKVELVNKVMSKDRYTPGTKICGAA
+RRNSERLIILVLDTGPGLPPDDMSRIFVVFYRIGEEGHQAALGLAIVKSYPDPHGSTITA
+ECKVAGNTKFKKKPIL------
+>N1397
+------------------------------------------AVLLNRNLIRPLSNLAHG
+PERFAGKTLRLVFDLAQDALRLLDRPLNPLEERLDVISPRVEFEFLSNVAQELKTAITGI
+LGYAAQ-DIALNESPRDYLERAKRPAAKLLRLTHGLLDEN----------EDDSGDLQTD
+LIGSTELLYGLGQVGGQEQD---PDTKPVSGEATPLAGILLNLLTKAGAYTPGGKIVVSL
+RRDGDKIVIGVEDFDKGIPPQAMDVIFKSFYGA-AVRNVVQVPLAELKRVSELHSGSITP
+EHEAGGDTTFAAMRALEGP---
+>N4972
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------------------------DATYLPLILLNVKSTAESYTPGLKILVSA
+RRDGNRVVIAVRDTGVGLP-----RIYHSFYKHGAARADQNVGNAIVKSVVAL----ITP
+DHEASGSTTFPGS---------
+>N3970
+FFIPTEILLLKFDLQLLGCARDEDLKLMLLSKQQLMLTVILLTSLLAVHLGSGLRYLVKS
+RATGKPGVLRLTMEPFPDALRISGDDFNALASKLEDDGPLPVGDNLATVEHPPTFDITDI
+YSYTRELSIRLMGKENVFLGGHKANGNQLHRPFNKLYDSTRMHTHAKLVRVTGLISMDTL
+LRPGTHVLGGLCRAKTGDENR---------------------------------------
+------------------------------------------------------------
+----------------------
+>N3339
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+----------LCQIKTIEMDIDLPITPS---EARKLAAVLRNMKNKAWPYTKGLRIFVGL
+MRDADQIVTTVANTGRGLP--HFERAFGEAYHNV-----MSVGSEIVN--VGMHGGTTTA
+EPEDDGRTTFIGSHQLENT---
+>N1727
+------------------------------------------------------------
+---------------------------------------------------ERRTALTGA
+LG--NVLNAQLEGVAIEFLETRNDETQQLLRLIANFLDKPRLNC-AKLHVDGGPGDLQTA
+LRQALAILDGL-QAQGTEVQSDLPKGVAAV-KATQLPLNLLNVRPNSTSYTDGGAINVAV
+WRDDEVISMGVVDVGRLVPPEKMQRIFRDMYGAG---STIIIGIAVSNSLVTLHAGTIPP
+EDASAGSTTYAASHVLKAAATS
+>N4410
+YLVVENALKTGNALKLLMLNLRQLLRQLMLGNIVHILLVLLLPLLRGCHLSGGLRNVAKD
+VKRLCSTDLRLVFERVPDGLRVRAECRKAVAERSDDTKPHPGGE-----NYHIRSNFTLI
+LGYSVEVSAELSALPVKFLNVGVASDEQLIRLITTFLNSTILKSGAKISLDGEPCELKG-
+----LKKLKGLTPNIGVESQGGLPYVPQ---QGTKLGFILVNEADETRIYTEGGDIFVGN
+WRDTERSTLGAVDSAHEVPPESMELIFRT----GLTRAETFSGLSNKKTVHDLHISTVAA
+QGNDAGESTFPESDVLGAT---
+>N2051
+ILVARPVLPTAEDLELLLGFLRELVILLLDGQLAVQLAGGLLTLLLSCGLLVPLPHVAEA
+VERICIGSVSTVYEAVPDSLRVLAKELEALVERIEEPPPRIAGELLTNINHSIK------
+LGFQKELNGELSSESIIFLEFQGSSPNVLVRLITNFLELSRFKATDKNA--DELIDLQAL
+LYQSLAERGVNTDQKGRHPESNLPKSPA---TNTSLALVLPNQMDSATSYTNGGVIVAST
+YRDDARCHKGVVDTNSKLPPELMGGVFEVMYNTGICRNALFVGLALIQSVQLLHAGSITA
+ELASSNSKTFATSSQV------
+>N3338
+----------------------QLQLLLLNATAATLIFDVLSVLLVGLGLLGPLKNMACA
+GGKITTGSFQTIYEKLGDVLKVLAKPLQAIEEALDNPKSMLLGE-------NGVGTATGI
+MDCPEPTNLELENPAVALLGLERGLAFGLMRLILDFVDRGR--AGGKLVLDGQPLELAEL
+LVQPLDQFEELDQFSGLEVQGSLSNSRPNCEHAAALRSCLHNSTCAEFPYTGGLLILVTK
+WRGDSRIPKLIVETDVMLPPAAPNQIFDKLYGDGQSKERE-VGLKIPKSMLALHIGVITR
+EHESAGSTTFAKTH--------
+>N2452
+-------------------------------------------------ILVPGRNLAKL
+IDRICRGRYRIEYARLPDSQKVLGKHLKSVAELIESTEKRIRNDLLANCNFTFKSPATGI
+MGYPDKLKAALEGEYITFLDNDKSEYLGLDRAIAIFLGSSR----DKVSLDREAVDVEKL
+LKEGLEVLNTIKEQKGREFENNLPDKRPG--SGTPLPLILTNLYNSEATYTNGGKILISE
+WRTDE-LPKFVVDAGSQLPPEPMENI----YGTDKVRNEHTAGLDILSSVIALHIGTIAR
+EHESAGSTTFATSKAV------
+>N1718
+PLVTHGKVLIGVIIVLLLAFLRELEQLLMLLMMVMNMLILLLILLMGRSLITPLRNLVQI
+DGKITNKDKRAVSDKVHDKARVKAKAFKPRGDKLDADEPRVDTNLLVNTT----------
+-DYADPCGGQLQGEEPQFKDYGKLQEASLDRLLTEFLDFTRLGAGGGIRLDREPVELQVL
+LDQGAP-LRFACFNDDPDILRDFPDKVYWMGALDELPL---LFKNDGGDYTPGTRILVAI
+WRDVSKATIAVGDPGPGMRNQD-----------RGIRPSSELGLAIYSSDVALHSGSITP
+NAGVAGNTSFPQNLYYET----
+>N1866
+------------------------------------------------------------
+-----------------------------------GEGPRMDLAVLGKVSHGAKTEVTGA
+L--ADVVGAGLNGEGPDFLKIHKIDEGQILKLLTEFLDYSRNDAGSNLGLEKQAVELQTL
+LEAGLQILRCLGQQT-AETVREEPEKAFVV---TPLPGALLLGRKEESPYTKGDKIFVSR
+WREGDSADIQVGDTGLGFPPQQMDRMFSSHYHEESMR---RDGGAICKSISTERTGTISS
+ENEARGNTTFFPAG--------
+>N577
+-----GVLVVSNILDLLLYYLRHLHVTRLLGMCTKNLLPHLLTMIMNKKLWKRLRNLTRD
+EYTAHIGDLSAVLESLADSARVAAKQLKTIATKLDGEEERVEA------THQQQAADTGI
+NGYANI------------------DAPKLLKLIGGLVNSARLNAGDNISLSKEMVDLRDL
+LSEGLKTIKDLNQEHGTEQVRDAPD--NPLGDTAELP--LLNYSRPNGVYTAGTRIPVSA
+WRDGERVENAVGDVGIGFPLNELDKIF---VRMVMVRPKAAV-LALESSVIALHLGTVTH
+QHEATATTTFPGPIRK------
+>N4255
+------------------------------------------------------------
+-------------------ARVVGPPLKPIEEKLDEEPAKAPVGLLVTNSQL-QKAKTGT
+LGYADIMGPQLSTEPKDFLKYLMIDAKQLVRLIDEFLNATRLDTGENVALDKGMVDVHHY
+PDGGLDNLNTLNEEKATEKIKDAPDSAVEVGDGTELPLALLNTNILNCCYKEGDKILVST
+WRDGDRGEINVGDTGGVYPLQEMSRIF---VRTVVKRTTEDT-HALEKNIVALHGGTVTK
+EHEDAGTTTFGGPEKK------
+>N4474
+------------------------------------------------------------
+------------------------------------------------------------
+-----------------FLATNRVETQTLTQLVNDFLNAHRL--GAKTSLNSDPVDLTQL
+LFATLDNLHIVSQCKGTETDLDLADTGNLVGD-GSLPVILLNLKKGSSSYTSGGGILVSI
+WKDGERVVIGPGHTGTGLPPENLERIFC-----GASRTAQAVG-AIVKNVLALPIESISG
+DHQAAGSAAFPRSDVLHST---
+>N3014
+------------------------------------------------------------
+------------------------------------------------------------
+-----------------------------------------LSADAKLALESSPLDLKAL
+LQQGLEELNWFADSAKTESELDLADKTDTR-DASGLPLILLNLKKGAAAYTSGGTILVSI
+WQDGERVVIEPNDAGNGLPPESMVTI----YRQATTKAGLAV-NAEVKDVVALHLDTMTP
+IQAASGSAAFSQPHILS-----
+>N3243
+--------LVQVDLELLPALLRELHLVLLSGQVVLLLLVLLPALLLVRALIHPLRSLARS
+HDRISTGILRLVKEPKPDALLPMGPLMAPMAERQETSNPRTAEGLLADVHAVMKTSENGL
+LTCGDNFNVESCDEPRNF--CVGKSGDELLRLVADFLGTSRVDAGVKLALASETVDLHSL
+LRKGVDMVQEEHDTMAIDFEQQVVEASAG----TLGSLALKEALTEEALYTTGGAIITAK
+KRDATRCVTTVGNTGKGFEPEVMGKIFLSFYRLDVSRVPLTVGLAVTKSVLALKVGTITP
+QHEADGATTFVVVYYVEAISDL
+>N3234
+---------ESNTMGLLLANLRELQLVLLSADICLLLYILLLELLLGRQLKPPLRNLCRP
+HNPLQTGLDKEVQERKPDVLIPMGKLLNEKSERLEESYERLAGGLLTDISNADRTSKS-L
+LGCACNLNLDLCDDPRDFIEAADNTAHDLMRLVGDFLDASRISAESKGTLASEPIDLQDI
+LKKAVSLVASLKA-----FDSDLVNPCPGLGDSTHGPGKLRNQRVGEPCYTAGGKIVVGV
+KRNPSRTGFYVEDTFEGAPPGMMERILLGFYTIGIIRVSLEVNFAIVKSIEAINVGTCTP
+KRHADGQTTFSANYC-------
+>N500
+VKVEGSVLSATLTVELLLAYLREMTGVLVSQNTCLLLFVLLLALLLGKDLKDSLRDLDKP
+HERIKLAHQKLVEVRHPDVLIQLGRLLNPMAERLEESNERIMGGLLADGSSALRTSGSAL
+LGCATKLNIDLCDEERAFQEFPDLGASELLRLVANFLDTC---STITLKLAAGPTELQEV
+LRAGASLAAS-NSAKGLGFNQELVNAPRSLGESTKG---LRNERPAESRYTYGNRILVKV
+KKEAHRVVITVGDTGRGLPPGEKERIGLGFFVIGITKVDADNTLAIVKTVATLKIGSITP
+DHESNGQTTFTANYELDGTSQA
+>N1824
+AIVEKPGLKAGLTIELLLGYLRELNAVLLPADCCLLLFLQLLVLLLGRELSESLRNLAKP
+NEKISTGQHKLVHEAKPDVLIPLGKVLNPTAEKLEDSEQRAPASLLADGNPANRESSSGV
+LGCAGKLNIDLCDTARDIQESAEQGVAALIKAVYSFLKAP---EADKNKLLSQPVDLHKI
+LSPGVFLVSGYKSTH----DEELVNEPPGITESTEGELKLKNQSAVIGSYTFGGPILVSV
+KRDPQRVVITIEDTGNGAAAGEMEKVLLGFYQSGIACVDLHGGLAVTKTVSALKVGSMTP
+EHEPEGHTTFAINFTL------
+>N760
+LAVDEHVVIADLTVELLLAYLRELNPVLLTQACCLLLFVHLLALLLGNNLKAGLQNLAKE
+TERISTGHRKNVNEKQPDVLVPLGTVFNPVPEGLEQTPERVGGPLLPEGNDLYRTSFSQL
+LGCGGLLDYELCDCVHDFQEGAGQASASLAKLVYDNLDDN---ADGKLKIESGPNDLHAI
+LRPSVCLVACLSS-----VGGELVEQPPEFTQGTVGPAKLKNDPQMEGAYTYGGVIHASG
+KRDPHRVLIRVEDKDAGLPPGQMDRVLLGFERVGVEDVDLKNGLAIVNAVDALKIGSISP
+EDEGDGETTFYGHYCLDGTIGA
+>N3270
+LRVDDGVVKAEVTIELLLSYLRELNAVLTSEECCLLLFVQLIGLLLGKELKDALRNLARH
+HEGCSTLQQKKVAEPQPDVLIVLGKLANRMAEKLEQSNERVEGGLLPEGNSALKTSASGL
+LGCGGPITIDLCDAPREFQEPGAKQAHELSKLVYIFLDAS---ASDKNKLEDEPIDLHKI
+LKPGISVIAALSRT----VDGEAVDEPPSKTQAKEGPLKLKNHLSSEGAYTYGGSIFVSV
+KRDPYTVIISVENAGEGHPPGDMGRVLLGYYIVGIASCELAGGLAIVNSEAALKVGSITA
+KQEGVGQTTFYENYHLD-----
+>N2473
+--------------------LRELHAVLLSENCCLLIFQQLLGLLLGSELKEALRNLARA
+HEQITHGAQKMVAEAQPDVLIVFGKLANRMPEKLEEADESVAGGLLPEGNRQLRTAASGL
+LGCGGPITIDLDDAPRDFQEASSMSAGELVKLVYDFLDAS---SVDKNKLENQPTDLHNI
+LRPGVSKEAYLSR----EFDQELVDESSTITQVEEGSLKLKNHLSLEASYTYGGTILVSV
+KREPQRVVISVENAGEGFPPGDMDRVLMGYYIVGVASVDLNDGLTIVNIVAALKVGSISA
+KHEGEGQTTFLSNESID-----
+>N2693
+PAVENVVVKAQLTIELLVSNLKVLLAVLLSDRVCILLFIELLGLLLGKELKQPLHNLAKH
+HSHISTGQAKKVAEAKPDVLIVFEKFANRMAEKLEELDERTTGGLLPQGNRALRNPGSGL
+LGCGSGSTIDLSDTPVDFQDQNGIEAKGLKKLVYDRLDAS---AVSKNKLMEARTDLHKI
+LRPGVSVEPSL---KGLENDQELVDNPPSTTEVKQGQ-RLINLLSLAGFYTYGDAIFVRV
+KRDPQRIVVSVENGGQGFSRGHMDSVLSGYYILSLSSVELQGGLAISNIVSALKVGSICP
+KHQADGATTFYGGAD-------
+>N3782
+PAVEEGVVKAELTIELLVSYLRELNAVLLSDKCCLLLFIQLLGLLLGKQLKQALRNLARH
+HEHVSAGQEKKVAEAKPDVLIVPEKFANRSAEKLEKTDERTAVGLLPQGKRALRTPSSGL
+LGCGGGITIDLSDTPVDFQEEGSRGASGLMKLVYDFLDAS---AVSRNLLQNQPTALHKI
+LKPGVSVEPSLSRTK----DQELVDNPPTPTQVKDGPTELQNHLTLADSYSHGGTIFVSV
+KRDPQRIVISVENGGEGFPRGEVDRVLSGYYMVGIATVDLQGGLATSNIVSTLKAGSICP
+KHEAEGATTFYGGDDIDG----
+>N3195
+VIVEKGVLLVGGDLQLLQAFLRELEVIRLASEICLLTFILLLTLLLGKSLVEPLRALARK
+HDRVTEGEKKLVKDKAPDQLIPADKLLNPMEEKVEEDTPRIADGVLTDVGSAMRTAHSGL
+LGCADTFNPDLCDEPREFQQGADALAHQLLTSHGDFLEAARVLGDANLSLAAEPADLQGL
+LKEGIALGASLKE-----LDRELVDEVVAEGDFAHGPLKLKNGRQGAPSYTGGGHILVSL
+KRDGSRAVLAVDDTGDSMPPGALERIFQAFYRIGIARVDLDVGLALVKSSADLKVGTITP
+QHDSDGQTTFSMDYY-------
+>N1514
+--------SVDADLKLLVAYLKELNLVLLASDICFLTFILLLALLLVKALEDKLRNLARS
+QDRISTGDHKAVDQHRPDPLIPVGKSLNPVSENLEDAEPRLLGQLLADVGYPIKTSNSGL
+LGCALRININLCDEPQNFAECRDKCAQELVRLVDAYLEASRVGASAKLT---EPVDVHEL
+IEQGMSLVAGANEGTG----RDLVEKETSYGDNTRGLLNLNNSVAADSAFTAGEGKLVSG
+KRDGHRVVIAVQDDGGGMNPGEMKRINVSFYRIGVTRIEI-VGLAIVKSVSALKVGTITP
+QHPADEQTTFCVGLFIDATSEA
+>N3523
+MVTGGGILQVGGDLKLLVAYLRDLYLCLLTASICLLAVFFLLALLLGRELTSPLRNLARP
+NTRIAVADKKTVKEFPDDALVPVGKSLDPKPEKLEEPSPRILGGLLGSVGSPLRQSKSGL
+LGCAHGFNIDMCDTPQDFGEVQDNCEHELMRYVADYLEAERVSAGGKFSLTLDPVDLQAL
+LGAGMSLTA------NLEEDRDLVQAQPSAG-IMHGPLSLKNALAGDDSFTKKDKILVQG
+KRDSHWVVIDVQDEGQNLSPGAMQEIFIVFYRIGLARV-LLVGVAVVNSIIDLKVGTIGP
+QHDADGQTTFALNLY-------
+>N4513
+--------TVTGDLDLLVAYLRELYLCLLASSICVLTIFFLLALLLGKDLQDPLCNLARP
+HERISGGDKDSVKEFPPDALIPVGKSLNPTPEKLEENNQFILFGLLGSVGQPLRTGASGT
+LGCAHRFNIDLCDLPPEFAETQDKCAHELIRYVADYLEASRVGAGGKLNLGLEPVDLQCL
+LNHGMFVSA------NLEEGRDLVEAQPTYG-TTRGPLGLKNDLAGGGSFAAGDNILVSG
+KRDAHRVIIGVQDDDMGMSPGGMGQIFISFYRIGVARMNLSVGVAVVKSVIALNVGTITP
+EHDADGQTTFVLDQYNDETT--
+>N4118
+RFVVPFVLLVKPPFALLLPNLRELGLVLLAGKLVLLLIVALLKLHLGSCHCEPMFDFAHE
+HDRDAGGHQRLTRERDPDSLQPKSRLMASMTERIEETVPIISGGQLADVSHDKRMAVSGH
+AGCANDFNIDICDEPSDFQHADSNTGHELMRLVSDILQDARVIAGAKMAL---GFDLLEL
+LPEQIDLVATRSEAK----DAELVTMPPPTGKSTHLPLDLSNATTIEPVYTRGAKILSSM
+QEDAGRIAIKVDNTTYSLPRENMDRVFLNFYRIGDGFVDLAVGLAATKPVLELKIGTIVP
+QHEAAVKTTFDVDYK-------
+>N2790
+------VLLVSLGFALLLAWLRELKPILIAARRVFLLIIHLLALLLTKALIEPMFNPPRQ
+QKRICPGHQRSLKESESDVLIPMSDLLATLTERLEESYPTLGGGLLSALSSPTKTSKSGL
+LGCADSTKINLCDELRDFQLPHAKTSHELLRLPSDFEDNSKVTSGAKIALGARAVDLLKL
+LFQEVELA------KGPEFDEELVDGPAVVG-DKNLPMSLGNATRTQTPYTPGGKIATRM
+KRDADKLVIKVHELGGGLPREYHERFLSEMYRASVAYV-APVGLAIVTSVVELKDGTITP
+QHDSDGLTTFPVRYFMDAAGTG
+>N2003
+------------------------------------------------------------
+----------------------------------------------AEVSHVARGSKSGM
+LGCAHRVNIDLCDEPKDFQEGDGSAAQNLLRLVEDFLTTSRKTSSAKMGAGAAPVDLLSL
+LGEEVDNVG------GAEFDEELVEAPASVG-DTTLALNLANMRTGESPYTPGSRIVTAM
+KKDAQRCVIKVDDTGEGLPREPMASIYLQIYTIGVNYI---VGYAIVKSVVILKVGTITG
+KHEASNQTTFVPSYSLD-----
+>N4744
+--------LAEKGFALLMGFLKNLEGLLLAGPLVLLLVVHLLALLLGPDLVNPLFNLAQE
+HSNVLPGHKRIGMERIPDALVPKSGYLAPLSEFLEASVPRVAAALLAEVGHLQRLGDSGM
+LGCGHKLNLDVCDDPRKFQDPSGKGAFELPRLVSGVLNNSRVDSGAKMAEGPAPVILLPL
+LGEEVELV------IGTEYDQELVETSPNVGVNLPLKVELVNQVTGKGHYTPGSRIDTGI
+KRDAKKCVIGVDDTGNSLPREGAQFIFVQVYPVGIQYENA-VGLAILLSPHELKVGTITS
+HAEAEGQTTIAANYNLDATANA
+>N2799
+AFVQDGVLLAPTGFALLMGFLKELEGMLLVGKVVALLITHLLELLLGPNLIQPLFNLARE
+HEHVLPGSARKGTEQSSDELEPKSGLLAPLTEQLEQVLPRAAAGLLKEVPHVLSIEMSGM
+LGCGHKSNLNLCDDPKEFQEAQGKIDNELGRLVSAELDNNRVLSGAEMEDVPAPVILLSA
+LGELVDLIASRSET---EFDQELVESPSGVGVDLTL---LANLIGGESLYTPAGKIVSAI
+KRDADKCVIFVDDKSSNLPREEAEKIFLKIYPIGVNYKNVDVGLAIVKSVVALKMGTITS
+QAEAEGQTTFAVSSTLTASHSA
+>N3677
+AFVKDEVLLAPVGFALLMGFLKELQGMLLVGKIVLLLITHLLELLLGPNLVQPLFNLARE
+HEHVLPGSTRKGKEQSSDALIPKSGLLAPLTEHLEQVLPRAAAALLAEVSHVLSIEMSGM
+LGCGHKSNLNLCDDPKEFQEAPGKQDNELGRLVSAELDNSRVDSGAEMEDVPAPVILLSL
+LGELVTLI------RGQEFDQELVESPSGVGVDLPLPTDLANLITPESLYTPAGKIVSNI
+KRDADKCVIFVDDKSSSLPREEAEKIFLKIYPIGINYENVAVGLAIVKSVVALKMGTITS
+QAEAEGQTTFAVSAT-------
+>N3997
+------------------------------------------------------------
+---------ILVKESLADALIPPSKLLKPKTESLEDNVPRIKAGLLADVSNAMGLSFTAL
+LGCAPAYGIDLCEESKDFQEETANDSHNLVRLVSAFLEDS---AGAKIALGIQPVDAQDL
+LFENVSLVGVR---RGVEWDQEFVAASPMVGGTTHLPLGLSNQVMGVPNYTP-TKIINAM
+KRDADRVAITVQDAGMALPRSNMEQICQQFYRVSIATSDVHTGLAIVKEVTPLKVGTISP
+QHGANEQTTFEVNYGIEATSKA
+>N4446
+LFVSNGVLQLNIDFGLLMNYLREVDLVLLYKTAVILGFMALLTLLLGRNLIN--LNLTRQ
+ADKESTAHERKVVGRKSDALIPKSSVLNPLTESLEESGPHFGGGLLADVSNLKRTSKSGV
+LGCTDKLNSQLCEEKRNFDEQDAKENPALVRLVNEFLRDARVSSPAKLA---DPADVQEL
+LKEKVVVIARRGE-----FGQELVKVPPSVGSSGPLPLNLKNELTGLAAYTPGGSIDTST
+KRDGDRAAICVEDVGHALPREFMSKICHLFFRRGVAFEDEQVGAAIVKRVKALTVGTFTA
+QHDGDGDETLAIAINLDATT--
+>N4505
+QYIGGSVMIVKPDFGLLVAYLREFELVAFAGRNIVFRIALLLIMLLNKDLAHPQLDLARA
+NQKVATGQGRLVTERQPDALTPKTSMLKPSGDRMDESVPNITSGLFAAVSHLLPIGLSGL
+LGCATKYNVKIAEQQTAFHDEFAGTTHDLLRLKEAFLEDTRITKGAKIPVDHQPVDCEAE
+LVERTELADNPGNPHGVEFDEELVAEPPT-------PLILNNNLESEPSYNSGSADITSN
+KRDAERVARQVGDVGVAIPREKMSKVANKFFPVGVAFVKLAVELVATWAVHSLKVGTITP
+QHPGDGNTTFCDTFNLHGTTIA
+>N3800
+---------------------------------------------LGGGLVNPQLDLAKD
+REKISTGHGRLVKERQPDQLDPKSKMLNPESERLDESTPKFGGGLLAHVAHVLRTSIGGL
+LGCALSLNIDLCEDPDDFHQEFAEGAYDLLRLSQAFLEQERVAAGSKIA---EPVDVQAL
+LGEHVEIVDKHAE---QEYNQELVAQGTSLGSQTHLP-PIKNILVAEPAYTPGVKIITSL
+RRDADRVARSSDDVGTLLPRDNMSKVPPEYFRVGVGFVDFVVGLVTVKSVQDLKIGTITD
+QQPGDGHTTFCGNFN-------
+>N606
+AKVGNFLLALKVEFNLLLANLRALLLVLLAGREALLMLVRLLALLLGVALATPLWNLART
+HSHIKTGHPRAVKEVRPKALLAAGKLMHPMTEQLEDAVPRHGGSLLGEISHSFRSNPTGL
+LGCAEKSNTALCEE--EFKEGYDDAPFSLVREVVNFLDGSKVDAGASLSLEADPVDLQGF
+PSEGATLAACLNE-----KSQMAVIFGPTATEGTKLPLLLKNAMTGEAQYTCGFTPIVAM
+KRDENREGIEVADTGPGGPKSQVESLVILYYKAGIALGDLSPGFATIKSVAKLKVGTITP
+LHEDNNHTAFKLTYNKG-----
+>N2450
+QKVPSGVLIVPLDFNLLLAYVRALAAILLEGAEVGLMFVRVLKLLLGRSLIAPLSNQARA
+QDRIMTGHLPMVKELHPDPLIPQGRQLDPLYEKLEDGLPRVGSGLLADIAHSMRLEASGL
+MDCAENFNIILCDE--NIEEARDSPAHSLLRLVPGFLDDKRLDGGAKLSLGTEPVDLQEV
+LVEGVQFVAP-SQTKGVEFGTEIVEGGPGIGDSTQL---LKNQISINRTYSAGGKIFVPQ
+QRDATRVVLAVEDDSTGLPAEQMQRIFSTFYKLGVPIVGLSVVFAIAKSLVVLKVAAVTP
+EHEANGQTTFAFNYY-------
+>N2206
+-----------------------------------------------------LRDLTSG
+QDNISAGNVRADMERADDNLTPLGKPLNPKNDPLERTPPRSKQG----VSHATHSDVTGV
+LGSPDALNVELYNEPKDFLSKHTKSM-----SVNDFLEGQRLKVGAKKVLASTPIDLLDL
+LADGVDLVLALFMTEGAEFDHELVAGVVGDG-PSHLPLALLNMLSDENQYTPGAHIIVPL
+KQDGDRIVTAVLDTGEGAPPKAANRLYLSFYAIGAERVDLIVALANPTNVVILRPGTITS
+EHESEGDTTFAAKLL-------
+>N2963
+--------------------------------------------------------ISRG
+VDQVSAGHLRYMAERAPDPLVPMGNLLQSIVASLEDDEPRV-------VTAGMRTSVAGV
+LVCIDCLSENLCDNKRGFLERKKREAQNLYRKVSDTGTESRLGMGPKLGLARSPVDLQVL
+LKDGVSLV---SQVDGVELGVQLVQGKAGDGESAHLPLELL-HLTENTPYTAGGVIYVTS
+KRGGGRLKTDVDDVGKGAAPENMEPIFGQFYKLGVAQVRLHKTLSIGKTVHPLKVGTVSP
+DREAEDDTTFGAALELSGTAAA
+>N3558
+VNLISEVLIVPTDHDLLLCYLRELPLVLLGGEVEDLMIVLLLVLLLGPLLLDQLLHYTWV
+TDRASVGHIIIVDEPQPDALLKIAKLLGPMGEREEKDEPRVCSGLLVAKQPLMRTQIVAI
+LGCAAVASVQLCDQPRGFLGVNKANAQDVARMVSTFNKDDRLDVGAKLS---AVYELQLL
+LSEGHALYASL---EGLEYQMEVVQMNPSAGESAILP-TLLNSEGNDSPYSPGVEIIVCM
+KRNFDRVPRTVEDSAEPLPPDGVESITAAFYKLVIARVTGQVSVSIVNSILALKGGTVSA
+DRDDEGDVTFDINEEFDATQKV
+>N3863
+FSLVKAVLLVPLGHDLVSALLRSLHLVLLGGKIALLMIVLFSVLLLGPLKVKDPKHYTWG
+CERVSTPHVIFVDEPNGDALLPIAQALNCMAERGEVNEARVCGGMLGDVSPLARVQATGV
+LGCAEVMSVESCNHPKNFLESDKTSGSKVPKKVSTHSEADRLDVVKKV---GSLVDLPEL
+LAEGVDLS---SQADGIEYTTPFIANPPASGDNAVLP-TLQNNQNQEKPYSTGPSKIVKL
+QRDKDRVVREVEDSASNLPPEEVNLITSGYYKYGVAVVPVLLNATITKSVVSLKVGAITP
+EQQASSDTTFKLSDQ-------
+>N3117
+------------------------------------------------------------
+--------------------LPIAEVLNSMAEREETNEPRVCGGV-GDVTPLARVQITTV
+LGCQDIMSVELCDHTRSFLESNKSSAQNVPQKVSTFNESERLDVGKKLS---SLVDLLTI
+LSEGVDLAASL---DGLEYTAEFVEMPPASGDSTVLP-KLLNSHNQETPYSPGNMIIVAM
+KRDGDRVVREVEDSAHGLPPEEVNTI-ASFYRLGVAVVMLQMNASIINSIVSLKTGTITP
+DRDNEGDTTFDISEELDAAAKA
+>N700
+--------------------------------ELALLLLTLLQLLLGQELVPPLSNLDKA
+EATIDQGQIKKVLEKLTDGLRIAADVLDIRNEELEEAENSNENVVLAHIAHHLRGADTGI
+LGYTDIINPELRTGGRNFLGGVKKLCHQLGRLRTGFLESSRLKAVYKVGLDADNVELKAL
+LLPGAALLSHL-----TEQQTELPETPHIDGEGTDLPKAILNQLRATRMYTPGEKIVVSI
+ARDDARILVVVEDTKADSAPE----------RGSGTRHEQAVSHAITKDTVTEHFGTNTP
+SLSCGGSTTFSVVTIY------
+>N3869
+----------------------------------------------GFHLSIAQPNLARC
+EGRGSKGHGSVVLERLSDGLTILSDALAAEANKLEVTEKRLGYDL-ANVHQEVRCVITTI
+LLYSNAAATEFTGTNKEFLNKVKSDGRQLGKLLEDFLESGRLHAGPTLCQECEKVDLEAL
+LLEGVNLL---SVSKGRGIQLAIPKPPPLVGSLSLLTLPLLNMSGPAGGYTGGDKIAVAF
+NRSGHRVTVGCEDTGYG---------VEGLYQGAKTKGEVSVGLAIVKDVSILHDGSVAT
+EPSDDGHSTPGAKKE-------
+>N342
+--LSPAVLQLLMDANLFVASLKELIMLLLGAYTVLLLLSLLLELLLGALLLTPLHNLPKA
+DGHLTKGLSEQGLESVADGPAIIAKGLGAVSEDVSSGHPKRGFAL-ANVNHGGRAKFASI
+LSF-----------PREFLSFARKNGIQLCALMEAYLKQGRLAAGTSLCQDCLPV-----
+LMEVVGLLSTLDPAVGTSRHKKAPNDPQLSGTATTLPLSLLNRIAEVGVYTPGNLIINDL
+SRDAERVVIALEDAAGGFKPDE------GFCQV---------GLDIMKGLALLQSGSVVP
+TEGAGGNTTFYPIGDV------
+>N1357
+------------------------------------------------------------
+---------HPVLERLTDGLPIDARELSALQDVLETARPRLHFALLAHVHVNTRYVYTGL
+LSF-YIVGAKFKGEAREFLNTMQGEGLPLLRLLDDYLD-----------QHCHTVDFELL
+LLDGVGLLSGLSSTRGKTINVHVGDSSPLVAKATRLPLGLANKLAIGGSYTPGDDITVTF
+RRAGRRMTEQVASSDSSF---------------QAVKPDGGIGLAIVESMKYQQNGCIAA
+ERDAGGDTNFGIKRDFEA----
+>N3856
+------------------------------------------------------------
+--------------------------------------------------------VSGI
+LSYAKSLGVDLAKEGKEFLDSERKQGQPLIRLQENYLENSRFEAAATLCSGSDHADLGVL
+LHE-VGLLPELSATRAKARFSGLPKPKDLVGSATELSLSLTNKASDGASYTTKQSIIVAF
+LRQLERVAAEVEDTGPGAPPDSMN---AGFYVSGASK----VGLAIVKAATVLHGGVTAV
+TEEAGSDSTFGHQRVGEAT---
+>N4686
+----STVLPIPPDAILFCALLRRIVTLLLDAFLIEHLLVYLLPLLLGLALLQALRQLAGA
+GARVSNGHSRGAIHHIKTALSVLATALNSMAEGLESAKPQVTFALLATSYHEVC------
+-KYNGAIGVDLKTNTPDLLNESKANGEELIRHLTELLSKNRLEAGAAVCQSCELSDVRIL
+LLAGSALLKILCTDGGKALSLDGPKCPPAVGGPAPVSPAIVNEMTDTGAYSSGDPIIVGY
+GSDEE-DIKAATPTAKGPVPNDL----------GPWKLKALVGPALNSSTRSLHGGSIAH
+EHDGDDNVGFKSKSVFEATN--
+>N2092
+------------------------------------------------------------
+-------------------------TLNAAAENMQSARPRFNFALLEDADHL--------
+--YLEHLGIELVDEARGALNDGRDNGVGLGRLLEDYMEKSRLESHAKTYQDA---DLPAL
+LAELQSLLGLLRTTRGRSRDLSIPDTPCLVASATELPISLVNTQNCAGTYIPAHVIFVAF
+SKTGIKATNGVAEVGNGLPPD-------------ATKAKSAGG--ILASSSGLHGGAIAH
+E--SQGGTAFSTVHIWETTNTG
+>N2277
+------------------------------------------------------------
+----------------------------------------VETALLVEVAHDVRCVETAV
+LSYAIP--PELRDSEKDFLDDRKNPGQQLTRLLDAC------------AKDCEPVDLQKL
+LLRGVGLLMSLSTTKGVAMELALPFPPPFTGASTELPLALFNSLFPTGNYTQGEAIQVST
+ESDGDLKAVNVDDTGSGLPPDD---VSLSFYHANATDTGA--------KVLVLHGGSLAP
+DHDKGADTTFHSKHVLEAAA--
+>N2000
+------------------------------------------------------------
+------------VENAKDNLPVAAAKTKKLAESLADARPKINDALLVIVSHRLKCLVSGF
+LTYANRLGTQKGDSDREFMNGGRHSVQELGRLLDDYLVATRVEPSATIRQDSGVIDAKSL
+LLEGVGLLST-----GFAAEFNLPDPPPNIGEASQLPLPILNRLSKAKSYTAGQPIQTSM
+SREADLKVTVVDDSGRALS------ITVNFYHKNMTSTQAGINLT---SRTVLHGGNVAP
+KQTLGGDTTFGGKTILQA----
+>N224
+----------------------ELISLMLPNKVVLFLLPLILALLLGFLLLRALSDVARP
+GPWFSAAVIHSVLERLTDGLKILAKNADPLAEANENGKPDISRPLLLIITHSVYCVVSGI
+LSYTNLPGKELKDEERAFLDDERNKVQQLLRFLDDF-----------LGGACAPADIDSL
+LLASAELLSALSTKQSLEAGLLLPKSHQVLGKYAQLPLPLLNVLVRAGRYTAGDGIQVEV
+VRDGEFLVILLADTGRSLPPAQMPR---------------AVGSNIVKTVTVLHGPSIAP
+EHNIGGDKGFGTKAEANVTGSD
+>N1851
+------------------------------------------------------------
+-----------------------------LAESFELTEARPKEPLLVNVQHELRPTQIGI
+LSYANKLAAELRNNNQQFLDAGRRGGEQLTHLMGVYLDTSRLLAGAVLAQDCE-VDFEAL
+LLDGV------DATKGVAHKLDLPHPFHLAGEASQLPVLLVNKLNANGAYTHGQAITVAL
+TRDGDLVIIVVEDTGRGL---------------GSNRSEAGVGLAVPKPVTVLHGGSIAE
+DLEAGGDATFGVKHIL------
+>N4160
+------------------------------------------------------------
+-------DHRQVLERISDGLPILATASPPMAESQEATKPRRGPSLLVHVNHEARCTSTAL
+ESYKNGMGAEKKDEHRGFLDEKSNEGAKLARLLDGYINCS-----PALEQNCEQVDLKSV
+LLEGLGLLATLIVL-GVAAEVDLPPATDLAGHATQLPLALLNKVTSNDGYTQGDSIVVLM
+SRKGEIMSILIEDSLAGQPPK--------------KKDEGTVGLAILKSLGVLRGGAVAP
+QSDNGGDSTFAIDH--------
+>N1290
+------------------------------------------------------------
+--------------------------LNPLAEALEAAMPRYATALLVHVNIELRCGLTGI
+LTYAATLGVELNEDAREFLDHSRADTAQLIRLLDDYLDGQRLQETANRGQDSDQLDIVVL
+LLSGVGMPAEIV----IAIQRLLPTVSDILGKGADLRLPLNQKVAPAGGYTPGDAINVAN
+TRDGELLTIMVTDTGIGT--DIMTSIAGPFYH-------EGVGLAILKGIVVLQHGGIAA
+KHGKGGETTFK-----------
+>N4551
+------------------------------------------------------------
+---------------------ITEKTANPMLEDLEPPKDEINTGLPGSVSHEPRCVVTGI
+LSYGPHTGPELTGFQRTFLQRMSRAGTALLKLLDKYVDSLRVKGAAKRVQDCNGADLDLL
+LLEGVHLSPSLRASRGVSVPLDLPSPAPVVGRDGDLPLVLVHVKTPVVPYTEGCVIIVAD
+GRGGERVVVCVEDYMCSLPPDD-----------AATRARKATLVIDAKSVAILHGGPIAP
+KHQLAS----------------
+>N1223
+------------------------------------------------------------
+--------VRYVIEHLTDGLPILNNPLSPLAAVLEPLKPNITSGSLSKV-HK-----SDI
+LRYDHEYSKELQDHPREFLDGARHG---LMRLVDDYTEANPLALAAKFVEDVAPQNLDCV
+LVTGVSLLPGLSVTRGPSVETSYPTIAPLLGTQTELALLLSNKEEAEAYYTEGSHIAGGT
+MVDAHRTLRLIEDNGPGMPPED----ACCYYHM--------AGLEMTREVTLLRGGTLAP
+HHESAEQKTISARG--------
+>N4823
+------------------------------------------------------------
+----SKGNVKAVLGNLADGLITLAKYKSPMSDGLEGAPQKISAALLENVEHGLRYLLTGI
+LSFTHKVGTELTEDAHEFLDAARKGGQSLLRLVDKY-------AGAMLVQNEGPIELEGL
+LIQGVSRLSALSKFRGLTVQHDLANQPPLKGASTQLALPLLNRLSKTGGYTPGSLIVVDI
+SRDSERTMIVIEDTGWN-------------YRTSAVKRKEQVGLAPIRSVAILNDETIAE
+TNTPGGDTTLALKDF-------
+>N5
+------------------------------------------------------------
+-------DFRMVLERLSDGLLILAPVMTPMGEDLETPKPVICALLLANVRHEDRCVITGV
+LSYAQWIVSKLKDEAMEFLEVVRK--------LDEFLHESNLEPGAKLVQECGPVDLAKL
+LLEGVSLLGVLNKTRGIALDLEFPNEPPLTNKSAGLPLPLLNNIVSAGPYTPGGKIIVAI
+SRDGERTSITVEDTGPGLPPEDM--------------RDVAANLAISNSVANLHAGTIAE
+ESNGGGDTSFGGKHILDE----
+>N4640
+------------------------------------------------------------
+--------------------------------------------------------ITDI
+LTYATRIGTELKDQTKEFLDGFPCDSRMLRRLLQDYLQGGR---GDKLVQECNTVNLEDL
+LLEGVAVLTKLSATRGVAVDLQAPNRAPLVGQATGLPLPLLNKKAEQGPYTLGSKITVAL
+SRGGPRIVTKCADTGSGLPPEEMNR----------FKPPEGVGLAIARTVGVLADGSVAP
+EHQAGGETTFAVKHTLQT----
+>N3489
+LLLARLDLKVIMDPALFMATLRTLKTLLLQEYSVLLLPALLLPLPLKLDLATVLKNLVRP
+KAKETTGTDKIV--RVTEGLLVVPVTLPPKEEALEKPISRIKSSLLAEV-------LTGV
+LTYVTRAGPDLKNQVMGFLDTFRYDGRQLWRLLEEYLE----------VLDHNTVNLEAI
+ILEGVSLLPALSKTRGPAVDLELPKRAPIVGHNTGLPMPLVNVVGGAGGYTNGSGIVVAL
+SKDGDKIVIGCPDTGDGLPPAEMDCVEDRFYH----------EIAIIRTVSVLADGTVAE
+HHEAFGQTTFSPKLPLQGAN--
+>N4604
+------------------------------------------------------KNLIRP
+NARISTGTGKLVLEVVTEALSIVAKHMPPKVETLEPANSRFTNDLLAEVTHDLRCVITGI
+LTYATSVGTELRDQTEEFLDGL------LQRLLDEYLAGGRLAVTDKLVEECNLVDLEDL
+LLAGVALLSNLSSSRGQAVDLELPEKAPLFGQASGLPARLLNEFSNAGTYTLGARIVVAL
+SRDGDRVVITCPDTGPGLPPEGMEPVEDPYYH----------GLAIVRTASVLTDGTVAE
+DHEGGGQNTFTVKHTLQA----
+>N2778
+------------------------------------------------------------
+--RQDTGHFSLVLEKGADGLRILARDLNPIAEGLEAGKPKTTANLLVKVTHDAHCLDTDI
+LAYMPWLNHELNDANKD-------EGKQLIRLLNNFIDISKVEAGAKLSDDSHAVQLEGL
+LIEGLQLLKTLSKNPGIPFRGELPAPAPMVGESKKLPIPLLNIFAGSSSYTAGSTFIVAE
+SRPGVRVPEMVTDTGPEKPPEDM----------------ESVGAAISKSVALLHQGSIAP
+DQEGKSDTTFGCTV--------
+>N3167
+VLLGHATLRKEVDAELFVPFLKSLVLLLLPAVRMPLLVYMLLALLLGYCLSRPLRSFARV
+TADLGANHYGLVVEWLLDGIRILGKSMDPANEDTEPQKAKVAHGLLHNVAHELLEMVTGP
+LSYEKKAHTERKANTHGFLEKCRTGGRG---------DCARLAKNSKLSQDNETVD-GSL
+LVGELAEPSDLTTVGGKKDAIEFPNPSPIPGAV---PVVLLNVLATTGNYTPGPKITVAM
+ARDGKRTLITVADTGPG-----------------TARAGQCTGIAIIKSVSFLHGTSFTR
+ERLAGGDTTFGEGKRV------
+>N2822
+------------------------------------------------------------
+--------------------RKLAKELDPLAETYEHTKPRVKAGLLGAVDLAPRSPATGI
+LSYATRIHAQLVENVRDYLQAIRRKGQQLNQLLNEFLDKSR----SKLTNETEPVDLKTL
+LITGFKLKSI-----TAQASFELPPPPPAVGIGPQLP-ALLNEVALADSYTPGFKITVPI
+GRDAEKVVVLVTDTQGG-----------------TCRGKDSAGLAICRSVIILHKGSISS
+PHQSDGDTTLSIRHIYDAD---
+>N15
+------------------------------------------------------------
+--------------------RILAKELEPKEEPNEAPKPRVGAAVLVNVNRNLRSVFTGI
+LTYAKCIHAELKDNDRDYLEAVRKN---LLQLLSREFDPSRL-------QDNDPIELKEL
+LLGALGLLTRQSSMRGHQREYEVPNPPTMASEA---SLELLNVVGPAGAYTPGGKIIVHI
+GRDGDRVVSLVEDTPPG---------------LGATHGRHDVGH---KSSVILHKGSIAP
+AHQAGGDTTFTVTH--------
+>N4554
+------------------------------------------------------------
+----------------------MASGMKNVADRLEDGAPRIAGELAAAPSPELRMTVAGV
+LGYSELLD----NVGRDYLEGNMTDASRLKRLINALLEQSRIAGGGKIMLEKEPVDLQRL
+LFGVVALLS---------CTFDLPERPPVMGASTRLRAALLNVLSTAIKYT-GAPIIETT
+-YNGDRIIICVEDEPRAIPPAQLDRA-----RKGGSVSHSQIGLAIDRTTCHLHGGTIYH
+ESEY---TCSAGAPTW------
+>N1267
+------------------------------------------------------------
+---------------------------------LEQNAQRISGELAASVSQAMRAAMAGV
+LGYAELLDAQQKNVEREYLEAKMGSARQLQRLITDLVEQNRLDGGGK--LDKEKVDLQNE
+LTSLISVLRDLSEEAGTEVSGDLP--------GTRLRIGLLNLLSSSLKYT-GGNITVSK
+KH-GDWIVIPVEDEGN-YPPENMERVFESFCKRGNSDSHSTLGLAIKKKVVGLHGGTILH
+QDET------------------
+>N3968
+------------------------------------------------------------
+---------------------------------------RIQLELAASVSQTLRVAVGGV
+LGYSELLDVHQPNVAKRYEEAHMTSAHALLRLITDLLSQ---NGEGKIMLDQEPVDVPDL
+LTNLVS---------NRQQQNDLPESPPAIGAATPIRTGLLNALSLAIKYTP-GSIKVSV
+RNAGDWIVVAVEDEGNG--PENLNRVGASFYRKSGTTAQSGLEMAIKKTVVDLHGGTILH
+EQEA---TCTAGAATF------
+>N4341
+-------LAVALDLGLLIRYLRESLLLMLLGLYLLLLLPILLQLLLGVSLILTVAHLEKP
+EDHCAAGNLRDVQGKVPDSLPILAQKLKAIEDR--DNEPRVLGELAASVSKGLRVGVAGV
+LGYSELLDVQQFNPSKDYLDSQRSEARSLGRLIVDLLEQTRLPGNSKA---IAAVSLQPA
+LAALVLVLRKL---------NDLPQRGPVLGAGSGLRTNLLNLCNIGVKYTT-GKIAVSH
+KGDGDWLIVAVEDEGN-CPPEELKHV----YPKGGNKKETALTAAIKKTVCNLHGGTILH
+EQEA---TCFTNPSTY------
+>N1673
+-------------------------------------LPLLLNLQLSIGTIKNVSHLATA
+SVHILASHLRAVHGHIQQPLRILASTHKHMKDIVDSNPPRTQGVLATRTSRGLKVGTGSV
+LGYSRGRDV----NAKQYLQSAKTGSRELPRLITDLLEQAKLCGTDKQMLEKDPVDLRNA
+LYVLVLIHWIPT------SEDDLPQLPPPLGAAARLRTAQLNCLSIAAKYAPGG-ITVNL
+RHDGDWSAIVVSDEG-GCPPKKLDRVIDSFS----EGHRKPLTLIIAKGVINLHPGTIMN
+NPGP---TCFGGATVYAAAAEK
+>N2378
+------------------------------------------------------------
+----------------------------------ESNPPRTGDVLAKSVSHTLKVGSASV
+LGYTIKGDV----DANQYLDKAKSLAKQLKRLITDLLEEAKLCGTDKEMLEEDLVELRGA
+LFPVCLIMWIPTEEARFQSEDALPQLPPP--AAARLRTAQLNGLSSAAKYATGA-ITVSL
+RHDSDWSPIIVSDDGS-CPPEKLDRVVKSLS----EGHRKTLSLIIAKGVVNLHHGTIVS
+---PSGDTCFGEAAVWAAATGK
+>N1020
+------------------------------------------------------------
+--KMLASHLRTVHGRTQQPLRILASTHKHMEDIVESNPPRTGGLLPASVSQTLKVGKASV
+LGYTHKGDV----NANQYLESGKSSEKQLKRLITDLLEEAKLCGTDKEMLDQDVVELREA
+LFANVLIMWIPTEDSSFQNEDDLPQLPPA--AAARLRTCQLNCLSIAAKYATGGTI-VSL
+RHDGDWSPIIVSDDGS-CPPEKLDRVVRSFS----EGHKKPLTLIIAKGVVNLHPGTIVS
+---PSGDTCFSEAAVWTAAAGK
+>N1459
+------------------------------------------------------------
+--------------------------------LKEDNRPRVQGKFAASATQSLSVGTAGT
+PGYSELLDVQQENAAKQYLQAAKNGKRQLPRLITNLLEQ--LKGMDKAMLEKTPVDLSEA
+LFALVLVL---------QAEKDLPKAPPIIGAATRLRTGLVNFLGIAVKYTGGG-ITVSL
+RHDGDWVVVVVNDEGH-YPPQNLDRVAASFF----ENSRKALTFAIKKTIISLHGGTILH
+EQEA---TCFGSAAPFAASAG-
+>N2641
+------------------------------------------------------------
+--------------------------------LLENNSPRSQGKLAASVSQSLRVGTAAT
+LGYSDLLDVQQESAAQQYLQTAKVGAKPVRRLITDLLEQ--LKGMDKAMLDKEPVDLSDA
+LFALVLVL---------QEEKDLPKIPPIIGAATRLRTGLLNLLGIAGKYTAGG-ITVSL
+RHEGDWVNVTVNDEGH-YPPQNLDRVMASFF----EGVRKPLTLAIKKTTINLHGGTILH
+---ALADTCFGSAAAFAAAAG-
+>N4681
+-----------------------------------LLFPLLLQLLLGHKLLMPLSRTVKA
+EQPIPTTELRLTDELLIDHLQKLEEKLDQIAEVPVNAPPRARNEFLPEVGAEMKTKFTKI
+LGYA--ADRSLGDSEDAYLGHLSVSQNELMILSIELLNGSAVDGAALL-LEDPEVEMAKV
+LASPVGVVKLLSDQKGVDLVINNPSTMPAVGDPTALRHLLLNKITNEATYTPGGHIPIAF
+ARDADRVVIRQDDAKKG-------------------------------------------
+----------------------
+>N3183
+TLLNLKILTFSLDLELLSSVAHELNTLLLLDALVELLFGLLLALLLGSILVQQLERLQKS
+AERIAGGHHKEVVHKGPDRLREK-DSTNQMAENPDYVRPSVKSEFLPAVTKELRAALPGL
+LGYGKDLDDELSEDLREYLVSLRKPAQQLTRLTFDILDDFKLKG-----LEQNNADLQFV
+LKKLVALIGPLLEDHGFVGDM-MPQAQTGIGEALNLKQVLLNALSKLSRYIPGHKITVRA
+RRDG----IPVEDT-----AETLDAI----------GRNQSLGLAITKRVGDLHAGAITI
+EEDPGS----------------
+>N4581
+------------------------------------------------------------
+-----------VLETSPEQLRALPECLNQFHERLEYNHPRGEDEFLAEVTHRFWAVRTSI
+LGYGETPKREVFNDKKKYLERTAPVAESLLSMIN-LLNLARVHTGDKLSMDSKPIDLQKI
+LLDGVDLVTVIGEEKGGEKPKDLPKSNQVIGEATALVQVLVNLLSSAIKYIPGAVISVSV
+VRDGKGVVVDVGDTGAGFPPEDLPRTF----HVAYSSGKGILGTAALKREADINGGVITV
+EDTPQGDTTLEEGQPEEK----
+>N3537
+------------------------------------------------------------
+------------------------------HERKENNEPPGHGEFLANVTHLMRSTITSI
+LGYGAIAKHEI-DGGENYISGYSSAGANLLRLIDNLLKHGRVQFGTRLSMEEQPKDTHQF
+LNDLEDDVMCIGEEKGMEQSLDLPDVGQLTGEAKHLNQKLLNLRASAIDYTSGGGVASPV
+KRDAECLLVGVE-----YPPEGLERIYRKFYKVAFGKGRASLASAIVKRGLQLQGGVITV
+DQAGGEETALLGKKVRPKAPP-
+>N3170
+--------VVEIDLELLNALMHSADVSDLLGDKLLLLQTLLLPFLLGRKLIKSLERIVKS
+AERVGSAHSRHVVQSAPDQLRELPAS----HQRSENAQPRGDGLFLANVAHSFWASSTNI
+LGYGKSLKRSVFNESHNYLADGSNPGSSLARLINDLLNFDRVHQEAKVSMESHPVDLQEL
+LVELVEGVKCIGDEKGTERPLELPEGNQMIGEATHLNQVLLNLLADAIKYTVGAEVPVTV
+TRDGDCLLIAVE------------------------------------------------
+----------------------
+>N1349
+------------------------------------------------------------
+--------------------------------------------FLANVIHDAWAAGTNI
+LGYTIVLKREVYNEEHNYLAAATAPGKNLARLIHDLLHFDRIHQFAKLSMQSQPVDLQNL
+LVDLIEGIKCIGEEKGTEGPLDLPEGNGTIGEATHLNRVLLHLLAGTIKYTPGSDVRVSV
+RRDGDCLLIAVQDSGAHYPPEELSRIF-KFYHVIYNAHSGLIGAAILKRGDQLHAGVVTV
+LQSSG----LGKKEVGPK----
+>N2089
+------------------------------------------------------------
+----------------------------QFQIQAENSEPRGNGQFLGQVVHNFWGTTTNI
+LGYGAILKRKVFNAPHNYLAQNGGDGASLDRLIDEELNFDRTHQNAKAGREAQPVDLQAL
+LSDAVKAIKCIGESSGAENDLDLPAGNQQFGEPFQLSEVLVNLMGATVKYTCGTEVAVSV
+RRDADCLLINVEDGEAMYPPEGLDRIYSKFYHVTYDKPTGVIGTAILKKGDPLHGGLITP
+MQTSN----LAKRDNQGKADP-
+>N1410
+------------------------ELLDNLGCALLLLLTLLLPFLLARKLVRSLDRLVRP
+VERIGRGHLRSVVEPAPDQLRELPASLNQFHEQNENAQPRGQGEFLANVAHNFWAVDTNI
+LGYGTILKREVFNESHDYLAEDSGEGQSLARLINDLLNYDRVHQNAKLGMDTQPVDRQGL
+LVDLVDGIKCIGSDKGAAPPLDLPESNQKVGEGTHLFQVLLNLLASTIKYTPGSEVSVSV
+RRDGDCLLIAVEDGGAAYPPEGLERIFDKFYHVSYIKPANVVGTAIVKRGDQLHEG--TT
+QQTSGGDTTLGN----------
+>N508
+------------------------------------------------------------
+--------------------------------------------FLANVAHNFWAVSTNI
+LGYGTILKREVFNESHDYLAEDSGEGQSLARLINDLLNFDRVHQNAKLGMETQPVDLQGL
+LVDLVDGIKCIGSDKGAAPPLDLPESNQKIGEATHLFQVLLNLLASTIKYTPGTEVPVSV
+RRDGDCLLIAVEDGGSAYPPEGLERIFDKFYHVSYIKPANVVGTAIVKRGDQLHGG--TT
+QQTSGGDTTLGN----------
+>N2659
+-------------LILLLAYLRSLEVLELAGGQLYLFYLLKLPFLLGKKLADALKPLVRH
+DEQEGEGHLRFILEREPDRLREVPQCLNQFHERMSTNEPRTSGEFLAEKTQSFWETRTSN
+LGYGALNKRDLFNDRASYLDRSSGGSSSLVNLFKSILNKGKAHTAAKLAMEFHPVNLQAL
+LLGLNDLVKAIVETKGAEHPAELPTGHQATGDAKNLGHVLMNLLYNDLKYTPGGAIAVTC
+RRDHDS--LEVGDTGDSNPPEGLQPIFSSFYHVTFNRAKGTLGAAIFKPPAELHGGVITV
+EHKPGGDTTLATAKVNPKAACL
+>N3669
+------------------------------------------------------------
+---------------------------------LAKNEPRDEFEFLAEVAHAFWPTDTRL
+LGYGTVLKREAFNERVRNLERTSASSTSLAALINGLLTASRVNTTAKTAMDSHPVNLQEL
+LLDQKALAKSINEETAKEMPMELPEGHQAVGQATKLGQVLMNLLYGDIKYTPGSAIKVSV
+RRSEDSIVLAVE------APQSLQRILVSYYHAAYNRATGTLGATISGRPPQLHGGVITV
+EESPGGDNTLLPKNVK------
+>N2906
+------------------------------------------------------------
+--------------------RETCNVLNQIHESLTKNERRPNGEFLADVTHTFWATFTAI
+LGYGGSGKRSVFDIKRSYLESKPGGGEKLMSLINALFKFPRVHTKAKLAMAPHAVNLQKL
+LLDVVQLVKPITEEKGAEKPLELPQGFEKVGGAEKLGQILCNLNVDTIKYTPGLAITVSV
+RRDADSIVAGIEDAGEGKRPESVQRVY-AYYHVSYSRAKGTLGTAILKRPAELHAGVITV
+QESPGGETTLHVKTAAP-----
+>N4522
+------------------------------------------------------------
+-------------------------------------------EFLVEVAHTFWSTPTSR
+LGYGALAKREVFDFKRSNLERVSTGGSSLVSLMNDALKFGRGPTTAKLAMEPHPVNLQDL
+LLNIIDLVRKIIEEKSAEQPLELPEGHQAVGEPDQLGQVLLNLLADALKYNPGAVITVAV
+RRDNDAVVLKVEDTGAGNPPEALQPIFVSFYHVAYSRARGILGASILKKSGQLHGGVITA
+EESPGGDTTLASKEAGPMAGAV
+>N286
+--------------------LPDKDILILLPALLLLYLNLLLKLLFGRKLVRPLRKAVRD
+PQRIADGHPRYALAKIPDTLPELPGLLHQIIAHLENKATKITQDYLANLEHSYPSTATGI
+IGYGEVFKRQLFDGRRVYLERVSGPALPLLRVANNLVNETRLEGGRP-SLGADVVELQNV
+LLDLVVVLRVLGEAQNAEWVAGLPAYSPDVGPRETLRQVLINKFCATREYTPNIRIHYAH
+ERDGARVAILVE------APEGLESIF-----LGYGAHATTLGIA--NIKTALHGGTVTV
+QQKSASDTTFAQSQVFTPYAAV
+>N2598
+------------------------------------------------------------
+-----------------------------------SEEPDATGDILGNSPHEFRVVKTGI
+LGYDETGKHEIFENRRSYLEV----DHQLLRMISELLTATRLEAIGKLGLDFTAVDSQAL
+LEPLTVLLRQLAEQKGVEWAFELPPKAREKGGPTLLRDMLMNLMANAVKYTPGIKIEVSL
+RKDSEQVMVGVHDT--GLPPEDLSNVFEN-----------GLGTAINSRIEETHGGKI--
+----------------------
+>N4350
+KSLKADVLLAGPDFDLLPPALRGPELFIALGPLIILLLATLMCLLLERFLVGQLRRLVKG
+IEKTAAGNARWVIDKA---LRDLAEVLDNMTERLDDKDARTGAQELIYVSQDVRTNITAI
+FGYAQFVDREMLENGRKYLEKLSGKTEHLSRMINIIIDPQRLSVGTR-ALDEEPVDLTQL
+LQEMVSLFKPLAADKAIEKAVDLPQHDKVVGEGFKLDQILTNLVTQALKLTPEHPIIVNV
+RKDGDRMIVDKNDTGVG------PRVFTIFYKKEFAKEMTSLGSAILRRRVALQGGAIAI
+E-YSGDDCTITMKEILAPAAA-
+>N4563
+------------------------------------------------------------
+-------------------------------ERYQTGDVKVDNAILAKVTHEFDTIGSGI
+LNYGQSINKELAKPPSNYLEMPDYCADQLVRSIHVLLIRTRLEKGV-LAMEADPMEQQPL
+LLQLVQLLRALAQEDGVELKLDLANNTPALDQPTALRQILMNLYNNSAIYTHGDEINVSI
+RRDGARLVVEVTNTGAGLPPEALDRIYSSFYRTEWSRSRGDLESAIDKLANELLSGTITA
+PDEPGNQATFTCKKLFAKAAEV
+>N4237
+------------------------------------------------------------
+-----------VLEIVPDALRETSEGVNMRCEQIEEAVPRGE---LGKVSHYLRVGTTGL
+LAYSENLDKEAADQAQAYLAECKIAAGELVHMITNLLDSNRLRQGA-LLLESVPVDLVCL
+LTHQVKPLRFLTEPMGPEVELELPEPKPVVSKPTFLQQKLLNVMDGALQYTPGTAIAGAI
+IRDSTRVTLTAQDTGASLAPEELS-IYESFYQTGFPQTPSYMGNAVSKKVADLHGGLVT-
+----GGHTTFELKANP------
+>N3563
+------------------------------------------------------------
+-----------------------------------GVEGRDISTFLANVGHQLSKGCTTI
+LSYNELLNVSLFDARLLYIARLRTAKKELPRMIDELDEVARLDTGAPLVLESVHVDMLAM
+LKDVVLLLQALEGAKGVETKMNLPEPTPTSGKATGLHQPLLGLEGDGLMFTPGGTIKGTL
+TRDGERTALFVQDTGL-LGPDNLEKVLASRLRHSYARSNPFLAKALSPHVTNLHEGTVTT
+----------------------
+>N1292
+------------------------------------------------------------
+------------------------------------------AEFLANVGQTLRAASTAI
+MVYGEPLKKDIYDEKRNYLTRMRKGEEELSRMIHELLDFCRLKTTAPSSLESVPVDMVVR
+LIEEVKLIRPLAEEKAVEREMGLPDRTPVIEKATKLDQVYLNDNPRPLLYTPGGPIAGSN
+RNDGTRVVLCLGDTGLDMPPQELE-VVSSFYPAGYSRAKSFVGVAVAKRVVDLHEGTLTA
+EEQ-----TFDIAAVLKAAGAG
+>N1218
+------------------------------------------------------------
+----------------------------QRAEFLEDGGPRVAGEFLGKVSHQTRAARTGI
+LNYGQLWNKELFEEPKAYLARKRIEAEELLRMLNELLESGRLGAGQGIERENEAVS--KL
+LTNLIEVLCSLAGDKGYEKELDLAAPQAETGQHAPLRGMLFNNFRAITMYTPSGRTSISH
+PRDGDRAIKGVADTGLGKPADEIEKVVDTFYPKGFG-HDVNIGMAIVWRIIGVHSGTITV
+EQEVPGDTTFTDTH--------