changeset 0:3cec538aab33 draft

Uploaded
author joachim-jacob
date Thu, 30 May 2013 07:13:55 -0400
parents
children da4426cac227
files README blat_indices.loc.sample blat_wrapper.pl blat_wrapper.xml test-data/databasetest1.txt test-data/input83.fas test-data/outputtest1.txt tool_data_table_conf.xml.sample tool_dependencies.xml
diffstat 9 files changed, 1309 insertions(+), 0 deletions(-) [+]
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/README	Thu May 30 07:13:55 2013 -0400
@@ -0,0 +1,20 @@
+BLAT Galaxy wrapper - 1.0.0
+=============================
+<joachim.jacob@vib.be>
+
+SUMMARY
+-------
+BLAT is the BLAST-Like Alignment Tool and is designed to 
+quickly find sequences of 95% and greater similarity 
+of length 25 bases or more.
+	  
+REQUIREMENTS AND INSTALLATION
+-----------------------------
+Install this tool in your Galaxy via the Toolshed
+
+   ) Third party code installation
+	BLAT binary will be installed automatically  
+
+DETAILS AND ISSUES
+------------------
+   ) First release
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/blat_indices.loc.sample	Thu May 30 07:13:55 2013 -0400
@@ -0,0 +1,7 @@
+# BLAT requires the fasta file of the reference genome
+#
+#<name>	<dbkey>	<description>	<absolute path>
+# e.g.
+#hg19_chr21	hg19	Human chrom 21 bld 37 (hg19)	/mnt/genomes/hg19_chrom21/fasta/human_chr21_hg19_NT_011515.12.fa
+
+
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/blat_wrapper.pl	Thu May 30 07:13:55 2013 -0400
@@ -0,0 +1,167 @@
+#!/usr/bin/perl
+# blat_wrapper.pl
+# Joachim Jacob - joachim.jacob@gmail.com - 2013
+
+use strict;
+use File::Temp 'tempdir';
+use File::Copy qw(move);
+use File::Basename;
+use File::Spec qw(join);
+use Log::Log4perl qw(:easy);
+
+# ---------------------- Prepping Logging -----------------------------#
+########################################################################
+# Log levels: 			$DEBUG	$INFO	$WARN	$ERROR	$FATAL
+# ConversionPattern:	%d %-5p %F{1} [%M] (line %L): %m%n%n
+my $log_conf = q/ 
+    log4perl.category = ERROR, Screen 
+    log4perl.appender.Screen.stderr=1
+    log4perl.appender.Screen.layout=Log::Log4perl::Layout::PatternLayout
+    log4perl.appender.Screen.layout.ConversionPattern = %d %-5p %m%n
+    log4perl.appender.Screen        = Log::Log4perl::Appender::Screen 
+/;
+
+Log::Log4perl::init( \$log_conf );   # category level is ERROR and Screen.stderr=1: INFO and DEBUG calls stay silent, errors go to STDERR
+my $logger = get_logger();           # logger handle; the statements below log through the :easy functions (INFO, DEBUG, ERROR)
+
+# ----------------- Getting parameters file ---------------------------#
+########################################################################
+my ($configfile) = @ARGV;   # path of the parameter file; each useful line reads "key==value"
+my (%para);
+open(my $config_fh, '<', $configfile) or die "Cannot open parameter file '$configfile': $!\n";
+while (my $line = <$config_fh>) {
+	if ($line =~ /(\S+)==(.+)$/){ $para{ $1 } = $2 ; }   # lines without "==" are skipped
+}
+close($config_fh);
+
+=Excerpt Config parameters
+			## first we pass some galaxy environment variables
+			galtemp==${__new_file_path__}
+			
+			## first we pass some galaxy environment variables
+			galtemp==${__new_file_path__}
+			
+			#if $refGenomeSource.genomeSource == "indexed"
+				referencepath==${refGenomeSource.index.fields.path}
+				range=$refGenomeSource.range
+			#else
+				referencepath==${refGenomeSource.ownFile}
+			#end if
+
+			input==$input
+			output==$output
+			q==$q
+			t==$t
+
+			advanced_params.use==$advanced_params.use
+			#if $advanced_params.use=="yes"
+				tileSize==$advanced_params.tileSize
+				stepSize==$advanced_params.stepSize
+				oneOff==$advanced_params.oneOff
+				minMatch==$advanced_params.minMatch
+				minScore==$advanced_params.minScore
+				maxGap==$advanced_params.maxGap
+				mask==$advanced_params.mask
+				qMask==$advanced_params.qMask
+				repeats==$advanced_params.repeats
+				trimT==$advanced_params.trimT
+				noTrimA==$advanced_params.noTrimA
+				fine==$advanced_params.fine
+				maxIntron==$advanced_params.maxIntron
+				extendThroughN==$advanced_params.extendThroughN
+			#end if
+=cut
+
+for my $name (keys %para){
+	INFO "$name\tset to\t$para{$name}";
+}
+
+
+# ---------------------- Prepping temp dir ----------------------------#
+########################################################################
+# within the temporary directory of Galaxy, we create a temporary dir
+
+my $galtemp = $para{'galtemp'};
+delete($para{'galtemp'});
+DEBUG "\nReceived Galaxy temporary directory:\n$galtemp";
+
+# tempdir() is a plain function, not a class method; it creates the directory
+# itself (so no extra mkdir is needed) and CLEANUP => 1 removes it at exit.
+my $tempdir = tempdir('tmpXXXXX', DIR => $galtemp, CLEANUP => 1);
+INFO "\nTemporary directory:\n$tempdir";
+
+
+# -------------------- Assembling command  ----------------------------#                                                             
+########################################################################                                                             
+my $command = "blat ";   # this will ultimately be executed
+$command .= " $para{'referencepath'}";     
+if ( $para{'range'} ) { 
+	## range must look like name:start-end (e.g. chr1:250000-260000); anything else is rejected before it reaches the shell
+	if ($para{'range'} !~ /\A[\w.\-]+:\d+-\d+\z/){
+		ERROR "Range has been wrongly formatted: $para{'range'}";
+	} else {
+		$command .= ":$para{'range'}";
+	}
+} 
+                              
+# The query file follows the database argument on the blat command line.
+$command .=  " $para{'input'}";
+delete @para{ qw(referencepath range input) };   # consumed, drop them from %para
+
+# Output format is fixed to blast9; q and t carry the query and database types.
+$command .= " -out=blast9 -q=$para{'q'}  -t=$para{'t'}";
+delete @para{ qw(q t) };
+
+# The output path is set aside here and only appended after all options,
+# further down.
+my $output = " " . delete($para{'output'});
+
+if ( $para{'advanced_params.use'} eq "yes" ){
+	delete($para{'advanced_params.use'});
+	# options that always carry a value
+	$command .= " 	-minScore=$para{'minScore'} -maxGap=$para{'maxGap'} -mask=$para{'mask'} -qMask=$para{'qMask'} -oneOff=$para{'oneOff'}  -minMatch=$para{'minMatch'} -tileSize=$para{'tileSize'} 	-stepSize=$para{'stepSize'} -maxIntron=$para{'maxIntron'} ";
+	# -repeats is passed the qMask value
+	$command .= " -repeats=$para{'qMask'}" if $para{'repeats'} eq 'yes';
+	# bare switches, added in this order when their parameter equals 'yes'
+	my @switches = (
+		'extendThroughN',
+		'fine',
+		'trimT',
+		'noTrimA',
+	);
+	for my $switch (@switches) {
+		next unless $para{$switch} eq 'yes';
+		$command .= " -$switch";
+	}
+}
+
+$command .= " $output";
+
+
+# --------------------- Executing command  ----------------------------#
+########################################################################
+# the assembled command line is executed from inside the temporary directory
+run_process($command, "BLAT alignment", $tempdir);
+
+# --------------------------- Exiting  --------------------------------#
+########################################################################
+exit 0;
+
+
+### 					      Subroutines 						     ###
+########################################################################
+sub run_process {
+	# Runs $command through the shell from inside $tempdir; $name labels the step in messages.
+	# Dies with the reason (launch error, signal or exit code) when the command does not succeed.
+	my ($command, $name, $tempdir)= @_;
+	INFO "\nProcess to launch:\n $command\n";
+	my $status = system("cd $tempdir && $command 2>/dev/null");   # "&&": never run the command if the cd fails
+	if ($status == -1) {
+		die "$name failed to execute: $!\nCommand: $command";
+	} elsif ($status & 127) {
+		die sprintf("%s died with signal %d, %s coredump\nCommand: %s", $name, ($status & 127), ($status & 128) ? 'with' : 'without', $command);
+	} elsif ($status != 0) { die "$name failed\nExit status " . ($status >> 8) . "\nCommand: $command"; }
+	print "$name executed successfully\n";
+}
+
+
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/blat_wrapper.xml	Thu May 30 07:13:55 2013 -0400
@@ -0,0 +1,179 @@
+<tool id="blat" name="Align sequences with BLAT" version="1.0.0">
+    <!-- Additional info: wrapper compatible with versions ..... -->
+    <description>
+		to a reference genome
+    </description>
+    
+    <version_command/>
+    
+    <requirements>
+        <requirement type="package" version="1.0.0">blat</requirement>
+    </requirements>
+    
+    <command interpreter="perl">
+        ## it is recommended that you write a wrapper for your tool
+        ## and pass all parameters to that tool, which parses them.
+        blat_wrapper.pl $configfile
+
+    </command> 
+   
+    <inputs>
+        <param format="fasta" name="input" type="data" label="Query fasta sequences" />
+        <param name="q" type="select" label="Process the query as">
+			<option value="dna" selected="True">DNA</option>
+			<option value="rna">RNA</option>
+			<option value="prot">Protein</option>
+			<option value="dnax">DNA sequence translated in six frames to protein</option>
+			<option value="rnax">RNA sequence translated in six frames to protein</option>
+        </param>  
+        <conditional name="refGenomeSource">
+          <param name="genomeSource" type="select" label="Will you select a sequence database from your history or use a built-in index?" help="Built-ins were indexed using default options">
+            <option value="indexed">Use a built-in index</option>
+            <option value="history" selected="True">Use one from the history</option>
+          </param>
+          <when value="indexed">
+            <param name="index" type="select" label="Select a reference genome" help="If your genome of interest is not listed, contact the Galaxy team">
+              <options from_data_table="twobit.loc">
+                <filter type="sort_by" column="1"/>
+                <validator type="no_options" message="No indexes are available for the selected input dataset"/>
+              </options>
+            </param>
+            <!-- optional sub-range of the selected index; a sibling of "index", not a child of it -->
+            <param name="range" type="text" size="25" value="" label="Restrict the search space to this genomic range in the sequence database" help="Format = 'chr1:250000-260000' (i.e. name:startposition-endposition)" />
+          </when>
+          <when value="history">
+            <param name="ownFile" type="data" format="fasta" metadata_name="dbkey" label="Select the sequence database" />
+          </when>  <!-- history -->
+        </conditional>  <!-- refGenomeSource -->
+      
+        <param name="t" type="select" label="Process the sequence database as">
+			<option value="dna" selected="True">DNA</option>
+			<option value="prot">Protein</option>
+			<option value="dnax">DNA sequence translated in six frames to protein</option>
+        </param>
+        
+        <conditional name="advanced_params">
+			<param name="use" type="select" label="Show advanced parameters">
+				<option value="no" selected="True">No</option>
+				<option value="yes">Yes</option>
+			</param>
+			<when value="no" />
+			<when value="yes" >
+				<param name="tileSize" type="text" size="3" value="11" label="size of match that triggers an alignment" help="Usually between 8 and 12. Default is 11 for DNA and 5 for protein." />
+				<param name="stepSize" type="text" size="3" value="11" label="spacing between tiles" />
+				<param name="oneOff" type="boolean" truevalue="1" falsevalue="0" checked="False" label="Allowing one mismatch in tile?" />
+				<param name="minMatch" type="select" label="number of tile matches" >
+					<option value="1">1 (for proteins)</option>
+					<option value="2" selected="True">2</option>
+					<option value="3">3</option>
+					<option value="4">4</option>
+				</param>
+				<param name="minScore" type="text" size="3" value="30" label="minimum score" help="This is the matches minus the mismatches minus some sort of gap penalty. Default is 30" />
+				<param name="maxGap" type="select" label="size of maximum gap between tiles in a clump" help=" Usually set from 0 to 3.  Default is 2. Only relevant for minMatch > 1">
+					<option value="0">0</option>
+					<option value="1">1</option>
+					<option value="2" selected="True">2</option>
+					<option value="3">3</option>
+				</param>
+				<param name="mask" type="select" label="Mask out repeats in reference sequence" help="Alignments won't be started in masked region but may extend through it in nucleotide searches. Masked areas are ignored entirely in protein or translated searches.">
+					<option value="lower">mask out lower cased sequence</option>
+					<option value="upper">mask out upper cased sequence</option>
+				</param>
+				<param name="qMask" type="select" label="Mask out repeats in query sequence" help="Alignments won't be started in masked region but may extend through it in nucleotide searches. Masked areas are ignored entirely in protein or translated searches.">
+					<option value="lower">mask out lower cased sequence</option>
+					<option value="upper">mask out upper cased sequence</option>
+				</param>
+				<param name="repeats" type="boolean" truevalue="yes" falsevalue="no" checked="False" label="Report matches in repeats separately?" />
+				<param name="trimT" type="boolean" truevalue="yes" falsevalue="no" checked="False" label="Trim leading poly-T" />
+				<param name="noTrimA" type="boolean" truevalue="no" falsevalue="yes" checked="True" label="Trim trailing poly-A" />
+				<param name="fine" type="boolean" truevalue="yes" falsevalue="no" checked="False" label="For high quality mRNAs look harder for small initial and terminal exons. Not recommended for ESTs" />
+				<param name="maxIntron" type="text" size="10" value="750000" label="Maximum intron size" />
+				<param name="extendThroughN" type="boolean" truevalue="yes" falsevalue="no" checked="False" label="Extend alignment through large blocks of N's? Not recommended for ESTs" />
+			</when>
+        </conditional>
+    </inputs>
+
+    <outputs>
+        <data format="tabular" name="output" label="${tool.name} on ${on_string}: alignments"/>
+    </outputs>
+
+    <configfiles>
+		<!-- this config file collects all parameter settings, one "key==value" pair per line -->
+		<configfile name="configfile">
+			## first we pass some galaxy environment variables
+			galtemp==${__new_file_path__}
+			
+			#if $refGenomeSource.genomeSource == "indexed"
+				referencepath==${refGenomeSource.index.fields.path}
+				range==$refGenomeSource.range
+			#else
+				referencepath==${refGenomeSource.ownFile}
+			#end if
+
+			input==$input
+			output==$output
+			q==$q
+			t==$t
+
+			advanced_params.use==$advanced_params.use
+			#if $advanced_params.use=="yes"
+				tileSize==$advanced_params.tileSize
+				stepSize==$advanced_params.stepSize
+				oneOff==$advanced_params.oneOff
+				minMatch==$advanced_params.minMatch
+				minScore==$advanced_params.minScore
+				maxGap==$advanced_params.maxGap
+				mask==$advanced_params.mask
+				qMask==$advanced_params.qMask
+				repeats==$advanced_params.repeats
+				trimT==$advanced_params.trimT
+				noTrimA==$advanced_params.noTrimA
+				fine==$advanced_params.fine
+				maxIntron==$advanced_params.maxIntron
+				extendThroughN==$advanced_params.extendThroughN
+			#end if
+
+		</configfile>
+	</configfiles> 
+
+	<tests>
+		<test>
+          <param name="input" value="input83.fas" />
+          <param name="refGenomeSource.genomeSource" value="history" />
+          <param name="refGenomeSource.ownFile" value="databasetest1.txt" />
+          <param name="q" value="dna" />
+          <param name="t" value="dna" />
+          <param name="advanced_params.use" value="yes" />
+          <param name="advanced_params.tileSize" value="11" />
+          <param name="advanced_params.stepSize" value="11" />
+          <param name="advanced_params.oneOff" value="0" />
+          <param name="advanced_params.minMatch" value="2" />
+          <param name="advanced_params.minScore" value="30" />
+          <param name="advanced_params.maxGap" value="2" />
+          <param name="advanced_params.mask" value="lower" />
+          <param name="advanced_params.qMask" value="lower" />
+          <param name="advanced_params.repeats" value="no" />
+          <param name="advanced_params.trimT" value="no" />
+          <param name="advanced_params.noTrimA" value="yes" />
+          <param name="advanced_params.fine" value="no" />
+          <param name="advanced_params.maxIntron" value="750000" />
+          <param name="advanced_params.extendThroughN" value="no" />
+          <output name="output" file="outputtest1.txt" lines_diff="2"/>     
+        </test>
+    </tests>
+
+    <help>
+**BLAT Overview**
+
+BLAT_ is an alignment tool like BLAST, but it is structured differently. 
+On DNA, Blat works by keeping an index of an entire genome in memory. 
+Thus, the target database of BLAT is not a set of GenBank sequences, but 
+instead an index derived from the assembly of the entire genome. By 
+default, the index consists of all non-overlapping 11-mers except for 
+those heavily involved in repeats.
+
+.. _BLAT: http://genome.ucsc.edu/FAQ/FAQblat.html
+
+    </help>
+</tool>
+
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/databasetest1.txt	Thu May 30 07:13:55 2013 -0400
@@ -0,0 +1,772 @@
+>ENA|CAKG01028373|CAKG01028373.1 Drosophila suzukii WGS project CAGK00000000 data, contig drspszk_2131478
+AAAAATTTTTATATTTTATTTTTATGAAAATAGTTCTCCCTCTCATGTTAATTGATAAGT
+ACACTTTTTAAGTACACGTTTACATAAGTAAAAACAATTTCCTGAGAAATAGTTTTATCG
+ATCGCACCTATACGGGCGTTTTACATAAATCTCTTTTGGGCGAAACTCTGGGAAGAGTTT
+CCACCGAACTTAGCCCAAATAGATTGCTCTAAATCCACCGATAATGATATATTCATAGGT
+ACCGTTGACAAGAAACTTGGACAGTAAATTAAGCTCCGGAAACCCCAAATCCAATATAAT
+TACCTTCGTTATGAATGAGCTCCGACTTGGAGTTGGCCGATAAGGACCTGAAGAGGGCCG
+CCGAGTTGGGTCTGTAGGTGTCCAGCGAGGCAGACAGTTCCATCAGGGGCTTCATGATGC
+CCTTCAGGTGCTGCAGCTGCTCGCAGGCGAAGATCAGCCAGGAGCAGAACATCACGTCGC
+AGAGGTTGGAGTGGATCATCGAGAAGAGCACGTAGTAGATCTGAAAGGCGAAGCTGATCA
+TGTAGAACAGTCCGTGGCTGGCGTTCCAAGGGTAGAAGGACTTGATCGGCAGCCGCGGAA
+TCTCCACCGGAATGCTGGAGTTCGTTTCGTGGTCCACCACCATCTTGACGCTGTCCCCGA
+AGAAGGTGATCGTGGTCCAGGCGGTGGCCGAGGCCACGGTGGTCAGCATCACCAGGAAGA
+ACAGCTTCCTCATCTTGGCCAGGGCGATCGAGTGGTAGCGGGCATCTGATTCGGCGAACA
+GGGGGTGCGTGTTGACCTGGTTCCATATATTCAGGGTTCTGCAGAGATAGTTATTCTTAT
+TACTCCCAATCCCAAACGAAATTGCAGAATTGCCTAATTATTAATTTCCAACTACAATTA
+TATTCATTTTAAGATATAACCTAGAGCTATGCGGGATATTATGCCTTAACCAAGGGATTT
+TAACTTATATTAACAAAGTAACTGAGAGTCAAAATAACCTAAAGTAGGTTTTTCACAATC
+TTATTTAAAATGTATTTTTTTAATGTACCTCCCTTTTTCAAAGTATAAAATGCTCATTTG
+GGATACAAATTTTTGTGCCAGTTATTTTTTTACCTGTAGAAATTCTTCTGGTTGACGGCC
+AAGTAGATGAACTTGGTTATGCAGTGGGTGAAGAAGAGGGTGGTGATCGTGTTGCCCGAC
+AGCTCGTTCACCTCCTCGGCGTTGAGGGCCATGTTGACCAGGATGAAGGCGAACTGCATC
+AGCAGGAGTACCAGGTGCACCGAGGAGTAGACCTTCTTCATGAACGCACTGCCGCCCGTG
+AAGTTGTGCATGAACAGGCCCGAGTACTTCATCGCCCGTATATTGGGCATCAGGTCGGCC
+ACCAGGCCCGTATACTTGCTCGGCTGCATCGAGGTTGTCATCCTGCGAAAAATGGCTCGA
+CATAATTAATTGGGTTTCGCCAACATAATCAGCGATTATTGCCAGTGGATAAAGTGATGG
+GGGCGATGCGGAATCTTTTTCATATTCCGTCTGTGTGATTGGCTTTTGGTCTGTGTGCGA
+CCCAAAGAGGAAATCCTCTCCGAAAATGAATCGATTTCGCATGTTTTATTCATACTTGTA
+TAATGCATAATGCGGGGTTTTAATCGGTTGAATCGTTAGTGTCCGTTTAGCTTAAAGCCA
+GTATTTAATACTGAGATTGCGTTTTCTTGAATTGGTATGGCTAGGATGAATTTTTTTAAC
+AGAGTTTTCTTAGCTCAAAAAAGCCATTAAATGAAAATGCTTCAGTTAGCCCGACTAAGT
+TTTGATAAACTTGTAGTCTTCTTCATAAAAAAACAATTAAAGTTATTTTAAAATTTTAGG
+ATTGGAATAACACTTTTTTTGCAATTTGTACTTTACTCAAATTTAAAGAAAACAATTTAA
+TGTTTAATTTAATTTTAGATTTTAAATAACACTGTTTATAGAAAACTAAATTTTAATAAA
+TACAATTAAAAGTCGAAATGCTTTTAGATTTGGAAAAACAACCTGGATATAAATGGGTTT
+TTTTTTAATTTCTATGTATTTTTATATCGCCGTTAAAAATAGTAACACGAAGAAAATGTT
+TAATGTTTAGTAATTAAAAGGTTAGCACTGAGAGGTGTTGACTAATAAGTTGTAGAGCAG
+AAGTTTACCTTGCAATTGAGCCTTAAAAATTCAAATTTAATCGTTGTCTTGTAAACGGTT
+GTTAACTGAGTGCAAGCTAATGCACTTCTAGGCAAGCATTTCACTCACTGAGGCTATACC
+GGAATTATTTAAGATACAACGAGGGTTTTAAAACCGGGACCCAGTTAACCTGCCAGCAGG
+GCGTTGTCGACGTTAATGAAACGTGAAACCTGGAAGGTTAACGGGCTCTGCCGACAAGTG
+ATTGCTTCTTCTGTCGTCTGCCAGTACATAAGGACGTGTACTTTGAGGGCAGAGTTCCCA
+CGGCTGCAGCAAGGCCACGTTCAATCGGAGCCCTGAAACTTTCACTCCGACCCACACATG
+TTAATGAAAATATATGGCTGTGGGCCTAAAGCCGGCCTCGGAGTGCTTAAAAATTCAACT
+TTTAGCCACGTCCGTCCAAGATGGGTGCGTGGCAGACGCCGAATTCCCACAATTAAGTCG
+AACGCCCACGAACTTGCCGGCCGCCATGTCGCCGTCTCCAGGTCTAGGACTCAGGCCTGG
+GCCCTGGCCCTGTCCACGCGGCGTATGCGCAATGGGCAGCGCAGCACGGGATAGGGAAAC
+ACGCTCCTCTGGCTCCTCTGCGTGGCATCTGCGGTATCCGAACTTATGCAAATTTTAAAA
+GCATCGATTATTTTATTATGCCTGTTTGTATTTGTTGGCCCTAAGTGCCGCAGAGTCATG
+GGGAAGGGCATTCAGCCCCCAACTGCTGCCACGGAGCCTTCCCCGAATCGCTGACCCAAA
+AAATAACCCACATACCCATTTGCATGGAAATGTGTGCCCGGCCTGATGGATAGTTTGACT
+TTGTTCTTTTTTCGTTCTCAGTTCGAAAGCACCGAGGCTCAGTGGGCGCAGGAAGCCAAA
+TCGAACAGGAAATCCCCAGATATGGGGCAACAGAAGCTCTAAAGTAAGATGCGTTGCTTG
+CTAAAAGGACCTTTGAATTTGTGTTATCACCGGTACAATAACCCTTGCAACACTGTGCTT
+CAGCTCAAAAAATCATGCCAAAAAATCTGTAAAATATTTATAATCTAGATTACTAGCCGA
+ATAGATATAGTCTTGCCCTTCTGTATGTATGTCTATTACTATACAATTGTGTATTTTTTG
+AGCTAAAATTTATTTTTTTTAAAGGTCTAAGAATGTGTTTAGACAGGCCCGCGTCATTGA
+AATACTAAGAAAAGTAAAATGTTCCCATGGAAACCCTGTGGATGGAAGAAGAAGATAGTT
+TTTCGAATGCTCGACAAAGGTTTTAAAATGTAGTAGTACGTAATGTGAATACATCAGCAA
+CGGTTGTTTTCAGCCGCAGCTTACTATAAATTCGAATGTTTTGAAGTCACTTTTGTAGTG
+TAAGCTCCTCGTGTGATTTTTGAATATTCGACAATGTATTAAAATGATTATATATGTAGC
+TTATTACCCCACGGGGTAAAACTGTTTTGCTCTGTCGGCTCTCTGCAAAATAAATTTAGT
+CACTGCTTAAATGGAACACATGGGAAAACAAAATAGAACCCAACCCAAACTCCCAATAAA
+GTTATTTAAACTAGTTTTGGCAGTATTAACATGCAGTCAATGTGCCTGGAACACAATGTA
+CTTTCTAATACGATTCTAATTGCTGAAACACAATTGTAACTATGTTCCGGAATGTGAGTG
+TGGCCAAAATGGGTTGGACTTGCTGTTTTCAACGGGCAGTTGGTTTACACGGCTCAGATG
+GCTTAAAACTCATGTACGTAGATGGGGACTCAGACACAGATGTGGCAGCTCATGGATTAT
+TCAAATGCAGAAGTCTCACGAACACCAATTAATACGTGAATGCCCGCCAGTGTGGATCTG
+TTTTTTGTGCGACGGGATTTAACAATATTGATTTAACGTTTAATTGGACTGCACTCATCC
+ATGCTAACTGAGTTCCTGCTCGGTATTTCCCCTTTAGTCCTTCGTTTTGGTCGGTTTGTT
+TAATGGGTTCTGGCTGGAAATTTAATCACGCAGATGCGTTTGGCTCAATTAGCTAACCGC
+GGATGTTGTAAGCCCTGCAGCACTTTAACATTAATTATTAAGCAAACGCAAAATGAGCAG
+TGGCACGTACTTAATTTAAATTATAATTGATACGAGTAAACTAATGAGAATAATTCTCTT
+TGTTGTGGGCAGTGCAGATTTCGAAATGTTTCTCTTATAATTAATTAACCCAACAAATTG
+TTAATTTAAATGTCATTTTGGTATATATTTTTGATATATTAAGAGTATGACATAACGTAT
+GGCAGGCCCAAAAATATAGGCAACATTATTTTTCCTCACACCTCAAGGACACATTTTACC
+CAAAACGAAATGATTTCCAGGATGGGCACCCAAAAACCGCAAATCTTCCATATGACATGC
+CACAAGCACCAACAAAAAATCAACCGCAAGCTGTAAAACAATAAAAACTGAAAAATAAGC
+ATAAAAAGTTATTCGAGCAATCCATCAAATCGGTCATAAATTACGAAATCAATGCGACAC
+ACACGCACACATAATAAAAACTCGCTTTCACCCACACTCACAAGAAGAAAGCACCGACAC
+ATTCATGTGCTACGACTTTTTATTAAGCCTACGAGGAAAAATTAGAAATCAATACCAGCG
+AGGACAGAAAAATCTGTTAAATGACAAACAAAAAATGGCGAAAACAACAATCGGTTACTG
+TGTGTATGGGGGTCCTTTCCTTTTGCTCCTTTTGGTGTGTCTGTGTGCGAATGTGTCAGC
+ATCAGAAATTATCCGCTTTATTTTCGGACTGCCCGTAGCCCTCGACCTAGAGAAGCTTTT
+ACCAAAATTTATGGCTATGCATAACCGACATGGGAAACAACAACCGATTGAAAACACATA
+TACCCGTAGGTGCGGGTGTGCCGGAATTCGGGGTGTGCGAGTGGTCTGTGTGTGTGCCAG
+GCCATTAGAGAAGCAAAAGAAATGTTGACATTGTCATAAGAACGGCAAAGAAATGTGGGA
+GATGCGAACAACAACGGACGAGCGCAGGAAAGCGCAGGAATTATTATTATTTATTCCCGA
+GTTTTATAAGATTTCGGAAAGAGGTGCTGGGCGCTCATAAATTCTATCTTTGTAAGCACA
+CCGGAAGATTATTATGATGTTATTTGAAAACCAAACGGACGAAAATATACAACTACTAAT
+TATTTATAGAGGTTTAACTGTTTTGTGTAAGTAAAAAATGTTTATTTTTAAAATATTGTT
+AAATGAAATTGTATACTAAAGTAACTAAAGCAATATTTTATTATAGAAAATGTTATAGTA
+TTATTTTATTTTTGATCCATATTCTCGTTAAACAGATAAAGCGCTTTATGAGACCTAGCA
+GAGAAGTTTGCTATGTTGAGGTAATTGTATAAGTACGCCTTATGCAATAAAAAGCTACTT
+GAATACAATTTCTCTCCGTGCAGCTGTGCCTGTGTGCGTGCGGGTGTCATTCCTTTTGTT
+GGCCGCTGACAGGCAGACAGATTCCAACCGGAAGTCGCGGGAAGCGGAAGGAAATGCCTT
+CGTGGCTGCTTGCCGAGACAGTGTCAAAAGTTTAACTCTAGATTTATTTGCCATTTAATG
+CTGCAGCTCCCCCTTGCTTTGTACAGGAGTTATAGAGGAGTTATAAATCTCCCAGCTGTC
+TAAGCAGGTCAATGCTCAGGCCAACCTCCCGAGAAAGCCGCTGCATTTGCCTTCTCACGT
+TGCAGCTGCAGCCCAGTTCACCGCCCCCTGTCGACATTTGGACCAGTGTGAGGTCTGTTT
+GTTTGCTGCCTGCCACAAAGTTGTCAACGCGGCAACTAAACGAGTTTTGGTCTTGTGGTG
+TTCTCTATAGGTATGTAGTGCGCCTGTGTTTGTTGGTGGGTTTCCTTTGTTGTCCTCCCG
+CCCGAAATTCGAAGTTGTTTTCCCCGCCGAGGGGCATGCGCAAGGAGAGTAACATACGAG
+ATGAGAGAGCGAGTGGTACAACATCTCGAAGTATAAGAGATGAGAGATGGCGTTGCCACG
+TAATTCAAAATTATATAAAAGCCGTATATAGGCCTATACTGTTTTGTTAAATCGTGCAAC
+AAAGTAAAATAATTTCATTGAACTATTTCGATAACAACAAACATGATATTTATATTTTTG
+AACTCTGGGAATGCACAAAAAGATTTCATTTCAGAAAAGATTTCATTTCAGTAACCAGTT
+CAAAACATCATATTTTGAAATGTTGTTTTCTGATTGGCAGTAAAATAATTTTAATTTATA
+ATATTTTTTGAGGTTTGTGGGCACTAAAATTCCAGAAAGAACGAAGAAATAATAATCCTT
+GTAGGTCATAATTCTGTTGGTAAGAGAACCCAACTGAAGTAAATGCCTTAACCTCTCTAA
+AGATTTAAATCAAAGAATTTATAATCATCAATAATCCAACCAATATTAATTCAATTAAGT
+ATTATTAATTTGTTATGTAAGTATTGCTTCTTATTTAAGAGCATTTAGAATTCTGCATTT
+TGGGAGGAGCTCTAGAATTCTGAACTATCTGGCAGCACCATCGACTCACGTGCGTTATCT
+TTGACTCGGGGAGCCTGTGAAATGCAACAAGAGAATGTTCTCGCCATCCGATGGCTCTCT
+CCCTCGAGGGACTCGCTCTTTTCGCACAGATTCGTATAAGAAGAGAGCGGAGCAGCAACA
+ACAGTCGGAGAGAAAATAAGCCATCCACTGTTACGGGATCTCCGTTTGGGCCAGCAAAAC
+GAGCATGGCGACGAAAGGCAGCCAATGGCTTCGATTGGGAGCCAGTCAAAAATGGTCCAT
+CGACGGGAGATGAACAGCAACGAGAGCAGCATCCGCCAGCAGATCCGCAAGCCAAGTCGC
+TGCCAAGAGCCAAAACCAAAGCCAAAGCCAACCGAACCGGGCCAGGTCTAAAAGAGGACG
+TGTGTGGTAGTGAAGTGAGTGTACGTGGACGGGAGTGTAAGTGTCGGTGCCAGTGCATTA
+GTGTGGGTCGCAGGACCTCTTGAAGTCAGACAACGGCAGAAGTCCACTCCTTCGGTGCTG
+GTTCTTTGCTGCTGCTTGTTAGTGCTAAAAGCACGCAGCACGGAGTGCGCCAAAAGAACT
+ACCACTGCTGCAGACACAGCTGCCCCACATACACACCCGCCCGGTCAGGGAGGTGGAGGC
+GGAAACCTCCGCGGAGAAGCCCCCAGGAAGTGCCATTTGAATAGTAGTAGCAATAGGAGA
+TACGTAGACAACATACACGCTTTTCGTGGGCCTCTGCCCCACTTGCGTGGGTGTGCTCGG
+ATTTATGCAGCACTAGTTACATAAGCCATCATCATCATCGGCAGCAGCATCTGAAGACGG
+CCAAGGCATCGTTAACATCAGCCAGCTGCCATAAGTATGCTATGAATTTCGCTTTGCATG
+CGCCGAGCAGAGCGATACTGCTGTTGGGTGGGCTACGGGGGGGATAATGCCGCCGATACA
+GGACCAGCAATGAAAATCGCATTAGCATTAGGATGTGATAACAGCTGCTACCCGCCCATC
+AGCTGGCGACGACAACAGCACTCGGCTGCTCCACAATTACCAAGGCAACAATTGTTGTTC
+AAACTTTGGATAACGCATACGCACTGTTGCACTTGAGTTGTGCCCCAGTCGGAGAAGTCG
+CCTCAAAGACTCGGCCTAATGATTGTTATTGGGTGCCAAGGGTTATCCCAGAGGTTGTCG
+CACAATGCCCACTGAGGCATAGAAAGTCAGTTCGGGTGAATGCCGGTTTTTATAGGGTAA
+TGTAGACAAAGAAAGCGAAAAGCAAGTACTTTGAAGAGCATAATAGCACAGTTACTTTTA
+TTTGGTACCATCGCAATATTTCGGAGCAATGAGGCTTCAAGTCCTTCTGAGATATTTTTA
+ATTAATTAAGTTGGAATCGTTAAATAATTCTGTGGCTTTGAGAAATCCTTGATTTCTGAA
+GAATTAAGATAGACCTTTCAATTAACAATTTAAATAACCAGTAACAGAATTTGACCCAAA
+GGCTTATTTAATAAAGAAGATAGCTGCATTGCATATTTTAAATATTAACGAATTAATTTA
+ATTTAAATAACGAGTTATTAATTTAATAGGCCATTACTAAAATTAAGAATGCAATTTAGT
+TTGAGGTAATAAATTAGAGGCAGTCTCCAACTTTTTTATGCTCACAATATTTTTTTAGTT
+TTAAAAAAGAACATGTTTAGATTATTTAAATTTTTGGGACTGATCCTAGTTTTGTTAAAA
+ATGTACATAAGTAGTATTCATTCCGTAGAAAACAACGAAAGAAACACTCTAAAGTAAAAG
+AGATCGTGATGAAAAATCAACTAGGTTATAATTTATTTTCCGATCATTTCTATAAGAGCA
+ATACTATATAGTTCTGACGATATAGTTTTGACCTACAAATACAAATTTTATTTTTAATTA
+ACACACACTTTACACACTTTTTAATTTTACCCAATTTTTTTAATATCTAGAATTATATGA
+TCGTATTTTATTTACTAAAATGGATAGGTTAAATTGGACAATAATATTCAAAACCCTAGT
+TCGGTTAAATAAATGTTGTATTTTTATGAAAAGATAGTAAAGGTGCTAAAACTCATAGTT
+AGTTTCATCAGAAGTAACATACTTTACAGTATTATAATGTATATATTTAAAGCACCCTCA
+CATAATACCAGAGTTTAACTTTTCACATACAGAAACTATAGAGCACGATAATACTGCAAT
+AATAGAGGGAATTCACGTCACTTAATACCCGTATAAAAGACATCTGCTTATCTGCATTTC
+ACAGAGCTCTTTCCCTATTTACGACACCTTTTAAAACGATCGTCAAATTTGCTTCATATC
+ACTTATATAATGCCGGTGCCCCTAATTCCCGCAGGTGGCAAGTGAGACGGCTGCCTCTAC
+TTCCAGCAGCGCCATTTGAAGTCGGAAGCTGCATGGTTTTCGCATTTTTGCCACAATCAG
+GAGGAAGCTCATTAAAGCCAACAGCAACAACGGCAATACTAGAAATAAGCTGAAAGTTTT
+CCACCAGAAGGAAAGCGGGTTGGGGAAAGTGCGGGAAAAGGGAAGGGGAAAGGGAAAGGA
+AAAGGGAAAGCTGAAGCAAATGAGCGAAGTCTGGCACAGCGTGTGGGCGTCTGTGGGTGC
+GTGCTGGGGCGTGGCAAATTGGGGCAGCAGAAACATGATAAGGTCTCAAAATGTTACCAC
+AAAAATCCATTGGGAAGTACACAACATTTCCCATTCTGGCCGGCGCGTTGGAAAGTAAAC
+CGCAATTAAATTTGCATTAGGCAATAAAAACAAAGCGGAGTGGCCACTTGTTGTTGTCCT
+TATTGTTGTCTCAGCAGCTAATTACAAGAATTTTGCAGCAGTCGTGCCGAGCGGGATTAA
+AAAACAATAGATATGCCAGGACTGTAAATGCCTTTTCAGAAGTGCCACAAACACATGTAC
+ATAAAATAAAATAAAAACAAACACAGGAGCCGCGTTTACAAATAGAACACAATAAAGGAT
+ATTATGTTGCTGCCAACATGAGTAGAAAGTCAGCAAAAAAATCACCCCGAAAATAAGCTA
+ACAGCAACACCCCACAAAAATAAACTGAAAAAAAGGAAAAAGTTAAGAGCGGAAACAAAG
+TAAGAAAATCATAATGATGATGGATTAACTGCTCCCAGTTGATGCTGATGTTGTGTGAGT
+GAGAAAGCGAGTGAGTGGGAGGAGCAGCGGAAGTCGCAGCAGCAGCAGCAGCAGCAACAT
+CAACACAGCAGCAACATCGACACAGCAGCAACATTGCAACAGCAGCAGCAACAGCAACGG
+CCAAGCAGAATCAGGTTAGTTATTGTTACTTCTCGCCGACTTTTCCTTCCTTTCGCCCTC
+GTTATATACCATTTTTTGCCCGGTTTTGTGGTCCACTCGGCGGATGACCACAGTTTGTGT
+AAATCATTATTTATGCATTAATTATTAAAATATACACACACACAAATCGCCACTGGCAGC
+TGCCGTCAGCGGCGGTCATTGGGGAAAAGTCATTAATCTTGGAGAGCTTACACGGGGCTT
+TCGGGGTCAGTACATAAGAAATTACGACCGAAATTAGGTACGTGGGCGAGTGCTGGTTAG
+CTGGGAATATTGAGTGAGTGGGTCGCCCCCCCCCCTGCTGCCCACCGTTAATTGAAAGTT
+GGTAAGCTGGCAGTTGCAGAATCCCTTGTCGAAAATTTTCACGAGAAATCATGGCTGAAA
+TTCTAATTGCTGCAAGGAATTTCGGCTCCACAAACTTTTCACAAATCCAGCTGAAATTGA
+CAGAAGCTATGCTCCCATTTCGAAATCAGGTTTGCCTCCGTTTGACCTCAAACTCTTTTG
+TACGCTTCTTTCTGAGAATTCCTCACTCCTGTCGAGCTAGCCGAAATATTGATTAATTAA
+CGAGGCCAAGCAATCATAAGAATGTTCTATTGAAACTTGTTTTGCGATTGTCTGACCCTT
+CTTTAGATAAAAGTTAGATAATACTATCAATAATATTCCAGTCATGTTCTTTTGTTCAAG
+ACCCATTGCGAAAACGTGATGAACTCAAGATTAGACATCAATGGAGACTTTTATAGAGTC
+CCTGAGGTATTCCTTTATAAGCTTCTGGAACCATAAGTTTGATGCAATTAAATTTAATTT
+TAGCTGCATTTCTTTTTAATCTCATTATGGCAGTAAAAGCTTAACTTAGTCCGCCCCGGC
+CACCTTATCCACCATCAACTGGACTTTCTTCTTGGGAGCCCTCCAGGAGCCTGTAGACGC
+TGCAGGACACCGAAAAGTTTGCCAGAAAGAAGAAACTTGTCCAACTATACTAGAAAGTTA
+TTTGCGAATGTTTCGTTTTCTGCACTTCTAAGCAAAAGTTGTCCAACCTCCAATGAAATC
+GCATCGAGCAGAATGAAATATAATAAAAACACGCTCCGAGTTTGCCTTTTTGATAAACAA
+TTCAAACACGAAGCCCACACACATGCGACTGCAGATTCAATAACAATTTGGGCGAGGACT
+TTTCAACTATCCCCTTGTGCTACACCTATTAAAGGAGAATACCTTCAAAGAACTCTTGTT
+CCAATTGCTCTCGTACCTGGTAGTTACAATCTAATGGCAGAGAAGAGTTGTTTGGTGAAA
+ACATTTACGTGGTTAGTTATTATCTGCCGGTGGATACATATGTGTTCCTGATAGCAGCCA
+GGAAAAACACTTGAACTGTGCAATTAATTCTGCGACTGTCCTGTTAGCAGGGGAGTCCCC
+GAAAGTGACGTCTTCTTTCTCCGGCTGAGACTGCGAGCGTGCGTTCGTGCCATTTATGTG
+TGAGCTCGGCAGCGTGCCTAGCATTAAAGAATTTCCCAATGAAGTCATCCCGACCCGGGA
+GGGTCCCCAGACTCTCCAGCTTCGAGATAGCATAGCCCAACATCCTTCGAGACCCATTAG
+GAGGGTCTGTCGGTGGGGAAGGGAGGGGTGTTTATTTCTCTAACTGTTGTTGTCTCGTAA
+ATTACAGTTTTTGCCAGAGTCCTTTGTCCCTCGCATTGTGCTCTAGTTGGAAAATTAATA
+TAGACGTGCAAAATGGCTGACTCGGCAGTACGACTGTCTGCAGATCCTTCCAGGCCGCAT
+CCTTTGTATTTGCATTTGAAATTATACTGTCGCAACTGTTTGCCAGAGCCAGGTGAAGCT
+CTTAATGTTATTAATTCCCAAACAGGCAGACAATTTTGGCCCAAAAACGAGATGGAGAAC
+GGCCAAATGTGAGGCGAGGCAAGCCAGAAAGTACATTTGCAAATGGAATGCCAGAAGGCC
+CGGATGGAAGTGCATTAAATTGAGTGAAAAGCGACCGACTTCAAACTTTTAGACAGTCTA
+TTAGGCAAAATGGCTCTGTACAGTCCCTGACTAATCTACTTTATATGCAAAGCCCCAGCC
+ATCCAAAACTCATCCGAATTGAGTAAAATAATTGTTATCCAAAGGCCATTGTATGCTAAA
+CCAAAGCCTCTTAGAAGCTTTGGATGGTAGAACATTTTAAGCTGATTCAATGCGTTCAAT
+TTCAATGCAATTGACCCGAGTTCGGGTTTGGTTGGCAAGCTCATTATTCGGATTATGCAG
+ACAGATATAGTCGTTTAGTCGGTAAGTCCTATTTAAAGTTCTTTGCATTGCGCAAGTAGG
+CATTCGTCACTGAAAAAAACATTGTCTCTGTTGTTGATCTTTGTGGGGATTGCGGATAAA
+TAGGCGGGAATCATAAATATTCAAATTTTTATTCACACCATTTTGGAAACAATTATGCAC
+GCTAAAATCTAAAATAAATCGAACACTGTGGATGATTTGGAAATTATATCTGGTCTTTAA
+ATTTAGGTTAAATCCCCTACTATTCCTAGGTTATATTCGTCACATGCCAGGACCCGTAAT
+TTAGTTATTTTTAAAATCAACAATTCCGCCATTGGGAACCTACAACAGCTGTCGCCAAAG
+CTTTTTTTGTCAAACAATTTCTCAAAATATCTAATTAAGATACAGCAGGAACGGAAGTCG
+GAAATATCGAAGCAGAATTATTTGTCTAAGGTATCGCAAGGTTGGCAATCGAAGGCAATT
+AACAGGACAAAGGTCCGAAAGCCGCTTAAGGAAATGACAGGGTTCGATCCCACTCCACTC
+GCACCTTTCATTGCTCTTTCCCCTTCAAATCTGACTAATTTTAGCTACGCGTCTCTCGTC
+GGGTCCTTTTCGTAGAAAAAGGAGTGAAACTGCCTAAATGTTTGGACAATTAAAAAGGGT
+CATCCTTTAGAGCAGAAAAGAAAGAAGAACCAAACAAAGTGATTTTTTTGTTGGTGCAGA
+ATTTTAAAGTGGACCTAGCCAATGGTAGGGAAAACAATTTAAGTGGGATACCTTGGATAC
+CCTTGCCTAACAGTTACAAAATAAAAATTCTATGATTATTTTTAGACGTCTGATTTAACG
+TCGGATTTAGTCAAGAATTTTTTTTTTTTTAATTTAGATCTAATTTTGAATTTATGAAAA
+GATTTTCAAGCTATCAAATGTGGCTGTATATCAAATTTGAATATCGATTTCACATAAAAT
+ATGACGTCTACTTACTATATTTTATACTCAACATTGAAAAGTATATAATACCAAATAGGA
+GTAGATTTCTTATACGCTAAGTTCCTACTCACTTGTATCAGTTTTCCGATACCCTTTTCA
+CTCGCGTTAACAAAAAATCCAGTTTTCGCTTTTTCCGTTCCTTGCCTTTTTGTCCCCTTT
+CCCAACTTTTTGTTTGCCTGAAAATTGGTTTAATGGCCAAGCGCTTTGGCCAACACATAC
+ACACGCACACAGAGACGAACGCATATTGGGGCAATTTCGTGGGAAAAGCGGGAGGGACAG
+AGGCCGCGACATGCTCCGTCCCACTCGCTCTGTCAAAGAGGAAAAAGTGCGGTGGCACTG
+AGTAAAATAAATAAATGAAACAAAACAAGCTTAGCAACAACATGGAAACTTTACACAAAC
+TTTTGTGCCACGTTGTTGCAGTTGTTGTCGCCCGATGAGCCCGATAGATGTGTCAATAAA
+ATCAATATTTGCCCTGCCTTTGCGACTAAATGTTCAATTAGCGCATCAATCAAAGACGCT
+TGAGCGAGTCAAATGGGAGTTCGCCAGTGTATTTTGAGCCACTTGATACCGGGCTTATGG
+GATGATTTAGGAGTAATATTAACTGTGTGATTAGACCGCAAATATTTAACTAATTAGCTA
+ATAAGTTAAGTCCACACAGGGCCAAAACGCTGGGTACCCAGCAAATTGAGTTCAATTGGG
+TGAACTGCGCAAATAAATTCTGCTGGCTGATTTAACTGGGTAAGATAACCAATATGCATT
+AAGTTAAGCTCCTTAACCAAATGTCAAGAGAGGTCGTCCAAGTAAAACATTTTAGACCCA
+ATTTCCCTATATCAAAGGGGGTGATTAAAAGCGTAAATGTATTTTGCGGACGGCGATAAG
+CATAACTAGATTTTGGAATTAATAGACCGTATTTTACGACTCACCTTGACTCCTGTTTCT
+AAAGCAATAACATGGATACCAGCAAAGTTACGAAATTATTGAACCTAATTTGATGACGAA
+AAAGGGGGAAATAAATAAATTATTAAGGGAAAAATAAGTGCATAACTTTAGTCAGCAACA
+GCTGCATGTGTAAAATAATAACTTTGTTAAAAATAGGCCAATTTACCCAATTATATACAA
+TCAAAAGTAGGCAATAAAAACTTTTTCCATGATCAACAACTTTGATGATATGCAAATTGC
+TTGCCTTGCAAGGACAATGTTCCCCGCTTTTGTAAGGCTTTCATGTAATATATGAGATAG
+ATTTCCCCTGTGATTTATCTTTCATCTGATTTCGGTTGGCTCTGGCACAAGCCTTGACTT
+GCAGATGCAGCACACAATGATATTGGGGCTCTGCACTTAATCAAATAAATGGTTGACCAC
+TGCCTCGGCCCCAACTCAATTGCTCGGTTCGTCTGTTGACGGCGATTGCACGTAAAGCGA
+TTTTAGCTGCATTAACAGGACGAGCGAAATTGCAATCATTTATGCGCATTTAAAAGCATT
+AAGCGCGTAGCAGTCGCATTAATCATACGCCACGTGTGCCCGCCCCTCCGTCGTCTGCTT
+ATCGACGAGGCTGGCCTCGTGGCATGGGTAATCATTTGCCATGTTGACTGATTTGCAGCA
+GCAACATCAGCTGGACATCTGCTGCTGACCACGCAGCAGCACTTTCGTTACGACAGCGCC
+ACCCCCGCACACTGGTCCAGACTGATTTGTTTTGGCATGAACTCTAGTATAATTTTCAAA
+TCTATAGTATCACGTGTTTCATATTTTGAATAAACATAATAGGCTTGATATTTTTAATGA
+AAAACAAGAGAGAACCATATAGTCGACTGTCTCAACTATCAGATACCCGTTATTCAGCTA
+AAGGAAGTGCGAGAGAAATGGAGATATGCTTGCAAATAGGCGGTTTCCGAGATTGCACCC
+GTTATTTGCTTATATCTTTTTAGTGAATGGTCCGATTTGAACAATTTGATTTGGCATGTA
+GCTGGGTATTGATAGCCAGAAAAAATTGCATTTACACTTTTAGACAGGTTATTATATGGG
+CTTTTGTGGGCGTAAGAGTGGGACTTGCACTCCGCTGAAACAAACTTGTGCTGCTTCAGA
+ACCCTTGGAATCTGTATGCCGCATACAAACTATGTACATTTTATGGACATGGACATGGCT
+AGATCGATAGAGGGAATATTTATACTTTATAGGATTGGAAAAGATTCCTCCTACCTGTTA
+AATACTTTCCAACGAATATAATATAAGTATATTCAATTTAGAACATGCTTAAAATATATT
+AGTAATTAGTAATATTATAAAGAACTTAAACCAAGTAAACGAATAGCCTTAATTAGTTGC
+CATATGAGTGTGTAATAAAATTGAAGCAATAAGTTACTGATATTTTTTTTAAACATACAA
+AAACAAATAACATCTGGCCCAGTGTGCCAGTTGAAGCACTGCCACAAAGTCGCACAAAGT
+TATGCAATGAAACTTGCCAACTGAGAGTGCGTGAGTCCGAGTGCTCGTGTGTGTCCGTGA
+TTTCTGCGTTTGTGCCTGTTTGTGAGCGAAGGCAAATTTATGGCTAAATTTATGTGGCCC
+GAGACCCCTCAGAGGCTATCAGTGGGCCCCAACGAGTGTGCGACCCTTCATATATGGACA
+CTCCCCTACCGCTGGTCGAGTAAATATCCATGTACTGGGTCTGTGGCGTAAATAATTCAC
+TGTGAATTTTTAACATATTTTCAATTGAATAATTTATGAGCACAGAAACAACCTTCTGCT
+GCGGTAGGCAAGTCATCGGGTTCGCTATAGATACATTAGCTGCTGAGTTTTGGATCGGCT
+TAAATGACATTCTAAAGGAACAATTTACTGTGATATAGGGTAAAAATGCTTATTTTGTAT
+TGAAAAAAGGAAAACATAATGTGTTCTTTCTTTTATACAAATATATTAATACAATTAAAA
+AATATAGACCCTATATCGCCTACTCAACTAAGTATTTTTCTACATTTTTGTTCTACTGCG
+TTTATTTAAAGAAACCCCACACTGACTTAAATTGTTTGACCGTATAACGATATGTATGTG
+TACTTTATTCCGGAAGAAAAGGCGTTTAATTAGTGACCGGCAATTATAATCGGAGAAGTA
+AAATACAACCAGTTGCGCCGTTTGCTCAATTTCTGATGGAAGGACTTCGGTAGAGCCATA
+AATTTTAATGGCACATCTGAATAATTAATGCTTGCCACACATGCAATATTTTTAATTACT
+TTGTCGTCTCATTTATTTTTGGCCACAAGGCACAAAAACTTGCCCACAGAAATGTGCTGC
+TAGTTGCATGAAACGTTGATTAAATTATAATTATTATAAATGGCCATCGTTTGTGGCTAA
+TTTAATGAGCCAGGTTGTTTAAAATTAATTATAAAAGCTAAGTGCTCAAAGTGACCAGCC
+AAAGATAGTGTGTCCTTCAAAGTCACACCTTTGGATATATATACATTTTGTAAGTTTATG
+CCTAAATTAGACAAGTCACCTTGAGTAGATAATTCGGGTTGCCCTGGACTCTATATATGT
+GGTTGTGCTGCTTGGAGATTAAACCACTAAGCACATATTATTGGGATTATCAATCTACTC
+AACCTAATAACATAACGCACAATACCGCATTGATGATCTCCCAGAAAGTGCTCATATTGC
+TCATACGCCACGTTGCCACAGTCCATGTTATTTCCCATCGGGGCACTCATAAGTATGATG
+CTCCCATCGGACCCACTCACATGTCCATGCTCATCCACTTGATATTCGGATTCCTATCGC
+CACTTGGCATTGACCCACAAATTGCACAATTTTCGTTAACTGCCCAATTTGAATGTCACC
+GGGGTTCATCGAGGACCCATCAGTGGACCGGGCCGAGTTCGCTGCCTTCGATAATGTGTC
+TGCTCACTCGGCGAGAGCCACCTATAAATAAAACACAGATTTGTAGCCATTTTGTTCCAC
+AAAAAAATTAACTTAATTTGAAATGCGGCGGTCCGAAAGAGAAAAGAGAAAGCCGAAGCC
+AAAAGCCGCAAATATTTTTACGCTTCAGCGCGCCTTGTACGTGTATGGCACCGCGTATGA
+GTGTGGGTTCGGCCGCCTCGACTGTGAGTGTGTTGGTGCTCCTTTCGTGGTGTGAGGTTT
+TCGACATTAGGCATGCATTCAAGTTCTTGGGAAAGTCGCCCCAGAGTATCTTGGGTGGAT
+GTTCCAGCTCCCCAGAGCCAGCTAGGATCGCAAAACTTGGGATGTTAAATGGGCGTGGCA
+TCGTCTGCGCCACGTACACGCGAAAATTGACTTCGGAGGGAAAGTGTAGGCCAAGAAAGG
+AGAGCTTTTAACTGGGTTATTTTAACTTGTTTAGCAATTAAGCTGAGGAAAGTGAGCAAG
+AAAAAGGCCAATAAAAAATCTAATTCCCATTTAAAAGTTTTTAATATCAGTCTCATGTTT
+TGTTAAGCAAATCGTTCTTACCATCAAAAATCCCGATATCAAACCCTGTTATTATAGGCA
+TGATTACTTAGCCCGGGATCACTTAGGTTTTGTTTGATTCCCTTTTGGTTTGTCCAGTGT
+AGTCAGGGCTAGTCAAGTTATTTATAGATTTATGCACCCTCACGCCCAGTCCCGAATAAT
+CATTGCCGCCGGATCCGAGGCTTTGGGCCAAAATCGCTTGGGCCAGCAAATAGTTAATTC
+GCCATCTGTGTGTGCTTGTGAGCTGATGGTGTTTTTGTGGACCCGTGCGGATGAGCTGTA
+GTCCACATTATTGCAGCGCGACTGAGCAAACTACTTTGCCTGGGCTGCGCCGACCCTATT
+TCCTTCCAGGCCACTGGGGGAATCTTTTATATGTTCTCCGGTCTCAGCTTTCGCCTGCCT
+CTGGCGCACATCCCCAAGTAATGTTGGGTATCCCGCAACGTGTCCTGGCCTGGCCAGTAA
+TTAACCCCTTTATTAATATCCCAGCTGTAAAAGACTCATATGAGCTGTCTGACTGTGTGT
+GTTTGTTCTACTTGCCCAGGAAACTTTCTCAATCTCAAGAGTATCAGAGTTTGGAACACA
+TATGTTTAGAAATTTTGTAGTACATTTTATAAAAATCATTGCATTCCGCGTTGGCTTTTA
+CCGATACTGACAAGCTTAAAATAAATTTAAATCACGAAAATAAGATTTTTATGATTTTCA
+TATATAGTTAACCAAAGATAGCAAAAATAATGAACCTTTTTTAATTCTTTGATTTCTAGA
+TCTCTAGATTTCCCAAAATCATGAACAAACATATTTTGAGTTCCCTATGGTGCTAACTAA
+TGAAATATCAGTCTTGTTAAGTACACTTAACCTAATTTACTTAGCCCCTGTTAACTTTCC
+CGTAGCAAGGTGCTGTTAAGAACATCCCACAACTTTCCATTATCTACTATGCCCATCGAG
+TACTTAGGGTATCGGTTTCCCCGTACAGGACGCCCCATAAAGTTTCGCCCCATTGTTTGC
+CGTTACCAGGTGTGTAGCTGTATGCCCTGGCAGTCCTTGCCAATTACCCGAACCGTTGAT
+TCGCCAAACAAAGGATCTGAGATGGGAAAGGTGTTAAGTCATGCTAAATATAGTTGCTCG
+GCAGTTAATTAACGCACAGAGACATTTACAAACAGCGTAATATCAAAGTCAGGGCTGCAT
+ACGGTGGGGTTCCTGCGGCTCCGGGTGAATCCTCCGCTCAGTCTGTTGCTCCAGCCTCCG
+ATCCCGTTCTCGATCGCGGACGCGCTTCTTGCGAAGGTGGTAACTACAGCAGGCCTCACC
+ATCCTTCTTTGGCGACTTATCTTCTTGGTTACAGCCCTTTCCCCGAACTCCGTTGCGTTC
+GCCATCCCTAGTCGTATTTTCAATCGGCTCCAGCCCTCTATCCCGGTTCGTATCTCGATT
+CCTTGCCGAATCTCGGGGATGCTGCCTATCCCTATTACGATTCCGTTCAGTAACACCCCT
+TTCTTTATCCCTGCCCCGCTCCCTGACCTTTTTACCCCCTTGCTTTTCCTGCGGAGCCTG
+CGTTTCCTGCTGCAGAAGCACCCAGTCGTACACGGAGTCATTCAACAACGTCTGGTTCTT
+GAAGAGCACCACGAAAAGCTGACGCAGATAGAAATAGTCCGGATTTTCGGCGAAGTGCAG
+CTTGCGGCAGTACTTCAGGTACACGTAGAACTCAGTGGGCAGGCCGGCGCAAATGGCTTG
+GAGCGACATATTCGCCTTGCACTCGGCTATCTTCTCGTACTTCTGGACCTGCGACTGGGC
+ACGGATGCCCTGCCAGGGCAGACGACCCCGCTGGAAGTAGAGCAGCAAGTAGCCCACGGA
+CTCGAGGTCATCCCGACGACCCTGCTCCGCGTAGTGGGCCCGCACACTGGCGTAGCGAGC
+CGTGCCCACCAGATCCTTCTTCTCCGAGTAGCCGATGTGCTTCTGGGAGCGCAGGCTGTA
+GAACTTCTTGGCCAGCCCGAAGTCGATCATGAAGACCTGGGTGCAGTGGCGCCCGAGGCC
+CATCAGGAAGTTGTCCGGCTTGATGTCGCGGTGGATGAAGCACTTGCGGTGGAGCAGCTC
+CACGCGCGCCAGGATCTGATCGGCCAGCATCAGGGTGGTCTTGATGCTGAAGGACCGCGC
+GCAGAGGTTCAGGAGGTCCTCCAGGGTGGGGCCCAGCAGGTCCATCACCATGACGTTGTA
+CACCCCCTCGGTGCAGAAGTGCCGCACGTGGGGGATTCCCTCTCCGCCCCGCAGGACCTC
+GTAGATCTTGGCCTCACGGGGCAGCAGGGGATAGTTGACCGACGCGCTCTCCAGTTTAAT
+GGCCACCTTCTCGCCGTACTTGAGGCCCTCGGCCCGATAGAGCTCCCCGAAGGAGCCGTT
+TCCAATTCGACTCAGCAGGCGGTACTTCCCCGCCACTATGATTTCCGGCATGGATTGCTC
+CCCTTCCGAAGATCTTTGGGATCTCTGGCCATTGTCATGGTTACGATGCGGCTTATGGGG
+TGGTGATGGATGAGGCTGCTCTGTGCGGATCTGGGTTTGTGGGGGATTGGCGTCGGGGCT
+GCTCTGCCAAAACCTCTCGACCTTGCCACGCCTCCTTTCCGGTTCTGCCATGCGTTTTGG
+GGACTTTGCCGAACTTCTACGCTGCCAGAGGAGAAATGTTTCTGGCATTCAATTGTTGCC
+ACTTTTGATTAGTATGATGTGAAGTATGAGTGACTTTTCCCAGGTCTTCGATCTGAGCCC
+GAAAATAAGGTGAAAATTGAATACTTCCCAGTTGAAACACTTATTTAATAAAGCAGTGGT
+TTAACCATTTTAATTAAACTCAATATTGAGGCTTTATTAAATGTCAGGAATTTTTGCATT
+TATTCAGCTAGAGAAAATGAAATCACCGCACATCCAAGCCATTCCACATCACGTCCACTC
+TTCAGTGTCAGTTGGAAATATTTCATTTTGCTGAAATTGTTTTCGCAGCAAGTTTTCGTT
+CTTTCTGGTTTGTTTTCATCCATTTTTTGGCAGTTTAATAAACTTTGGCACTTATTTTCC
+AATTAGCTGTAGCGAAGTTATGCTGTCGAACCGACATTCTCGCTGCCGTCGCACATGTAG
+TTCGTCCTGTGGCGGGGATGTTCTGCCCGGAACCGGATTAATTTACTAAATTGATTACGT
+AACCTGACTGGCTCTATCATCTTCACATCCACCGCAAACATCGCCATCAAATATGGTGTG
+TGCATCACAGCTGCCAGTCACTTGAATGCTCGGCTGTCTGTTCGATGGGGACCTGGAATA
+CTTGCCCCTCGGGCTCTGCAAACTGCACTTTCAATTAGGAGAATTTGAACCGCCTACCAT
+CTACTCTTTTTCATACCCACACCCATGGAAAGTGAGGACGAAAAATAGTTTGCTTTTGTC
+CCAAAATGTTAAATTCCGAACTCTGAAGCACCCCTCTATTATCTATTTTGCCATTCGAAT
+GCTTCTGAGTTGATTAGATTTATGGGCAATCCGATTGTAAGCAGTCATAATTAAATTGCA
+CAGCCCAAATTCCGCTGGATTCGTTCCAAAAATGTTTGGTAAGCAGTATGTGAATGGGAA
+ACCGCGCATAATGCAGAGTTTGAATGGCAAAATAGTTTTGCAAACTAGGCGCAGTTGTCA
+TTTACATAAAAGCTGTGCTAAATATAATTGTTCCAAACGTTTTAGGTTCAGTTTTAGTTT
+GAAACACTGATTCCTCTTTGTTCCTAATATGCCATTGACATACTTTTGTCGCTCTATGAA
+TATTATTACTTTGTTTCCCAAAATTGTATTACATAAACATTAAAATTTACGGGTCAGTCG
+GTCTGATCTGCATATTTTTCCGCTTATAAGCGGCCATAAAATGAATTAATTGGCCACCTT
+GACAAATTGTAATGTCGAATTCACTTCCGCAGTTCTCGGGGAAGATTCCTCTGCGGCTGG
+AGTAGCGACAATCCAGACAACTAAATGCGAGGATCCGGCCATAAGCCCTTATTTATGCCA
+TGCGAATGAGCACATCAAGCGGATGGGAGACGAACCGGGAACAGGCCCACAAGCCACGTT
+AGTCCCGACTACTCACATGGGCACCTCCCCGTCCTATCCGTATCCCACATATCTTTCTAT
+GGCTCCAAGCCCGTAGGACCACCCATCGCATGCAATACTGCTGCCTTTATGGTTGCTTTG
+TAAGAGGCTCTAGGAAGATGTGGCATTAACTTAAAGCTTATGGCGCATTAATTTTAATTA
+AAATACTGCCGCAGCAGCCAGCGGCAATAAAAAGCAATGTTATAACTATCCAATCCCGGC
+CACTTCACCCCCTCCCCGCCGCTCTTTTGCAACTTTGAATGCTGGAAAAGTTCATCACGA
+AGCCTGTAATGATTAGCCATTTAAAATGACGGCGCACTTTTCCTATGAACATGCCCAACT
+TGGACTCTTTTTGCCACTTATCGCATCTTGTTTTTAATTTACAAGTGTCCCATCAATGGC
+TCGTTTCTCACACTCCTGCCCTGCAATTGAAAACATAAGTCCCCTCCAAACTTACCCCCA
+CCTTGGCCACGCCCCGTAATCCTTTATGATGGCTTGTCAAAGGTTATGACCAAATTGTCG
+GCACATGCTCCGCATATTTCATAGTTTTCTCCTCTTCAGTTCCCAATTTTTCGGTTGTTG
+TTCGGTTGAAGCCACAAAACTTTTTGGACAGCTGAATCATTTACATACACGCTCGATTGC
+CAGCCAGCTGGAGTTCTGCGGCCACATGGCGAATGTGTGACGGGATGTCTTGGGATCGGG
+ATGCTGTCTTCCCATTCGCATCGACTTATGCATAAACGCCTTTCCGGGTGTGCCCAAAAG
+TTTTTGTTTGATCTGTCAACAATGGAAGTGGTCTGAAAGTGCGAGAGCATCCATAAGTAT
+TTCAAATCTTAAAGTACATACTAATAATTGCAGGGTTCATCATCTGTTTTTAGGGTAACC
+TACAGCTGCTAAATGTTGGCAATTCAAATACTTATATGCTTTGAACAGTAAGCATTAACA
+TACCTACTCTCGATATCAGACAAGTGTAATGGTTATTATCGTGCCTAAACAGTTAAATTA
+TATCATAAACGTCTTATATTGCTTACTTTACTCAAATTTTAAGTGAAATAACCAGTGTAT
+GACGGATTCCTCAGGTTCTTATTGCCATATTTCTCCTCCTCCGCTGAACTCGACTTTCCG
+CACTTGCTGCTTCTCGCCTTGTAATGCAAATTAGTTCGATATGACTTGCTCAGCTCCCTC
+CCATGGCAGCCCTACAAAATTGCCTTAATGGAAATTATTATCATCGTGACAATGCGTCAC
+GGCCACGCCCACGCCCACTTCGAAGGGCGTTCGCCTGATTATCAGGGGCGGCGACAATTT
+CGCTGACATTGTTGCCAACAAGTTCCGTACGGAATGCGGGGGTACGAAAATTCCTGCACA
+AAAACTCATTAAAAGCGACGCAGAAGATGAACAGGAATTGCTAAGCAGGCGAGCCTACCC
+CTATATACACATTATATCTGCGCACATCAAACATCAGCGGATACAGGAAAAGTGTAAGGA
+TGACAAAGGCAAACAATGAGTTGCCAAATTGTTGAGACTCACTTTTTTCCACCTCCCAGC
+TGCCGGCTACGATAGAGATATAGATGCCAAATTATAGATTAAACAATGACGTGTTCCCGA
+TAACCGGCTCCCAACTCACACCGCCCAACGCCCGCCCCAAAGCTTAAATACATATTCAAT
+TTGTTGGCCGCCTTCGGGACACGTACATACAACATTAACATAATTTCGACGCGTTTCGGC
+AATTTGAACACGTTCAAGAACCGCATCCAAGCGTCCTTCAGCCCACTCCCACTCCCAGTA
+CCAGCACCGTACCCGAAACCCATCCAGCCCGTCGATTGTTTGCTATTTTTAAATTCCAAG
+GGCGTAACTAGAATTTAATTTCTCAACTGCCTAGTCGTGGCTTTGCGATGTCTAGGCTTT
+CGGTTGGAACACGTACATGCACTTGTTTCCTGGGTGGTAGAAGGAAGTATCCCGGTGGAA
+GGAGTATCACGGGCTGGAATCTCCCTGATCTGGGGTGGGCCCTTCAAGTTAAGCACATCT
+CAGGACCCAGCTAAGCCCAAAAACAGACATTTAGCATACGCTTGCCACAAAGTAGGCGCA
+TATGGGTGGCTTCTACTCGATATCCGTTTATTAATATCTCCAAGTGGCAGGTCTGCGTTT
+AAAAACAAATTAATCTTTGCTCCTGAAACGTAACATTAATCAAATAGATAAGGTGCCTGT
+TGAGGAAATTGGGGTTTCTCTATCGTTTATGTGGGAGTTAACGATGAAGATAAGTACACA
+GGTACATAAAGTACACAGTAATTTTATACAAATCTAAAAACAATGATGATGACCAACTGT
+CATCTTAACTGGCACTCCAGAAAACGGCCCTTAGAGGCTTTCCTTTTACTTTTCGATATG
+TTTTGAAGCAGTTTCGCTTTAATTGGATTGAATCATCTCTTGTTTTTAGAGAACTAAGCT
+GCCCATCACTTTTTAAGTTAATATCCTAAATTACACACATGTCCCAACTGATTTGTATTT
+ACCCAGCCATTTAAAGAGACTCTTATGCAACAACTTCCATCTCGCCTTGGCGGGCTTTAA
+TTTAAATCTCTCACGCTTTCACGCATGTGACTGGCGATGTTGTTGTAATTCCTGCCTGCT
+GCTTTTATGTCAACCAGGTCAAAACATGACCCCGGCCATTAACGAGGGGATCTTGCCCAC
+GCCCCTCCGCAGCGCCAAAACGTTTTAAATTTTTTGCCGCCCTGTGTGTTTTTCCCCCGG
+TTTCCTGTTCTTCATTTTTTATCTCAGCTGCTGTGAAAATCCGATGAAATATCTACTTAG
+GCACAAGCACGCGGCATGTGTGTGTGTGTTTAAGGACATTGGGCTTGTCTGTGTGGGTGC
+GTGTTTGCATTGGCATGTGTGACTTGGCATCAACTCGTGCGCAAAACAGTTTAAGAAAAT
+TTCATCTGTCTTGCATTTTAATGATTTAATTTTGCATAAGCTCATAGCGTCGACGTCCTT
+GCCCCGCCCCTTCCGCTTCCGCTTTCTCTTGCTCGCTTATCGGAAGCCAGGATGTGTGGC
+GCTATCGGGTTTCCCTCGGCTTTCCCTGATTGAGTGACATGTCAGTTGATGACATTAGCC
+AAAGCCGGCTTGCGTCTAACCGACGTGGGTCAGGCTAATCCGAGGCATTCCCGAATGTCC
+TGGCAATCAGGATCCTCTCACCTACTTGGCGCAAAGTTTGCCATTCCGGTGTACACAACA
+CGACGCACAATCCTCAAGTGTTGCCATAGTTGGTGGGGTCCGTTTGTCGGCTATGTTCAT
+CTCGGCAAACTTTGCAACTGGGGCCCGAGTTCATTATTTCGTTTTCCGCTACAATTTCTC
+AAAGGATATGCGTAATTTCCGAGCCAAGTGACAGCCGCCTGTTGGGGCAAGGCCCGTGCT
+CCTGCTAATGATGTCCTTCATGTCAACTGTGAGTTTCGTATTGCTTCCTGCCCGAACGGC
+CTCCATTCTGCGGCCGGAGGACGCCCTGAACCCAGATGCGACACCCCCATCCAATTCGCA
+CCTTCCGTTGACTTTGGCACGCAAACGAAATGAATCCGGCTCATCAACGTGGAAGTTCTC
+TGCTGATTTCTGCTGCCTTCACACCCCCAACGTTCGACTCCCCTTTTCCATTTGATTTTT
+CCGGTGCGTGTCCGAGGCGAGAATTGAGCCTTTTATTCGGATCTCACGTCCACATGTGCC
+CACTTGTCAACATCCTCTGGGTCCATCCATAGTGGTCCCTTGTTTGGGGTGGGAACAGGT
+TTTATGATCCGCAATTGCTGTTCCGGCATCCGCATGATTATGCCAACACGTTCTGCCATC
+TTGACGATTGTGAGGAACATGTTCGCAGAGCGATGGAGTTATTATCCTGTTAGTTCATGG
+AGCAAGAACAATAACCAAATTATGCTTAATTGGAGCGAAAAACTTATTCTTGGATAATTG
+ATGATAATTGGATCACTTTGGAAAGTTCGAATCATTCGATAAGTGGGGTAATATGTTAAA
+AAAGAGTGCCCTTCTCAAATTTCACATTTAAATTGGTTTGATTGTTACGTGCCCACAGTG
+TTAAATTAAGTGGATAAATATTATCGTGATCTAGTTCATTATTTTAAACTTTATCTTACG
+TATAAAATATTAAAGCTCGATATCTCTCTTAAAATATTTAATTTCATGTTAGTATTTATC
+TGACTGAAATGTCTCAGCCAATCTCTTAGTCAATGTTTTAGTTAAATTTATTAGTCCACA
+AATCAAAGCTAACAAAAATACGTTCGCCAACTCCTCATTTAAGTTTTGTCATACCGACAT
+CATGTTTTTATATAAATTTCTTGCTCGATAAATGAATATCATATTTAGTGAACGAATTTA
+TCTTCCCAAACACTTCATGTTCATGTTAACTTTTTCTGACAGCTAAGAAACTAGAACCTT
+TACCTGACATTGAGATGTTGGCTCACCTTGGAAGTGATTGACGTGTACCTAGCGAGTTGC
+AAGGAAATCAGGAACCATAGAAAATATTTAAAGTCTGCCTGAGTATCTGCACCCTGAGAA
+GCCCGATCGAAATACTTCTATTCAGAAGTCCAGCACCTCTTCTCGGTTAACTCGTGCGGT
+TAAAGCCTCTTCCTTCCACTCAATTATATAAAGCTGCAGCTGAGGAGAGGGAATAAATAA
+AACACGGAATCTCTTGAAATATTGAAAAAGTTTTACCCAAACGGAGATCAAGAACGAGCT
+GCCTGAAGGGAGGTGGGAGGTAAACCGAATGAGAATCCATTTGGCGGTGCACTTCGAGCA
+GAAGTTGAGTCCGAATCGGACAGTGCTAAGTTCCCACCCAGCTAACCGAAAGCTGGGCGA
+AATACGGCGGGAAGTAAACTGAATCCGAGGTGGGCTTAAGATGGGCGTGGCAATCGGTTT
+TCCGGCAGGGGTGGCCACATCTCCATTGCGGTAAGCCCTGCCAAGCACTCGCATATTTGC
+TGAACACTCAAAACGCGCTCTTACGGCGACAGAAGCCACCTCTCAAGGACGCCGGGATAA
+ATGTATGCAAAAGGAAGTCAATCGGCGGAAAACTGTAGTTGCCTCTCCACCCAAACCCAC
+TGCCATGTACATATATGTGTGTGGAGGAGAGCTCTTATTACACGTGCAAACCGAAATCAA
+CGAAATCCAAACACATTGGCAGAGCCTAAGTGTTTTCACCGAGGCGTCTGCAAATATGGA
+TCCAGGATACGGGGAAGATACACCAGGGTCCTCCACAAATGACAATGAGGGAGCTTGCAG
+AGCTTAAGCTCTTGTTTCTGTATCTTAAAGGAATTTAAATTAAGTTGTTGAAGAACTCTA
+AGTAAGTTAGGTTCATTTTAAATGTTACTCAGTTCTACAAAGGCAGGAAAAGTGAATAAC
+GAAATAAGCATATAAATTCGGTCATTCATTAAATTGGGATAGAGTCATACACAAAACGTT
+TTTCCCATTTCTTTTAGTTTCCAAATTTTAGTACAATTACTTTGCAGTCTTAACGAATAT
+TACATAAAATGTTACATTTTCAAAGTAGAAAATAAATCTCTCAAAGTTATGCAAGGTATA
+AAATGGCAAAGAAAGTTGACACTTCTTTTGGCACTATCCCCTTTTCAAATGTTTAAATAT
+TAAAAGCTGTCTTTTATAGATTCCTTTGCAGCATTTTGGAGTGCCAGGGCGCCTCGTTGG
+AGTTCCTGTCAAGTAATCCCCGTTAGCCAGTGTAACAAAGGAGGAACCCCAGTCAAAAGG
+AGTTGGCACTATCTGCCTCCTTCCCCCAACTTGGGTGCGTGTGTGAGTGGGTCCAGTGTG
+TGTGTGGAGGAACTTCCGCTGTGTACTGGTGTTGGTGATGATGGCGTTGCCATCGCTTCC
+GGTGCGCTGGCTTAGATAATGCCCCAGCTAAGCAGTGGGCACAGCACGTGACGGGGGGTC
+CAGAAAGGCAATGGGTGGGGGTACGGCTATAAGAATGCGGATGGGACCCAGATGCCCGAG
+ACTCTGCGCTCAGATTCCTTGATATCCCTCATCGCAGCTCCACGGGCGATGGCGTTTATT
+AAGCGCATATAATCGTAAAAAAATTAGCTTGTATGAAATACGCACTGAGGCAGCGGCAGA
+ATCCTGCGTTTAGCTGGTGGGGTGGAACGTGACAGAGGACGAGGGACTGGAGCGGTGTGC
+TTAAAATGCAAATGACATCAAGTGTAGTGCCTTTCCAGGGAGTCGAGTCATCGCTTTGGC
+TCCAGCCACGTTGTCCTTTCCCAAGGATTCACTTAAGCGTTTTGATTAAACGACCTGTTT
+TGCTTTATTCTCGTCATAATTTGAATTAATGTCGGAGCTTAGGGCGCAAATTGTTTTGTT
+TAGCTAGTTTTGAGCGGATTAGGATGGAAGACCGAGTTTATAATTAAGAAAAGGGTGGCA
+ATCCATTAAAGTCTTATTGCGGAAGGTACGCGGCGGTTCCTATTAGTGGTTGGTTCCTAT
+TGTTCATTTGTAAAAATTAAAAGCTTTAGGATTATAAAGAAGGGTAGTCTTTTTTGAAGA
+ATTTATGGCATGGACTTGGATTTTTAGTTACCACAATTTTAATTGGTAGGCCGTAATGCA
+AAGTTCTTCAGTTTTATCTATGTATGACCATTTACAAAAATTGTAAAACAGTAGTCAGCA
+TTGTAAAATCCCGAATCAAACACGCTGAGCTCAGTGAAAACATTGATTTGACATTATACC
+CAGCACGGAGCTTACTTTTCCGTTTTCTGTGAACCGACATGAGGTAAATGTTCCCATTCT
+TGACACAGTTTGTGTACACCCACCGAAATCAATATCCGCCTAGAGCTGCCATTCGCTGCC
+ATCGAGTGTCACACATTTCATTTCCGCCTGTCTACAGGACACGCCCACATATGCAGATTC
+ACACGTCCTTCCTGTCCCCTCATCTGCGGGATACATTCTTTATTCGCCAAATGTCGCAGG
+AGGTTGCCCCAAATACATAGTTGGTTGACAGAGGATATAGTTGCCACTCCTTTGGCATAT
+TTCTTCTAGGTCCTTCGAGGTCTCTTCCTGTCGGTCCGTCCTTTTATTATTCTTTGCAGG
+CAACTTTGGGGCTGGTTTAAAAGTGAAAAGCTGAGGCTCGAAGCCCGCCATTAAAATGGG
+TAAAACTTGTAATTGATTGTCTACTGCTAACGCTTAATTCAGTGCAATCGGAGGGGAGGG
+GACGGCGCAACTGTGGCAAGTAGCTCTGCAAACAATAAATAAAACAATAAAATTTTAGTG
+GCACGTAGCATAAAAAGCTCTGGGCGCAAACAAAGACGGCGGAGGAAGTGGGCCTTAAAA
+CAAAGGCCATGAAATGCTCGGAAGTCGAACTCGGACCCGGAAAAGTCGGGAAACTCGAGG
+CGAACAGGTTGCGTGAGCCTGTCAGCATAAGCAGCGCTGGAAAAGGCTCGAGTGGGTGGG
+CAGCTAAAAGCATTACAATACACACAGCTGAAAAACACACAATAACTGGGCTACAATTGT
+CTGGCTTTGATTCCGGGACCGGGGACGGGCTTGAGCCTTGGAGTGTTGCCAAAAGTGGAA
+AGTTTTCAATTGCCAGGATTTGTGTCTCCGGGCCACGCCCACACACCTCACCCACCTCAA
+CCTCGGCCTCCGGCACTTGTTTACGTACTTCGTCGCTCGCCGAGAGCGTATCAATCAACT
+GGGCCACGGGGCGTATGAACAGGGTCTTGGGGCCGGAGACAAAGGCATCCCTCACCACTC
+CGAGCGCCATAACATGCCCGACCAAATGTGTTTGTCCCAAATTAAATTTACTTCGGCCTC
+CGGAATCTAATCAAAGTGCTAGGGCTGCCACCGTGAACTAGGGGTTCGATTGGAAAATAA
+GTTTCCGATTTACGAGGGATATGCAAATTTGCAAGTGGTTTAAGCAAGGCCGATTTCTTG
+CAGCCCTTTCAAGGATATCATTTATTAATAATATTTTTAAAATTTGTACATGAAAGTCTG
+AATTTTTAAACACGTTTTATGTTAGGACCTTATACATCTTATATAAAGAACGTTATATTT
+CCTTAACTATTTCAAGTAAGAAAAGGGAGTTTCAATATCCATGAATACCTAACATTGAAC
+CAAAAACCCTATAAACATCGAACTTTTTGAAAGTATATTCTTAACTAACCATTTTCTTAG
+CTTCAGATGTTAAACCCAAATACATCCGTGCTATCTCGTTTAAACAAACTTAGTTAGGAA
+CATCTTGTACTTTTGTTTCTTCTCACCTCATATGAATAGTTTAAGTAAATTCAAATGTAT
+TCTAGATGAGGGTGTTTTTAAAGCATGATTTATGTAACTATAGGGTATCAGTTTCTCGAC
+TCATCTGGGTCCCGAAATCGCTTCTCGGAGTGACTCACGATGGGCCCTGGTTTCTCAGCG
+GGTTGCCTGTGAGGGCGTCGTTTAAGCCGTGCCCTTGGCGGCCGCTCTCAATCATATCTG
+ATCAAATCAAATCAGCCGCCTCGTCTTGCTCCCGGCGTCCTTATAAGGATACAATACATA
+CGTCCCCAGTTAGGTGTGGGCGTCGTCTCGATGACGCATGATTTTTCGGTAGGTGACTGG
+GATGATGTGAAGATGTGGCGAAGGATGTGGGCGTTGGGCGGATGCTGAAGCTGGTGCTGA
+TTCCGATGAAGATGTGGGCTATAAATACGCCAACGATGGCTGTCTGGCATTCTTAGCACC
+CTGTCTCCACGAATTTCGCTCAGGGCATATTTTGCGGTTATTAAATTTATTAAGTTTCCT
+GCTCGGCGGGGGCGCTGAGTGGACTGATGATGGATGATAGATGAAGCTGTTGGCAGATGT
+CTAACTAATTAAGAGGAGGCGCAAAATGTTGAGGGTGCTGCGCCTAAAAGCCCCAGAAAC
+GACTTCTGGGCAATTTAAAAGAACTTTAACGAGCATTCAAAACCTAAAAGTGGCGTTAAT
+CAAGCCACAATCTCGTTTTTCGAAACTTTTCTAATTATAAATCTGTTCTGGTGTAATTTA
+CAAGCGGTCCACCCGCAAACGAAATTCTCGGAACGAAAAATACAATTGCCCAACATTTTT
+CACGCCCCACTTAATGTTTTTCTTTTTGTGTGCTTTTTTCCGTTTTCTGAAAAATAGGCA
+GTAAGAAATGCGCCCTCGGCGAAAACGAGAGCCAGAAATCAACTTCCGTTGTGCAGCGGA
+AGTGAAATGTGAAATTTGAAATTTATTATTGGCAATGCAAAGAGACCCGGAGGAGAAACA
+AGGAAAAACGGAAGGGGGTGGGGAAGGGCCAAACAATATTTATGTTATTAAACTGAAATC
+AATGTGCAATATCCGCTGGCGACTCAATAAATTTAGTTAGCCGAATTCAGGCTGATTGGC
+ACGAAATCATTTTGGGGCTCGCAAAGCGATTTTTCGCCGTCACTTTTCCAATTTATTTCA
+CTGCCACTGATTTGTGTTCATTTCAATGTAGCTGCCAGATTGTTTGGGAAAGCCATTTAA
+GTTATAATCTTGCTTTTTAATCGAATCGAAATTAATGTTCCAAAGATACATGGTTTAAAA
+TAGATGCATTCAATTACTTTTATCCTTTAATGTACTTATGAAAACATAAACATTTTCTTC
+TCTTTCAGCCTGTTTTATGGAATCATTTAGCAATAATTGCAACTAATTTCGAAGCTTGCT
+GCCTGGCTTTGAGTTTGCTTCAACCCTCGACTTTTACTTCTATCCCCCCATTCCGCTAAA
+TCAGTCAAGCTGGCGTCGTTCAAGCAGAAAAATAACAATAATACTATAAGCAATTACAAT
+AACAATATAATGTGGAGTAGTACTATATCGCCAACCAACTCTAAGAAACTACTGATCGGA
+AGCACACGAAGCGTTGATTATGTCGGTGATAGTGCGAGGACCGCAGCAGGCAATATCAAA
+ACAGGAGCAGCAGCATCAGCAGCAGCAGGAGCCAAAGGATCAAAAGCCAAAGCCACCGCC
+ATCGCAGCCACAGCCGCAGCAGCAGCGAACACAACCAAGATCTCAATTGAAATGGAGCTT
+CATATACAGAATAAGTGCATTTCGGCATAGCGCATCACTCTGGAGGGTGGTGCGGAGCCG
+CCATGGCTGCAGGGCCCCCTTAAAGCCGCATTTTTGGGGGCTACTGGGGTCGGCAAAACA
+AGCATACTACAGGTGAGTCAAAATGTATTGTACGATTAAGGGGGCGAAAAAAGAATGTGC
+CCTCCTGCCGATTATATAACATAGCTCCAAAGTTTATTCTATCAAACGTCCAATCAGCAT
+GTATTTCTATGGTTCGGTTTTATCTCGGATTTTAAAGGCCTTCAAAGCATCGTCAAAAAT
+TGAGCAACTCTGCTGAAATACAAAGCAAAAATTTAAACAGGTCCTCCGGTACATTACATG
+ATAATACTTATAATTCCTCGAAAGCCAAATCATCAAAAAAGGGAATTTTGTAAAATTCCT
+GGGGTTGTTTCTCAGACTACACATGAAAGGTGACTTCTTATCTCTGCATTCCATGGGGTA
+GACATTCTTCAAATTTAGATCTGTTACCTGGCTGATAAGGTGACTCAGAGCACCCTAATT
+CAAGGCCTCGGTGGCGCAGTTGGCAGCGCGTAAGTCTCATAATCTTAAGGTCGTGAGTTC
+GAGCCTCACCCGGGGCACAATTTTTTGTTGGTCCATATATTTTTTGTAAAAAAATTAATT
+AAAGCAAAAAAGTTTTTTTTTTATAAGGTTTTTAGCCATTTTACAAATCAATTTAGAATA
+AGGGTTAGTAAACTTAACCAAAAAACAAGAAAAGAAGCCAGCTTCAGCAAACCCAAGTTA
+AGATACACTTGCAGGTAATTTCTATGTGAGAAATTTTTGAATAGAGCTTTCCGATTTTTT
+AAAAACTAAATAATAATCACAGAGATATATAGATAAGGCTACATTTAAATTTACTAGCGC
+ATTGTATGTTTTGCCTAATATGAAGTATAACGATTTTTTGTATTATTTTGACAAATTTTT
+TCCATCTTTTTAATGGCATCTATAAGATAAATTGTTAAATTTTATTCGTAGTTCTGAAAT
+AATAAATTAAACTATATACCGGCGCACAAGTGAATATGATCAAATATAACGAAGCTACAA
+TTATTTTCCTGTTGTTTTCCCAGTAACTATCAGATCGTTTCTATGACAGATATATGATCC
+TATTTTTTAAAATTGTAATTCGAATTTCTAAAATGTTAAACAATGATTAATTAATCCTAA
+GAGTAGAAGAAGATATTTAAAAAAAACCAAATCTTTAATTAAGTAAATATACTTTCATTA
+TTTGTATACCCTGGCTTTTTCTATCATTCATATGAAAGCTATAGGATATACTTGGCTGAC
+TAAAATCATTATATCCTCTGCAAGAGTATAATAAAAGTTTTTAACTGTTGTCTACAAATT
+ATATGCAAGTTGGAACATTTGGAAAATATCTTAAGCTATAATTACTTGTGTCTTCAAAGT
+GCGAAAAAACCAGACAAAGGCTAAGAAAGTTACATACGAATATTAGTAAGCCTTTCTATA
+CAAAAGGCCTTTCAATTGATAGGCGAAACCAACAATCAATTTGAGCCAAACCTAATTAAA
+ACACCCGGCAAAATAAATTTGTGTAAATTTCAAAAGATCAAAGTGCATCTACCGGACATC
+GCATCTAATTGATGTAATTAATACGGAATCACCAATGATAATTTAAATGTTTGTTAAGTG
+CGTTTCAGCTTTGTAATGCAATTAAAGTTAATGACTGTAATCATCGTTAGTCCCATCCGA
+TCCAATCGTCAGCAGCATAGAAAGGGTCCTCGCTGCCCAGTCGCATTAATTAATTTTTCA
+ATAATAAATTGCATTTTCAATTAACACAATTCCTGATTAAAAGTTTCGCCAATACACGCA
+AAACGGTGAATCCGGGGATGATGGAGCGCTGCAGAGATGCAAACGCTGCACTTTTCATGC
+CCCAACTTGGCTTTAAATTATTAATGGGCAGCGGGCGACCCCGATGAAAGCTGAAAAGTT
+TAGCGGCAAACTTTTTAATAGACCAGTCCCATGGCAGCTGGCTCTCATCGCCGATGTTTA
+GCGCCCCATCCACCTAAAGGACCCTCCACCTCCATCTCCACCCGGGACCCACATCCTCCA
+GGTCCTTCACACTCCTTCCCGGGACCTGCTAATTGCATTTGTGTGCGTGTGGGAGCCTCG
+TTAATTTGATTTGCGCTTCGCATCGCATCGTATCTTTTGTGGTTTATCTTTTGTAATTAG
+ACAATGGCAAGGCACAGAGCTAGAATGCCTCATATGTGTTTAGCCAGGTCCCTGCCCTTG
+CGAGTGGGTATATCCACCATGTGGGTCAGTGTGAAACGATGGCCTTTTGACGTTTCCTGG
+CTGAGTGGATTTATTGTGCGAGAAAGTAAAAACTACATATATGGTCAGCACATATCTCGC
+ACAGTTGAAAGACATACGAGTACATGTCCAACAGTGGATTAACCCATATTTGACAGTGGC
+TTATACGTACTACTCCATATATAAGTTTGTCGATTTCTAGCGTTCAGTGTAATAAAAGAG
+TGAAAATCCTCTATTTATATGTTTTGACTTAAACACATGTCGACAAAATCACAATTTAAA
+TGTAAGCAAATAGTTATGAGTCATCATTTTATTGGAGAGTCGAAATATGATTACCATTTG
+AAATTGGATTGTTGCTAATTGAAAGTTATCACCTTCTATAAAGTCAATACAAAATCGTTA
+TTAAAAAAATTTAATTAACCATCTGCAGAAAAATCATTGGTTCTATCGATTCTTCTTTGA
+ATCAATTGGAACACCAAACGAGTAATTAAAAAATGCATTTGTTTTTATTAAAAAGTTATT
+TTAAAAGGTTGTTAAAAGCAAACAAAATTGAAGAATTTAATTAAATTGCACCGATAAACA
+ATACAGTGTTTCATTTAAGTTCAGACAAAGGTAAAAAATTCTTTTCAGTATACCTTAGTA
+AGAGAATGTTATTTTCTTTAAAAAAATAAAAAGGAAATTATGGAAATAAAATCAATAAAA
+TAAGCTTTATGAAAGAAAATTGTTTTAAAATAGCAGATACCGGATGTCCTTAGACCTCGT
+ACTGTAAATAAGAAGCAAACATTAAATCTGAAAGATTATAGCTCGTAAAGAAACTTCTTT
+TTTCGCCGAACCATAGGAAATTATCCTCAAAAAGGGTATTAGCTTCGTCGAGGTAGACCC
+TCTGCCGGCAACCACGCCCCCGCCTTTCACCTCTCGCTCGGCAAATTCAATTAACTGCAG
+TTGGCAGTTGCGAGTTGGCCGCTTTGCCATTTGCTTTCCCGCTGCGCTCTCCATTATTTC
+CATACGTGTGTTTGTGTGAGCTCTACAGCTGCGTTTAATTTCCACGAGCGCGAGTGTGTG
+TGTCAATGGCTTTTAGGACCGCTTTCCCATGAACCCCCAGCCCGAACCCCCGCCCTTCTC
+CGAACTCAGCTGTCCAACATCCGGCATTATCCTTTCTCCGTTCCCGTTGGGCGCCTTTTA
+TTGGATGTAATGCGAGATTTGTGCATTTTTATGGCATTTTAAGCACTGCAAAATCAATTA
+CGTCCTGTTTAATGGCTGTTTGCGGTCAAGCTGGCAAGGGAACCCGTTTACGTGGTGGGA
+AGCTGAGCACCCAACATCAAACATTTTATTGCAGGGTAAATGTAACAGGCGTGTAAACGA
+AAAAATGCGAGTCCAAATCACATAATTGTTATAACAGTATAAAATAAATTGGGGCACTCG
+GCCTTGTCTTTTTTTCCAGCTGAAGAAACAAACATTTTTAAACGAAAACATCTTCGCCTT
+TTAATAAAAAGCAATTATAACTCGGCCATGACCCCAAGTTATTTATGTTTTTCCAACGAA
+TTGGAAAAACGAAAACTTTGGCTTAAGCTGAAACCACGAATTGTTTTTTTCTATCGTGTT
+TCGTCGACCTCTACAGCTCACTTTATAATGTTAAAACATTGTTTTTCTGAATATGGGTTC
+CTAAATAATTGATTTAAAAATTATAAGCAATACAATTGGTTAGGTCCAACATCAATATCT
+AACAGACATATTTAGTTTAAAAGTGTTTTAGCTGTCAAATAATTTTAGTTTAAATGCAAT
+AATTTTAAGGCCTACGATAACCTATATAAGGTCATACGAAACCTAATAAGTAGCGCAAAA
+AGTCCAAAAATTAAAGTTTTGAACTTTTAGTCCATTTTTAGTTTATTTTGTCATGCATGA
+CCTAACATTCTGTTTATCATTTTTCTGTGTGAGAAAGCTATAATTTTTTTAAAAATCAGT
+TTTAGTGAATAAAATATTTGGAAAATCTATAAGTAAGTTACTTATTTAAAAAAAAAAATG
+TTGTTTTTATTTTTTAATTAGTTAATAACAACTTCACTAACAGTTTCACCTAATGCTGTT
+TTATTACATCTTTAGTTGCCTTTAACAATATCCAATCAAAAGTTGGTCGCCATAGAGCTC
+CGCTGATTTAAGGGAGGTATTTGGCTTTTTCGCCCACTGTGCGTTCGCATGAACGCAGAG
+ATTTTGGAAACTATAAAAGCTAGGCAGGAAGATTCTAGAGGTTCTTGCGAGGGCAAGTTT
+ATTTTAGCAGGGTGCCACGCCTACGCGCCCGAATAGCTCACACATTTTTTAAGATTATAG
+TAAATGGGATTTTGTTTTGATAATAAATATCCATAAAAGAGTTATAAAGAAATAAAGAAA
+TAAACGCTTGGGAACAGTCGCTTTGATGCTAGCATATCTCCATCTCCCTCAGACTCCCTT
+AGCTGAGTAAGGGGTGACGGAGTAAAAGTCAAATGACAGTAAAAGGAAGTGAAGTTACAC
+ATTAAACAGGACTTTGGCACTCATTCTTAACTTAACTTTAATCCATGTATCCGCTCGTTT
+AAATGGACGCCAACATTTTCGAGTAAACTGCGCTAATTCCAGCAGATAAACGCGGGAAAT
+AAAACGCAGTGCATCATACCAATAAAAAGTGCGCCATGAATATCTATTTGGGTAAATTTG
+GAAAAGCTGCTCGGATCCCCGGCGTGCTTATTTATGTGGCAGATAATGTGCCGCACTTTA
+TGGGGCAGCAGGAGCATAAAGAGGCGCAAAGCCGGCCACGACAACGGCAACGACCGGAGC
+AGCAAGGACACGGAGCTGGATGCTGGGGGTCGGAAAATGGAAACAGGACCTGGCAGACCA
+CGGAGCAGACCATCAATGTCATTTCTTATTCAATTACCAGTTCAATAAAAATAAAACTCA
+ATGATATGCGGCGCTGGGACATAAAAGCGATGCGATGTGAATCGATGTCATGCCAAGCGC
+CGCGATCTGACCCCTTTGCCACGCCCCCACGCGACCCCCGCCTTCCTTTTCCCCGGGGAA
+AGTAACTGTGCAGTGTGTAATTTAAAAAAGTCTGCTCCAAAGTCGTTCCTCCTTTTAGGC
+CAAGCAGCATTTTCGCTCTTCCCAACGCGGCCACTTCCGCTTCCGGTGGTTGGCCTGCTT
+GGATCCTTTTTGGTGCCCCCTAATTGAATATAGTGTGCATAAATTGCATCTGATTTCATT
+GCAGTGACAACAATGGGTATGCTGATTGGCAGAATAGAATTTGCATTTTTATGAGAAGAG
+CGGGAGAAGTCAGGCCCCAAATGATTTTCACTTGACTTTGTTATTAGCGCATCTCATCAC
+ACATACACACTGAGGAAATCATTCTTAAGTTGTATCATATTGAAAGCTTTTAGAGAACTT
+AGGAGGATAAGAACTACCAATCTATTAAACTCATTTATTTAATGTGTGAGAGTTTCCAGG
+CTATAATCTTAAAGAACTTATTTACTCTAAATATATACCGGACTTTTCTTTTGAGATTAG
+AGTACTTTTTTTCTCTGTGTGTATACAATCAGGAAAATCGTGAATTGGCAATCCGTTCGA
+TGGCTTCTTGGTGCGACAAGGCATCACTTTAAAGTGCAATCAGGCGTTAAATATCCTTTG
+AGCCTGTCACTCACTCAGCTCATGCATTGAGACCCACAGCGAGTCCCACATCCAGCCGGC
+CACATCCAAAATCTTCCGCAAGTCGCCCCCGTTTCCCCTCTTTCATTACCATTTATCTCT
+TTTCAAATTGTATTTTATATCTCCATCGGCCTTGGCTTTATTTTTAGGATGCTTCGGCAA
+CTCCGTCTCCCTGATCTCGGACCCCAGACTAAATCCCAGTAAGAGAGTGAGGAGACTTGG
+CTGAAAAGGCTGCGGGTTAATGGGGTCATTTCGACCACGGCGGGGTGATATCCAAAAAAG
+TCCAGCGTGTGCGTTATGAGCTTTGGATTAGAGTTATGGCTCGTTACTGAAGCTTAAAAG
+AGCTAGTGAAGCGCATCATTAGGGATCTGAAATTTATTAATAAATTAAAGCGAAAGTTGA
+GGATTACGTGGACTTGATTGAAAAGTGATTAGAGTTTATTGAAAAAATGTAATGCTGCTT
+GAAATAGCTTAAAGTGAAGGTGACACAAAGCAATAATTGGGGTAACCGCCATTTTGACTT
+CAAAATACGAAAGAACTTATTGAAACCAGTTGCTCGTTTGGATACTAAATGAGGTTTAGA
+TTAGCTAAAATAATTCCAGTTCCCATACTTTTTTATGATTTTTAATAAATATTATTATAT
+TATTTGACTTAAAAGGTGCTTTTTATATTTTTTATCTAAAAGTCTT
+>ENA|CAKG01034665|CAKG01034665.1 Drosophila suzukii WGS project CAGK00000000 data, contig drspszk_2144681
+AACAATTTATAGACAAATGAGTTATAACAGATCTTCAGAACTATGCCTTGCCTAAATCAT
+TCAGGCCTGCTTTTGTGGACCAGATCTGACTTCAAAGAGCCACTGTTCCCCATCTAGTCT
+CCCTAGGAGGAACCTTAATTGAGTTCATACGGCGCATTTTTGATTGTCAGCGTTGTCATG
+GCCGGCGGACGAGTCGCCGGTGGACGGAATGGAGTACATCGCGGCACAGGACAGAATCCC
+AGCGACAATGGAGCACTCGAGGAGCTGGCTTCGTTATCACACAGAACATGGCAGCACATG
+GGAATTGCTGCCTCCTGGTGCCGACTGCACTCTGGATGGGAAGGCAGGGACAATGGATGG
+GCGCGGAGCTTTGGGGGCAGGAACTATGGACTCGGACAAGAGCCGGCGAGGCAGAAGCTG
+AAGCTGAAGCTGAAGCACAGTCTGCATCAGAATCAGAAACAGAATCCCCGACAAGAGCAA
+TCCATCCACAAAGGCAAAGGCATTTCATGCTCATCAAATGCGTTGACATTGAACAATTGC
+GCGTAATGTTGTCGTACACTTGACAAGCGCGCAAATTGTAGTGCTACCTGTACTTGAGCC
+GCAATTTTGCTCAAAGCGAAAGCTGAACCACCGGCATCGGCTGTCCCAAAATCGATCTGC
+GTTTGGTCTAGCCGAAAAGCTACTACCAACTACTTTTGATGGAAATTGGCAGAGTTGTCT
+GTCTGTCTGATTGCTGCGACGTTTGTCGTTTGCCGTTTGCTGTTGTGGCCTTAATGAAGC
+GGACGACATTCACCGGACAAGCTCCGCTCTCTGCCACATCAACATCCACATCCATTTCCA
+GTTTCCACTTCGGAGGCACTCGCCAAATATGCGGCGACAAGTCCTCGCTAAATGCTATCC
+AGATTAATAAGTCCCAGCCGTGTGGGTGATGTGAGCCACATGTGGAGCGAGATACGATAG
+TAAAAGTCAAAAGTCGCCCCGGGCCAGACGTTCTAGGCGATATGTCTGACCACACTTGAA
+TAAAATATATCCGCAGCCTAATCTAGCTAAAATGTAGATAAAAGGGTTAAACATTAAAAA
+AAAATCAGCCTTTTTTAAGGGTTTAATGGGGTTTTGGGTCAAGAACGAGCACTTCTTTGT
+GTATTTTTATGTTTCTCATACACTGCTTTAAATATAAAAATTTGTTTTAAATATTAATCT
+TTGCTTGCGTAAAATCAATTTCCAGCTTTACAAAAATAAGAATAAGAATAATAATACATT
+TTTTAGTTATCGTATTCCTGGTTTCCAAGACGTAGTTTTAAGGAACCCTTCGTAACCCCT
+ATAAAAATAAAGCCTTATATATTTTATATCGATCATTGGCTGTGGTGGTAACACTTTGTA
+TATCACTTTTGTCAAAAAGTTCAAGCTATTCAAATTAATTGGGTTATTTCCCAACTGGAT
+ACTTCAAAGTTGGCTCTACTGATACAATGGATTACGAACGATTTCTCAGAGTGCATCACC
+CCCCACCTTTGGTTTTTGGGGCTACCAAATTTGGCCAAGGCAATATTTTGTTCGTTTGGC
+AGGCCGTTAGAGATTTGCAAAAGGTAAAACTGTAAAATGCATTTCGGCTTGCCTTAAATG
+GAGCGGGGAAAAGTCAGCAGAACGCACGATAACGAAAGAAAAGTGCAAACATTGTTGCAG
+AACCGCAACGAGTGTGCAAATTTGCCTTTCGATGCCGGCCAGAAATCCGAAGACTGGTGA
+AATGCATTCGAAGCTCGACTCCAAACAACAATGGGGCAACAATGGCAGAGTGGCAACGAG
+GAGGAAATCTGCCTCTGCCCGACCCGATAATCGCCTGGCACTCGAAGGCTGCTCCTATGA
+TTTTAAGTGGACGTTATACCGGAGTATTCGCCAATAATTGCAGTTGCAAATATGAGTTTT
+CCCATTCGCCATTTGCCCAGTGCCATTTTCATTTCCATTTCCCAGGCCTGCCCAGCTGCA
+AAGTTCTCGGCCGGCAATTGCCGTAATGAGCAATAAGTTCCTTCGTTATTTATTCAGTAA
+TTCCACACCTCGTATGCGTATAAAACAGTTCACAGTTCCGGGTCAGTCGACACTCCTAGT
+ATTTGCATTGGATTGGATCGCAAGATGACCGAGCTGCAGAATGAACGGAGAAAGGGAAAA
+TGGCATCGTTTGTGGATACCGTTTTTTGAAGGCTGGGCTGTTCTCAAGGATCCCAGTGCT
+CGTTCCCAACATATTGTCGCCTACTGGACTCGGGATCAAATTAGGTTGGATATAAATGGA
+ACCCTAGAAGTTTTTATAAAGGTTTCCTATATTATAGATCCATAGGTCTTTACACAAGCA
+CGGAGGAACGGCGTCTGTCCAACAATGTGGTCTGGCAGTCTTATATCTTGATCCAACTGG
+CGATTAGTATAGCCTCCCTTTTCTACGGTATCGTTGAGTCCATTGGTGATATCGTCAATC
+TGGGTCGAGATCTAGTCTTTACCATAACGGTTCGATAAAATAAAATGTTTATTATGCATC
+TTTCATTGATATAAACCACACCTCCTAGTGCCTATTTATATGCTTTAGATTGGCGTTCTT
+CGCTCAGTATGGTGATGACGTCGATATGGTAGTCAATGCTCTCGAGGATTTCCATCACAG
+GACAATAAAGGGCCCGGGAAGTAAGGAAGTGCAGTCCACCAAGCGTTTGCACTTCCTGTT
+GTTTATGGCTTTGCTCGTAACCTGGTTAACCTTTCTTATACTTTTCGTCTTCATAAAGAT
+ATCAACGCCCTTTTGGATGGAATCGCAGATATTGCCTTTTCACGTCGCCTGGCCCTTTCA
+CCTGCACGATCCAACGAAACACCCGATTGCCCATGCCATCATCTTTGTAAGTCAAAGCAC
+CACTATGCTGTACTTCCTAATTTGGCTGGGCCTTGTGGAGAACATGGGTGTGTCCATTTT
+CTTCGAGTTGACTTCCTCCCTAAGGGTGCTTTCTATCGAGCTGCGAAACCTCACGGCCTT
+TTGCCAAGGCGATGAGAATCTGCTGACTACAGAGCTGCATCGACTAACCAAGTTTCACCA
+GCAAATCATCCTGTAAGATCTTGTTGTAACTAAAAATACTAAAAATCGTATGTTTCTATC
+TGCTAACAGTCTTTCAGAACATTGCAACGATATATTTAATAAAGCATTTATAATGCAAAT
+GCTGGTAAACTTCGTTCTCGTCTCATTGTCACTTTTCGAAGTACTGGCAGCCCGGAAGGA
+TCCCCAAGTGGCAGTCGAGTATCTGGTTGTAATGCTGATGACTCTGGGTCACCTCTCTTT
+CTGGTCGAAATTCGGAGATATGTTTTCCGAAGAATCGGAACAGGTGGCCTTTGCTGCCTA
+CGAGGCTTATGACCCGACTGTTGGATCTAAAAGAATACATCGGCACTTTATTTTCTTTAT
+TCAGAGAGCCCAACAGCCGCTTGCGATGAGTGCAAGTCCTTTTCCACCTTTTAACTTGGA
+GAATTACATGTTTGTAGGTACATACCGAAAAGGCTCTTGAAAAGTTTTTGAAAATTTTAT
+TTTGCAGATTCTAAAGCAATGCTATTCAATCCTAACAGTGTTAACCAACACATTGGACTA
+GATCTACATATTTTTTTTTAGTAAAAGGCAATCACATGCAGAAACTTACATAATTGTAAA
+ACACTTTGCTTGACAAATAAAAGCATTAGGTTACTTGTCGCTTTATTTCATCCTTCTCAA
+CTCTGTAAATGAAATCAACCATTTTGGGCCACTCGAAGAAAGTTCTGCAAAGAGCCTGCA
+TTTTATGCATGCGACCCCAAAAGGTCGCCACTGCATTTACTGCAACTTCGAAGAGTGGTT
+CAAGCCGTCTGAAGATTGGGCTCATAAATTGCAATTGTGTGTGGAGCCCGAACTGGAAGC
+TGGTTTTCCTTCAGACCGATGCTTGTTGGCTGCCGGTTGCTGGCGTTTGACTGCTCCGTC
+ATTAGCTTGATTGAATCTTATTGTTGGCAATTAACCTTCGCTGCGATGGGGCCAAGAGTC
+TGAGGGTCTGTGGGGCTACGATCCTGACATTCTGCGGCATGGACGAGGCGAATAACTTCA
+TTTGGCACGACTACATGGCATAACATGTCATCTTCCTGGGCCACACTAATTGCCAACGAC
+AAGCAGCCGCAATTAATTAGCAAACGCCAACGTATTAGGCCAATAACCAATAT
+>ENA|CAKG01060972|CAKG01060972.1 Drosophila suzukii WGS project CAGK00000000 data, contig drspszk_8368
+AAAGATATTAAATCAATTAAAACAATTTCAATATGAGGTTCTAAAAAATATAAATAACAA
+ACTTCAAATTGTGATTAAAATTCAATTAATTTCCACTTTATTAAAAACCCTTCCAGAGCT
+TGAAATCGTTGTAAAAATATTTTTTTTTGAAAACCAAATTTTTTAGCGAATCAAGAATAC
+TTCCTTTTTTATTCATTATTTTTGGAAGTCCCCAAAAAAAATTCCCATTACCAAAAAAAC
+AGCCCGATGAATATAGCAACTCATGCCGACTTTCTTGAGGGGCTTCCGCTGGGGGATGAG
+GCGGTCTTTCGAGTGGGCGGATGGGACGGTGGAGCACCTTATCCATAAGCAATGATGAAT
+AACGGTGCTTACGCTTCGGACATTTGATTAATGATGCGTTTACCGACCTCGCCGCCCCCT
+CTCACCACCCCATCATCCATCTTGGCCTTCGCCTTGCGCCCGCGCACTCAGTTTTCAACG
+CCATTTTTTGTGGATCTTGGTGGGTTTTTACTTTTTTGTACCGAAGTACACTATTTCGGG
+TGCGTTTTAGCGGTGCGCGGGCTTTTTGTTCTTTATGCCCGGACATAACTTTATTTTATT
+AGCACTACGTGGCAATCTGCTGGATTTGCGCGGCATTAAAAGACAATTTTTACAACTTAC
+CAGCGATGCTTTTTCATACTTTTCCCTCATTTGCATCGCCTGCGTTTTTCTTTTCTCCTG
+CCACGTCTTCTTTCTTTTTTTTTGGTTTTACTATTTTTCATGGTCTGTGGCCTGGCAGAC
+ATCATTTTTTGTGGGCCCATAAAGTGCGGGACTGTTTATTAAATTCTTTTGCGGCAAGTT
+CATTAGACAAAGAGCAAAAATTAATCAGCTTTCTTCCCCGCCCAAATTCATTTCAGCAGC
+ATAAGAACATAGTAAATGGACTTTGAAAGTTGCACCGCGGTTTTCCTATTGAGATGAATC
+TCTTTTCACACCGAAAGTCTGGGGATGGATTGGGATTTTCGCAGCATGAAGAGCAGAATT
+CTAGGAAAAGGTGTTCATTAGTAGTTAAACCAAGAAAAATCTTTTGTGGATTACAATATT
+TTTTTATTAAAGTGTGGTTTCTACAATACAATAGATAAAATGTGCACGATATTTTATGTT
+ATAATAAGCTCCTTAGTTATCCTTTCCCAAGTAGTTCATTAACATCATGCTGAAACTATA
+GATTCCCTTGGTCAACTGGAGAGCTGTATTCATTGACAGTGGAGCCATATCTGCGGCGGT
+GAGGCAAACCTCTTTCTGGGCTTTGGCTATCATCAGAATAATGAGCTTCTCCTCTTTTAC
+AGGCAGCTCATACCACAAACAGTTGGTGTAGATCACACTGAGAAATTCCTCATTCTAAAA
+AGCATGTATTAATAACTGTATCTTGAAAAAAAAAATGATTAAGTTACAGAATTTTCCACC
+AAAGTGCCGAGTCCGCAGAAAGTGTAGAGGGTTATGGCGGCGTATATTAGATAAAGAGGA
+GCTGCGGGCCAGGCTTTAATAAATATGCAAGATATGGTACACAGAAGTCCTACGCAAGTT
+GTGGAAAGCTGAACAAATAACACGATACTATAGATCTTCTTGGTGGTCTGAAGAATGCTG
+GAAAATAATAAAAAGTAATGATAAGAAATTTAAAGAAAACCTCTAATCACCAATATTTTT
+TTACCTAGAATACAACTGATGCCATGTCAAGAGGTCACAGAGCATGGCCCTCATCCTAGG
+GAACTCATTCCTTTTGACAACCACCTCGTTGAATTCCTCCAGCTTCAAAGAGAATATGTT
+CTTAATTAAAGGCACATGGGTGACGAAAAGAAAGAAGTACATATCTCCGCCATAATTGCC
+CAAACCACCGAAAACAATAAATCCCACATGGATAGCAGTGAGCACCAGATGACCTCTATC
+GGTGGTGTGATCAAGTAGTGGCATCATGAACTGCATGACCAAAACCTTCTCGTGCAGAAC
+CACCAAATAGTAGATTGGAAAACCGACAATGAGACCCAGGAGGATAATGTAACCGATCAT
+AAAGCCGATGATCAATTGCCAGGTTATACGGATTCTGCTTTCCAGGCATTTGGCATATTC
+ACCACCCTTGGGACCGTATTCACTGGGGGCAGAACAGAACATACATCTTGAAATTAAAAT
+ATTTCTGGGAAAATGCTACTCCTACCTGTAGATATTCTCGTAAGTGTTTTGAATTTCTCG
+CATCTCAGAAGCCATATTGGCGGTGACCAATAGCTTAGTTAATCCTTGGAATCCCGACCC
+TACCATAGCAAATGCCTGAAGGATCACTGTTAGATCTCCATTGATAACCACGCCTACGTA
+TATGGTATATATTGTGCAGGCAAAAAAGAAGAAAATGGCGACAATTACAGAGTAGGTGAG
+CCACCACATTCGAAAATTGGGATCTGCAACATCATTTCCGCAGAATCCCACGCAAAAACG
+TATCATCCGAATGACCTTGCGATACCGCTCGACAGGCTCTATTTTTGCCATTTTCACTGC
+CAACTCTTTGGATACAATCTTATAGGAAAAGTGATTCCCAACAGTAGGGAAAACCCACTT
+TTATAGTCTCGCTTGGCAGACTTCTTATGTCAAAATATTGACAATTTAATTAAGGTATTT
+AGCAATAAAATCGTTTCATGGTAACTAACACTTCAAGGAGAAATATAAAAGTGTAATTAA
+TAGCATTTCATAGTTAAATAATTTATTAAGTGTAGAAATACTGATAGGTATATGTTTAAT
+TTCTTTCCATTTTGATTGTATTACTATACTATTTTTAAAAAAAGAGAAAATTTTAGGTTA
+AATGGTAATAAATCTTGGTTTCTTGTTTTCCATATCGATTTGTCAGTAAATGTAACGAAA
+TTTATTTCATTCCCATCAAAACAGCTCCCATCCAAACAACTTTATGCATGAGCACATTTA
+ACACCCCGGCCAGAAAAACCCAAGATAAGGAGAAAATCTCCACGCAATTGATTTAATATA
+AAATTTTTTAATAAAATTTGCTGCCGGAAAAAAAGTGAATTTCCAAATGGAAAAACCAGG
+GAAAATGGAAACAAGGAGGGCAGCTCGAAATTATATCTATTTGCAGAGCGCACGAGTCCT
+GATGTGGCGATTTCGGGACAGGAAGTGAAAGTGCGGGGGAAATGCGTAAGCGCCTAGGCT
+TTGGGCCAACAACTAATAAAGGCTATCAACAACAGTTCAAACAGCAGCAGCAGCATCGCA
+AACAAAAACAACAAGGACGCCAGGACAATGGGCTCAAAATCAGCCAAACAGGATGAGGAT
+GCCCAGCCTCGATGGCGCATACGCATACGCACTCAAGTGAATATTTTCTCATTTTCTTGC
+ATTTAAGTTGAGTTCGCTTTGAAGTTTTGACATTTCATAAGGCAGCAGCGAAACAAATTT
+CGTTCTTCCTCATTTCGTTTTTATTTTATTTATTTTTTTCGTTTATTCTATATATTTTTT
+TT
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/input83.fas	Thu May 30 07:13:55 2013 -0400
@@ -0,0 +1,106 @@
+>OR83b
+TTTTTATAATGTGTGCGTGTGTGTGTGTGTGTGTGTCGCATTGATTTCGC
+AATTTATGGGCGATTTGATGGATTGCTTGAATAACTTTATATGCTTATTT
+TTGAGTTTTTATTGTTTTACAACTTGCGGTATTTTATGTAGAGATCCTGT
+GGACGACCTAATGGAAATCATTTGGTTTTGGCTGAAATGCGGCCATAAAG
+GTGTGAATCAAAATAATGTTGCCTATACTTCGGGTATATCATTTCATATG
+GAAAGCGCTTAATAATAATTATATAAATATATAATTTCTAGTTAATGTGA
+CTTTATTAACCCATTAGTGCGTTTTAATCATTTAATTTGGCATCAGAATC
+GATCACAGTCACGAACACAAAAGCGTAATGGTAAAAATAAAGGCTCATTT
+GTTTAAGTTGTAAATTAAATAAAGCAAGTGTCACTTTCCATTTAAATGTT
+GCCTAATAATTAATGACAAAAGGCTGCAGGGCTCACGATGTCCGCGGTTA
+GCTAATTGATCCAAACGCATCCGCGTAATTAAACTTTCAGCCACAAGCCC
+ATAAAATAAATCAAAAAGCGAAGGACCGAAAGGGGCAACATTTAGGGGGG
+GGGGGCTTGTTTCGCATGGCTGAGTTCAGGACGATTAAACGTTAAATCAA
+TATTGTTAAATCCCCGCTCGCATCCCCGCAATCCACACAGGCAAGTGTTC
+ACGTATTAATTGATGTTCGTGAGTGTCCTGCATTTAAATAATCCATGATT
+TGGGACATCTGTGTCTGAGTTCCCATTCATATATGTATGCATATGTGTAT
+ATGAGTGGTGGAAACTAGCTGCAGATATAGCTACAGACACAGATACATTT
+ACATTCCGGCACATAGTTTTAAGTGTGATTCAGTTATTCACAATAGTCGC
+CGCTTTTTGTTCTTGCCACGTTTTAATATTGTCACAACTAGTTTCGAATA
+ACTAAATTGGATGTTTTCGATTAGCATTCAATACACTGCTCAGCAATTTC
+GTTTGCGTTGCAATTTGAGTACTAGATTTTGAATTAGACAATTGTTTTAT
+TAATTGCCTACATGTATATTACCTAACTGATTTCGAAGGCCACTTGTACG
+ACCTTGAGATAGAGTATTAATTATTTAAATTCTACTGTATTATAATTGCA
+AAGAATTGTAAGTATTCATAATATATAATGGCAACCCAATTTAAGACTTC
+TTTTGAAGGCCCCCGCCTACCGAAATTCAGTGCCTATGAGAACTGAGAAC
+GAAAAAAATTGAGCAAGGACCAAATATCCATCAGGCTGAACACACACATT
+TTCATGCAAATAGGCAATGTGTTATTTTTTTGGGTCAGCGATTCACGGAG
+GGATCCCCACCAAATGGGTTGGCTGAGGAATGGCCTATCCCCATATCTCA
+GCGGCACTTGGGGCAGGCCAACAAATACAAGCAGGCATAATAAAATAATC
+GATGCTTTTAAAATTTGCATAAGTTTGGATACCGCAGATGCCGCGCAAGG
+ATGAGCCCATCTCCAGTCCCAGTGCCATTCCGCCAGTGCGCATACGCCGC
+GTGGAGGGCACAGGACTGGGCCATGGCCCATGGCCCAAAAGCGGAGTCCT
+AGACCCGGAGACGACAGCAGTGGTGGACAAGTTCGTGGGCGTTCGATTTA
+ATTGTGGGAATTCTGCGTCTGCCACGCACCCATCACATCGATGGACGTGG
+CTGAAGAGCTGAATTTTTAAGCGCTCCAAGGCGGCCCGATACCCATATTG
+TATATTTTCATTACCATGTGTGGGTCGGAGTGAAAGTCGCGGGCTAGGAT
+TTAATGTGGCCTTGTTGCAGCCGTGGGAACTCGTCCTCAAAGTACACGTC
+CTTATGTACAGCGGAGCAAGTACCTAGCCGACAGAAGGAGCAGGCACTTG
+TCGACAGAGCTTTTTAACCTTCCGGATTTCACATTTCATTACCGTCGACA
+TCGCGGTGCTGGCAGGTCAACTGTGTCCTGGTTCCGGAAAGCCTCATATC
+TCGTATCTTAAAGTATCCCGGTTAAGCCTTAAAGAGTGAAATGATTGCCT
+AGATGATTGCTGCATTACTGGCACTCAATTAACCCAAGTGTACCAGACAA
+CAATTACATTTGTATTTTTAAAGTTCAATAGCAAGGTAATAGCACTGGGT
+CTTTCAATATTACAATATTACCAATTAGAGAACCATATATCGTACACAAT
+TGTTCCACATTCCGAATTTAATAACTCACGATCGATAGCCAAATTAATAT
+TAATTTGAGAGGACATGAGTCCACCTGAATATTCAATATGCATTATACAT
+TATCCCGCTATGAATAAAACATTCCAAATCGATTCATTTCGGGCAGGAAA
+ATTCCTTTTCTACTCGGCAAGCAAACCAAGGACTAATCACAAATACGGAA
+TATTGAACAGATTACGTTCATAATAGCTGATTGTGTTGGCGAAACCTATT
+AATTTTGTCGTGCAATTTCCGCCGCTCAACAGGATGACAACCTCGATGCA
+GCCGAGCAAGTACACGGGCCTGGTCGCCGACCTGATGCCCAACATCCGGG
+CGATGAAGTACTCCGGCCTGTTCATGCACAACTTCACGGGCGGCAGTGCC
+TTCATGAAGAAGGTGTACTCCTCCGTGCACCTGGTGTTCCTCCTCATGCA
+GTTCACCTTCATCCTGGTCAACATGGCCCTGAACGCCGAGGAGGTCAACG
+AGCTGTCGGGCAACACGATCACGACCCTCTTCTTCACCCACTGCATCACG
+AAGTTTATCTACCTGGCTGTTAACCAGAAGAATTTCTACAGGTGAGCCTC
+TGCTCACCGCACCGAGCTTACGAACACTTGGGGAATTTAAAATTTTATGT
+TTTTCCGGCAGAACATTGAATATATGGAACCAGGTGAACACGCATCCCTT
+GTTCGCCGAGTCGGATGCTCGTTACCATTCGATCGCACTGGCGAAGATGA
+GGAAGCTGTTCTTTCTGGTGATGCTGACCACAGTCGCCTCGGCCACCGCC
+TGGACCACGATCACCTTCTTTGGCGACAGCGTAAAAATGGTGGTGGACCA
+TGAGACGAACTCCAGCATCCCGGTGGAGATACCCCGGCTGCCGATTAAGT
+CCTTCTACCCGTGGAACGCCAGCCACGGCATGTTCTACATGATCAGCTTT
+GCCTTTCAGATCTACTACGTGCTCTTCTCGATGATCCACTCCAATCTATG
+CGACGTGATGTTCTGCTCTTGGCTGATATTCGCCTGCGAGCAGCTGCAGC
+ACTTGAAGGGCATCATGAAGCCGCTGATGGAGCTGTCCGCCTCGCTGGAC
+ACCTACAGGCCCAACTCGGCGGCCCTCTTCAGGTCCCTGTCGGCCAACTC
+CAAGTCGGAGCTAATTCATAATGAAGGTGATTTGTTGAGTCTGAACCTAA
+ACTTTTAGGCGGTTATTCAGTGAGCACTTCACTGAATAGGAAAATGCCAT
+GACGAGCTGTTTTTCCATTGCAGAAAAGGATCCCGGCACCGACATGGACA
+TGTCGGGCATCTACAGCTCGAAAGCGGATTGGGGCGCTCAGTTTCGAGCA
+CCCTCGACACTGCAGTCCTTTGGCGGGAACGGGGGCGGAGGCAACGGGTT
+GGTGAACGGCGCTAATCCCAACGGGCTGACCAAAAAGCAGGAGATGATGG
+TGCGCAGTGCCATCAAGTACTGGGTCGAGCGGCACAAGCACGTGGTGCGG
+TGAGTTCAAATCCTGGCCAAATTGGACCAGCCATTTCAAGGGGGCTTTGG
+CCAGTGATGATTGGATTTTTGGCGATTTAAATGGCAGAGCAGTCCACTCA
+TATTTCATGGACTTGGATTTTTGCCTTTAACAGAGCACCGAACATAATAA
+ACACACACACTTTCCCCTCAGTTTTGTAAAACTTCAATAGGCGCCATCGG
+AACATGTGTTCTCATTTATTAGGAGCTCAACAGATCCCTGCAGCTTGTTT
+GACTTACTTGATTACTTCCTCAATTGCAATCATTGTTGGGGGCCCTAGAG
+GAATGTCCTTGTTTGTCCTGTCCGACAGTTGGCGTGTGCAGTTGTTGATA
+CCAATATTGACTTGATTCCTGCCTGCAATCCCTCATCCTTTCCCCCGTTG
+CCTTTTCCCCACAGACTGGTGGCTGCCATCGGCGATACTTACGGAGCCGC
+CCTCCTCCTCCACATGCTGACCTCGACCATCAAGCTGACCCTGCTGGCAT
+ACCAGGCCACCAAAATCAACGGAGTGAATGTCTACGCCTTCACAGTCGTC
+GGATACCTAGGATACGCGCTGGCCCAGGTGTTCCACTTTTGCATCTTTGG
+CAATCGTCTGATTGAAGAGGTGAGTTTGTGCAGGGTTGCAAGATAAATTT
+ATAAGTAAATCAGACATCAGTCTCAACTGATTAATAATCGAGAACATCCT
+TATTTGAGTTATAGGGATATTTATAAAAAATTTTGAGACTTCATTAAAAC
+TAAATGAATTGTAAGTTGAGAGTCAACAGATTGGTCCGTTCACTACAAGC
+TAACCAGTGTGTTTTTTCCATGTGGTAGAAATAAAAGGGTGTTTTTGCGT
+ATGAGATAAAATTGAACCAATGTTTTCAAGTTTATAGATTGGGAAACATA
+CATAGTTCTAAACGTTGTTATAGTTATAGTTTGTGTAGTTAGTTATCTAG
+AGCATCCTTAATACGACTTTCATTTCGCAGAGTTCATCCGTCATGGAGGC
+CGCCTACTCGTGCCACTGGTACGATGGCTCCGAGGAGGCCAAGACCTTCG
+TCCAGATCGTGTGCCAGCAGTGCCAGAAGGCGATGAGCATATCGGGAGCG
+AAATTCTTCACCGTCTCCCTGGATTTGTTTGCTTCGGTTTGTTGCATTTG
+ATTTATTGATCTATTGATGGAGTTAAAACTGAATCGGATATTCCCGATTC
+GCAGGTTCTGGGTGCCGTCGTCACCTACTTTATGGTGCTGGTGCAGCTCA
+AGTAAGTTGCTGCGAAGCTGATGGATTTTTGTACCAGAAAAGCGAATGCC
+AAGAAGCCACCTACCGCCCCTTGCCCCCTCCGCACTGTGCAACCAGCAAT
+ATCACAGAGCAATTATAACGCAAATTATATATTTTATACCTGCGACGAGC
+GAGCCTCGTGGGGCATAATGGAGACATTCTGGGGCACATAGAAGCCTGCA
+AATACTTATCGATTTTGTACACGCGTAGAGCTTTTAATGTAAACCCAAGA
+TGCAAACTAAATAAATGTGTAGTG
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/outputtest1.txt	Thu May 30 07:13:55 2013 -0400
@@ -0,0 +1,30 @@
+# BLAT 35x1 [2009/02/26]
+# Query: OR83b
+# Database: /mnt/galaxydb/files/016/dataset_16882.dat
+# Fields: Query id, Subject id, % identity, alignment length, mismatches, gap openings, q. start, q. end, s. start, s. end, e-value, bit score
+OR83b	ENA|CAKG01028373|CAKG01028373.1	91.94	521	42	0	2858	3378	822	302	5.6e-258	886.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	92.99	314	22	0	2480	2793	1425	1112	2.2e-152	535.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	91.38	116	8	1	22	135	4691	4576	1.6e-46	184.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	81.12	143	27	0	634	776	4064	3922	5.7e-45	178.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	89.57	115	7	2	1388	1501	2884	2774	3.0e-43	173.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	83.81	105	17	0	1879	1983	2416	2312	3.4e-36	149.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	96.49	57	2	0	1628	1684	2656	2600	6.6e-23	105.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	87.01	77	7	3	469	543	4226	4151	7.7e-21	98.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	94.55	55	2	1	1806	1859	2478	2424	5.0e-19	92.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	76.00	100	18	2	2003	2101	2297	2203	1.0e-18	91.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	97.30	37	1	0	1751	1787	2534	2498	1.7e-11	67.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	93.55	31	2	0	2309	2339	1614	1584	2.2e-06	50.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	92.59	27	2	0	2420	2446	1479	1453	6.0e-05	46.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	89.66	29	3	0	199	227	4483	4455	1.1e-04	45.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	91.30	23	2	0	1710	1732	2577	2555	3.7e-03	40.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	100.00	19	0	0	1537	1555	2731	2713	1.2e-02	38.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	95.00	20	1	0	1594	1613	2692	2673	2.1e-02	37.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	95.83	24	0	1	1321	1344	2947	2925	5.2e-02	36.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	100.00	18	0	0	1240	1257	3024	3007	1.1e-01	35.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	94.74	19	1	0	1293	1311	2976	2958	1.7e-01	34.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	95.00	20	1	0	162	181	4519	4500	1.8e-01	34.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	94.12	17	1	0	449	465	4245	4229	3.3e+00	30.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	100.00	13	0	0	2287	2299	1629	1617	1.0e+02	25.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	94.12	17	0	1	1271	1286	2997	2981	5.7e+02	22.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	92.31	13	1	0	2448	2460	1450	1438	2.1e+03	20.0
+OR83b	ENA|CAKG01028373|CAKG01028373.1	100.00	10	0	0	1693	1702	2593	2584	3.0e+03	20.0
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_data_table_conf.xml.sample	Thu May 30 07:13:55 2013 -0400
@@ -0,0 +1,7 @@
+<tables>
+    <!-- Reference FASTA locations for BLAT. NOTE(review): table name "clc_indices" is left unchanged; confirm it is the name blat_wrapper.xml looks up. -->
+    <table name="clc_indices" comment_char="#">
+	<columns>value, dbkey, name, path</columns>
+	<file path="tool-data/blat_indices.loc"/>
+    </table>
+</tables>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_dependencies.xml	Thu May 30 07:13:55 2013 -0400
@@ -0,0 +1,21 @@
+<?xml version="1.0"?>
+<tool_dependency> <!-- Tool Shed install recipe: download the prebuilt linux x86_64 BLAT binary from UCSC, move it into $INSTALL_DIR/bin, mark it executable, and prepend that directory to PATH. NOTE(review): the download URL carries no version, so the binary fetched may not correspond to package version "1.0.0"; confirm. -->
+    <package name="blat" version="1.0.0">
+        <install version="1.0">
+            <actions>
+                <action type="download_by_url">http://hgdownload.cse.ucsc.edu/admin/exe/linux.x86_64/blat/blat</action>
+                <action type="move_file">
+                    <source>blat</source>
+                    <destination>$INSTALL_DIR/bin</destination>
+                </action>
+                <action type="shell_command">chmod +x $INSTALL_DIR/bin/blat</action>
+                <action type="set_environment">
+                    <environment_variable name="PATH" action="prepend_to">$INSTALL_DIR/bin</environment_variable>
+                </action>
+            </actions>
+        </install>
+        <readme>
+The BLAT binary for linux x86_64 is retrieved from UCSC.
+        </readme>
+    </package>
+</tool_dependency>