# HG changeset patch
# User iuc
# Date 1525306675 14400
# Node ID 26c5f217aad70c496527e0761c7d55328bf90541
# Parent 889682a276f6cd4e0f56de8d5b5909e8550070ac
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/repeat_masker commit 8dacb4321122d92df0983e0794cf23572be03224
diff -r 889682a276f6 -r 26c5f217aad7 RepeatMasker.xml
--- a/RepeatMasker.xml Sun Apr 29 07:03:52 2018 -0400
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
@@ -1,321 +0,0 @@
-
- Masks different kind of repeats
-
- RepeatMasker
-
-
-&1;
-
-## Copy the output files to galaxy
-## AgR: if there are no repeats, the output files may not exist.
-## This causes the job to fail, so touch files to ensure they exist.
-#if $adv_opts.adv_opts_selector=="advanced":
-
- #if "summary" in $output_files_list:
- ## Write out the summary file (default)
- #set $summary_file = $output_basename + '.tbl'
- touch $summary_file;
- cp $summary_file $output_summary;
- #end if
-
- #if "gff" in $output_files_list:
- ## Write out the gff file (default)
- #set $gff_file = $output_basename + '.out.gff'
- touch $gff_file;
- cp $gff_file $output_gff;
- #end if
-
- #if "html" in $output_files_list:
- ## Write out the html file
- #set $html_file = $output_basename + '.out.html'
- touch $html_file;
- cp $html_file $output_html;
- #end if
-
-#else:
-
- ## Write out the summary file (default)
- #set $summary_file = $output_basename + '.tbl'
- touch $summary_file;
- cp $summary_file $output_summary;
-
- ## Write out the gff file (default)
- #set $gff_file = $output_basename + '.out.gff'
- touch $gff_file;
- cp $gff_file $output_gff;
-
-
-## End of advanced options:
-#end if
-
-## Write out mask sequence file
-#set $mask_sequence_file = $output_basename + '.masked'
-touch $mask_sequence_file;
-cp $mask_sequence_file $output_mask;
-
-## Write out standard file (default)
-## The default '.out' file from RepeatMasker has a 3-line header and spaces rather
-## than tabs. Remove the header and replace the whitespaces with tab
-#set $standard_file = $output_basename + '.out'
-tail -n +4 $standard_file | tr -s ' ' '\t' > $output_std;
-
-## Delete all temporary files
-rm $dirname -r
-
-]]>
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
- (adv_opts['adv_opts_selector'] == 'advanced' and 'mask' in adv_opts['output_files'])
-
-
-
- (
- (adv_opts['adv_opts_selector'] == 'advanced' and 'summary' in adv_opts['output_files'])
- or
- (adv_opts['adv_opts_selector'] == 'basic')
- )
-
-
-
- (adv_opts['adv_opts_selector'] == 'advanced' and 'html' in adv_opts['output_files'])
-
-
-
- (adv_opts['adv_opts_selector'] == 'advanced' and 'gff' in adv_opts['output_files'])
-
-
-
-
-
-
-
diff -r 889682a276f6 -r 26c5f217aad7 readme.rst
--- a/readme.rst Sun Apr 29 07:03:52 2018 -0400
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
@@ -1,63 +0,0 @@
-===============================
-Galaxy wrapper for RepeatMasker
-===============================
-
-This wrapper is copyright 2013 by Björn Grüning.
-
-This is a wrapper for the command line tool of RepeatMasker from the Institute for Systems Biology.
-http://www.repeatmasker.org/
-
-
-Smit, AFA, Hubley, R & Green, P. RepeatMasker Open-3.0.
-1996-2010 .
-
-
-Additional Information:
-Using RepeatMasker to identify repetitive elements in genomic sequences.
-http://www.ncbi.nlm.nih.gov/pubmed/19274634
-
-============
-Installation
-============
-
-To install RepeatMasker, please use the following instructions:
-
-http://www.repeatmasker.org/RMDownload.html
-
-To install the wrapper copy the file RepeatMasker.xml in the galaxy tools
-folder and modify the tools_conf.xml file to make the tool available to Galaxy.
-Add a line like the following:
-
-Add the tool definition to your tool_conf.xml file under Galaxy root.
-
-
-=======
-History
-=======
-
-- v1.1: Initial public release
-- v0.1.1: patch from Simon Guest, to create empty files if no repeat is found
-- v0.1.2: remove trailing semicolon, redirect all output to stdout
-
-===============================
-Wrapper Licence (MIT/BSD style)
-===============================
-
-Permission to use, copy, modify, and distribute this software and its
-documentation with or without modifications and for any purpose and
-without fee is hereby granted, provided that any copyright notices
-appear in all copies and that both those copyright notices and this
-permission notice appear in supporting documentation, and that the
-names of the contributors or copyright holders not be used in
-advertising or publicity pertaining to distribution of the software
-without specific prior permission.
-
-THE CONTRIBUTORS AND COPYRIGHT HOLDERS OF THIS SOFTWARE DISCLAIM ALL
-WARRANTIES WITH REGARD TO THIS SOFTWARE, INCLUDING ALL IMPLIED
-WARRANTIES OF MERCHANTABILITY AND FITNESS, IN NO EVENT SHALL THE
-CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY SPECIAL, INDIRECT
-OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS
-OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE
-OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE
-OR PERFORMANCE OF THIS SOFTWARE.
-
diff -r 889682a276f6 -r 26c5f217aad7 repeatmasker.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/repeatmasker.xml Wed May 02 20:17:55 2018 -0400
@@ -0,0 +1,230 @@
+
+ RepeatMasker
+
+
+ repeatmasker
+
+
+ '${output_log}' &&
+ mv rm_input.fasta.tbl '${output_table}' &&
+ #if $gff == '-gff':
+ mv rm_input.fasta.out.gff '${output_gff}' &&
+ #end if
+ #if $advanced.keep_alignments == '-ali':
+ mv rm_input.fasta.align '${output_alignment}' &&
+ #end if
+ #if $advanced.poly == '-poly':
+ sed -r 's/^ *// ; s/ *$//; s/\+ //; s/ +/\t/g' rm_input.fasta.polyout >'${output_polymorphic}' &&
+ #end if
+ #end if
+ mv rm_input.fasta.cat '${output_repeat_catalog}'
+ ]]>
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ not advanced['is_only']
+
+
+ not advanced['is_only']
+
+
+ not advanced['is_only']
+
+
+
+ not advanced['is_only'] and advanced['keep_alignments']
+
+
+ not advanced['is_only'] and advanced['poly']
+
+
+ not advanced['is_only'] and gff is True
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ @misc{RepeatMasker,
+ title = {RepeatMasker Open-4.0},
+ howpublished = {\url{http://www.repeatmasker.org}},
+ author = {Smit, AFA and Hubley, R and Green, P.},
+ year = {2013-2015}}
+
+
+
diff -r 889682a276f6 -r 26c5f217aad7 test-data/repeats.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/repeats.fasta Wed May 02 20:17:55 2018 -0400
@@ -0,0 +1,64 @@
+>Asian_seabass_ONSAT_SB_Concensus_Lenght_170_bp
+CGAAAAATTTAATAATTTAGGGGTCTTGAGCATGGGCGTGGTAAAATGCCCTCGGTAGCG
+CCACCTACATTTTTAAACGGAACAGCCCCTCAAGCCCGTTGCGCCTAAAAATCTGAAAAT
+CTGCACACATATGTAACATCCCATGACGCACCAAAAAGTCTCTTGGAGCCA
+>Asian_seabass_MOSAT_SB_T_34a_satellite_DNA
+TTTGTGACATCACTACATAGTTTGTTGAAAACGTAC
+>Asian_seabass_MOSAT_SB_T_34b_satellite_DNA
+TTTGTGACATCACACATAGTTGTGGGTCAGTAC
+>Sat_38
+AAAAAATGTCATAGTATAGTATGGCGTCAAAAAACATG
+>Asian_seabass_Sat_217_Consensus_Length_217_bp
+AGTAAACAAGCATTATGGTTGAAACCATAATTTCCTGTCGGGAGAGCCTTTCCCTCTTTT
+GTGCACTGTATGCAATCCCAGAGTGTGAATAAGCGCTTTTCCAGCGTTTTGAGGCTTATT
+CAGCTCAGAATGGCTTAATACTGCACTATCTGACCAGGACAAAGACAAACTAAGAACTCA
+GCCACACGGACATGAAAGTTGTTTTACTTACAATATT
+>Asian_seabass_Sat_217_Consensus_Length_427_bp
+CCAGCGTTTTGAGGCTTATTCAGCTCAGAATGGCTTAATACTGCACTATCTGACCAGGAC
+AAGACAAACTAAGAACTCAACACACTGACATGAAAGTTTCTATATTTCTATTAAAATAAA
+CAAACATTATGGTTGAAACCATAATTTCATTTCGGGAGAGCCTTTCCCTCTTTGTGGCAC
+TGTATGTAATCTGAAGTGTGAATAACGCTTTTCCCGCGTTTGAGGCTTATTCAGCTCAGA
+ATGGCTTAATACTGCACTATCTGACCAGGACAAGACAAACTAAGAACTCAGCCACACGGA
+CATGAAAGTTGTTTACTTTACAATATTAGTAAACAAGCATTATGGTTGAAACCATAATTT
+CCTGTCGGGAAGAGCTTCCCTCTTTTTGTGCACTGTATGCAATCCCAGAGTGTGAATAAG
+CGCTTTT
+>Asian_seabass_Sat_LM_Consensus_Length_453_bp
+CCCAACAAAATAGCACTTACTGCTTTCCAAATTCAAGTCTGTGCCTGTGTTAGGGTAATG
+TTGGTGATAAATTGATGTACTTAGCTTATCCTGTGAAAATGGTGTAAAATGGCAGTCTCC
+ATGTTTGTTGAAGAAACTCACAACCAAGACAACCCCAAAGAGAAGCACTTATGAAGACAG
+AAATCATGAGTGGCTCTTATTGAAGTGATCAGAGTTGGACTCCATTAAGAAAATGGCTTT
+CAATGTAGTCAGTTGCTTTGTCACTTAAAACTGCCCCAACAAGTAGCACTTACTGCAATT
+TGGTAGTCAAAGTCAATGCTCAAGTTAAGGGTAATAGTAGTGACATAATAGAAAAATCTC
+TAAATATATTTGCTGGCAGCTTTAATATACAGAATGAGTGCCATGATGAATTCTTGATAC
+AGAACAGGGACTTCCAAAATCAGCCAACACTAA
+>Asian_seabass_Sat_LM_Consensus_Length_218_bp
+CCCAACAAAATAGCACTTACTGCTTTCCAAATTCAAGTCTGTGCCTGTGTTAGGGTAATG
+TTGGTGATAAATTGATGTACTTAGCTTATCCTGTGAAAATGGTGTAAAATGGCAGTCTCC
+TGTTTGTTGAAGAAACTCACAACCAAGACAACCCCAAAGAGAAGCACTTATGAAGACAGA
+AATCATGAGTGGCTCTTATTGAAGTGATCAGAGTTGG
+>Asian_seabass_Sat_LM Consensus_Length_150_bp
+CTCACAACCAAGACAACCCCAAAGAGAAGCACTTATGAAGACAGAAATCATGAGTGGCTC
+TTATTGAAGTGATCAGAGTTGGACTCCATTAAGAAAATGGCTTTCAATGTAGTCAGTTGC
+TTTGTCACTTAAAACTGCCCCAACAAGTAGCA
+>Asian_seabass_Sat_Unk_Consensus_Length_341_bp
+GTTTGGGTAAAAATATTGTCTATTTACGAGCTATCCTCTATATATTTTTGATCTGATTAA
+TAAATACCTCTAGCCCACAAACTGTGGTATTTTGCTATGTGGCAGTTCACCCGAAAGTCC
+AGTAGCATTTATCGCATTTTCTAAAGATAGTCAGTGCCTGAAAGTTTGAGGCAGATAAAC
+AAATTGTTCAAGTAAGAACTATATCTTTCTTATGATTTTACCGCAATCATACAGGTTGTT
+TCTTGTGGTCTGCTGGGCATTGTATCCCTTTGTTGTATGGATTTTTCCTTTCTTTAATGA
+TCTCCTCCCTGGAGTTTGTAATCCCTGTTTGTAGTGGAATT
+>Asian_seabass_Sat_Unk_Consensus_Length_789_bp
+CAAAAAAATGGAAAAAAAAAAAGTGGCTCATTTGAAGTGAATCAGAGTTGGGTAACATTG
+TCCTTAATTACAGCTATGCTTATATACTTGATCTGATAATAATACTCTAGCCACAATCTG
+TGGGTATTCTGCTATTTGCAGTCCACCCAAAGTCATAGCATTTAATCCATTCTAGGAAGA
+TACGTCAGTGCTGAGTTGAGCCAATAACACCAAATTGTCATAAGAACTATTATTTTCTTT
+ATGATTTTTACGCATCAGTACAGGTGTTTTCTTGTGGTTTCTGCTGCATGTATCCCTGTT
+GTAAGTGGATTCTCCTTTGCTTATGATCTCCTCCGCTGCGTTGTATCCTGTTTGTAGTGG
+ATTTCCTTGCACTGATTCTGCCCGCTCTTAATACTGAATGAACGCCCTCCCACCAGTAGT
+ACTGCCACCTTTGTTTTTTCACAAAGTGTTCAATGGCCTTGATAATGACTTGGTAACTAC
+ATCACCACTTTTTTGTACGTAATCAACAGACAATCACCCATTAAATTCATGCGGCCATTA
+GGCAGCTTGATGAGCTGGACATTTGACCTCCCCAATGAATCTTTGCTGATGGGAAACTTA
+TTGCCACCATAAAGTGAACCAGCATTGCTATGTCCATGCTGTAATTTGAAAACCCAATAC
+AAAGAAGCCCTGCATATATACCTCCCAAATTGGCTTCTGAGACCCGGGCGTAATCACTGC
+ATGGCCATAGATAAACATTGAAATCTTCTGTTGCAGTCAGTTTGCTTTTTGTCAACTTTA
+AAAACTGCC
diff -r 889682a276f6 -r 26c5f217aad7 test-data/small.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/small.fasta Wed May 02 20:17:55 2018 -0400
@@ -0,0 +1,238 @@
+>scaffold_1
+TGCTTTTCTGAGATTTATGTCAGCTCCCCATTGGGAGATACAGGAGAATCCAATATATTC
+CTGTCTCGCTTCTTTTATATTTATCCTTTCTACACCTGACATCCTCAGTGATTGAAGTGA
+CAAAAAGTGGAGCGCACGCAGTGGTCATTACCCTCCAATGGTACTTCTAATTAAGGAAAG
+ATTTTTTGCATTCACTGAGCAAAACACTTATTTGCATGAATGGAAAATCATAAATGAGGG
+GTCCATTAAACAAATTTCCTAATTGTTTGCTTTTTTTTCTTCCTACTTCACCATCCCTCT
+AAAGCTATTACTCTCTATTCTACCCCATTATCGAGTGCACAAACACCAGCCCCAAATTGT
+CTTATCTCTGCTTTGATAAATGATATTTTTTTCTCTTATAATTGTGTTTCTCTCTAGATG
+TGCGGTGTCCATCAAGACACTGGATGTCACGTGGTCACTCCTGTGAAGAGCGAACTGTGT
+GGAACCCGAAGTACTGTGTGGTTGCTGACTGTCAGATGCTGCTTCTGAATGAGGAGGAGG
+TGGTGAGAGCAGACAGCACAATCTCTTGTCTGGCATGTTCCTCTGTGTCACCATTGTCTC
+TCTCATCTGCTCGTGTGTGTGTGTGTGTGTGTCCTTGTCAATGTCATTACACAATTTATG
+TTGGTGCACTGCATGTCAGAGTCTGAACTTTGTTGGACATCTACTTTCTGTCACCTGATA
+CCTCATACTTTACACTCTAATCCCTTTTTCCTTTCTAACTGCTGCTGTGTTAAGCTGTCA
+TATTAATATACTAAATAATGATAATATTAATTCTAATAATGATAGTGAATGGAGATTCAC
+AATGAAGAAACACAAGGTCCAGACTGAACCCCTGTGCTGTGTGAAGAGTTCACTCTACAT
+TTACATTCATCCCACATCAGAGACCAGCAATAGCCAGGTTAAGCAGAGCAAGGCTGAGTC
+TGGCTCTTTGCCTCTGTTGTTTTGATTAGTGTCACACTGGATTATGCTAGTTTGTGTGAG
+ATTAGAGGTCCTGTTGTTACGAGCAAATCAGCAGTCAGCAGGGTAATCTAAATTACATTG
+TTCTGTCGGCAATATCCTCTCCTCGCTCAACAGCTTTGTGTGAGCTCATATTTAAAGCCC
+CCACAGTAGTGCAGTGCATAAAATCATGCAGATACAGATCAGAAGCTTCAGGTAATGTTT
+ACATCAAACATCAGGGGGAAAATGTGATCTCAGTGCCTCTGACCGTGGTGTGATTGTTGG
+TGCCGGACAGGCTGGTTTGAGTATTTCTAAAACTGCTGATCTCCTGGGATTTTCACACAC
+GGCATTCTCTAGAGTTTACTCAGAACGGTGTGGAAAGCAAAAAAACATCCCGCGAGCTGC
+AATCCTGCGGATGGAAACACCTTGTTGATGGGATATGTCAGAGGAATGGCCAGGCTGGAT
+CAATCTGACAGAAAGGCGGTAACTCAGATAAGCACTCTCTACAACTGTGGTGAGCAGAAA
+AGCGTTCTCAGAATGCACAACACGTTCAACCTTGAGGAAGATGTTGCTACAGCAGCAGAT
+GAAGACCACGTCTGGTTCCACTCCTGTCAGCCAAGAACATCTCAGACTGCACAGGACACC
+AAAACAAAAACACATCCTGTTTTCTACTGGTGGTAGAGTCACAATTTGGCAATAAGATAA
+ATCCATGGACCCAACTTGCCTTGTGTCAATAGACCAAGCTGCTGGTGGTCTTGGGGAATG
+TTTTCTTTACACTTTCACACTATCGGCCTATATAAAATCCTATTATAAACTGCTGTACAG
+TGCATTGGGTTTGATAAGCCCTCTAAGTCTGTATATCATGATCTCATTGATACCTGCGGC
+AATACACCCCCACAAACGCAGCTCCCTGCATTTTAAGTATTATAGAGAGTAATTTCACTG
+TCCATGTCTTTTTTGATCATAAAGCAGGTCTAGGTGCTGTATACAACACTGTATTGAAAT
+GCTGAAGCAGGTCTAGGTGCTGTATACAACACTGTATTGAAATGCTGAAGCCAATATATC
+AATCTATCTGTCTATATTTTATGAAATATCAGAGCATTTTAGTCCAAATTTGTCTGTTTT
+GTTCATTGCAATGCTGACTGCTTAACATTTTCCTCAGTGGTGGCCATCACCACAGCATTT
+ACTGGTGAGTTTTACCAAGCTACAGTGGGCCACAATGAGTTACCTGTTATTGGCCTGGCT
+CTATGGCATGCAGAAAACAGTCAGCCAATCAGAGGACAGACTCAGAGACAGACACAAAGT
+GCCCTGTTCTTGTTAGAGCAGAGATAAATGAGACAGAGGAGATGTAAAACTATACTGAGA
+TGGTTTTTTGGTTCTTAAAACCACAAATATATTGTATTACGGATATCAAAACTTCAAATA
+AAACCAGTAAAGTGTAAAACATGGGACCTCTAAATGAAGGGCTGTTTTGTTTCGTAGTTC
+TAGATTATGTCACTATGTGGCCTCGGTCTCTGTCTGCGTAAAGCGGCTACATGTAGAATT
+TGACCCACTTTGGTGCCCACATATGGTAACTAAAACACTACAGACAGTATGCACTCCAAC
+CCTATATAATTTATGTCCTTCAGTGAAGCCTACAAAATGTGCAGCATGATTTGCTATGAT
+TAATACCTAGAATTATATTAAATTTTAGAAGTTTAGAGAGATGGCTTATACCTTTTTCTG
+AGCATGGAGTCATCTCATGTAATTTGTCACATACCTTTGGCCAGCTTAAACCTGGTCATT
+CCAGTGAGAGCTGCTCACCCAAATGTTTCTGTATGCACCTCCTGCTGTGGGTGCCAATAG
+CTCATGCAAGTTGGTGTCTTTCAACTAAGGCCACTATGTGAGGACCATCAGCAGCAAATT
+AAATTAGAAGTGCCTTGGAGTTTCTCAGGCCCTCTTCTATGATCATTAAGGTCTCAGTGA
+CAGAACAGTGCCCCTTTGAGGGACTATGGCATCTTGAGCACTTAAGTTGGCCGAATGTTT
+GATCTCAAATATGAGTGCACTGTTTCAAAGTCACAAAAGCCTCTGGACAAGGCATAGTTA
+CTGGGCTTGGTTAACCTTTTTTTCATACCGGCGTGACTGCTGGAACTTGGAACATGTAGC
+CTAAGTTTCCCTTTGTCTGCAATTACTGAGGTATGCCATGTTGAAATAGAACAATAATTG
+CAGGGAGGAATTATTCCAATCGACCCATCGGCAGGCTTTCCAATACAGTGCTTTTTGTTT
+CACAGCAACAAAGAACAAGAGCTTTTAAATGCATCCATCTGGACCCTGACTATGAAAGGT
+CATTGGTAACGCTGCTGGATTTCTGTTATGTCAGCAAACTGCAGGTCAAAGCGATGATAC
+AGTCTTATAATGGCTTTCTCCAAGTGAAGGTGGGATAACATGGTTTAAACAAGCTCAGTT
+AAATGGATCAGAGCATCAACTGCTGTGAACAAGCAATCACACGGTCAAGGTCAAACATTT
+ACACTTCTGAGAGATCTGGAGAGTATGTCATGGCAGTATTGCTTTTCAGTTATTTCAGTA
+ACTGATTACGCCTTGTACTTAGTCTCAGAATTAGTGATTTGATTCAAAGTGTTTTATATA
+TGTATATTTCAAAGCAAAAATACAGCTTAGGTAAAGCTCCTTAGACTCATGCAGCCTAAT
+TTACTGTAGACATTCCTCCATGTACAGTACTGTGCAAATGTTTTAGGCAGTTTTAGGCAC
+TAAAGGTGAACTGAGGATGCAGTCCCACGATTAATTTTTATTCATCAGTTAACCTCATGT
+GAAGTGTAGTAAACAGAAAAAACCTAAATCAGATCAGTATTTCTTATGACCCCCCTCCCC
+TACCACCCATCTTTAAAACAGCTCCAGTTCTCCTCAATCCCCCTGTACTTAGGTAGTTTT
+TTTCTAGCGTCTTGGAGAAGTTGCCTCAGTTCTTCTGTGGATTTTAGGCTGTCTCTGTGT
+CTTCTGTCTCCTCATGTATTCTCAGACTGACTCCATGATGTTGAGATCAGGGCTCTGTGG
+TGGGGGGGTCAGACCATCTGTTGCGGGACTCCTTGTTCTTCTTGTCTCTGAGGATAGTTC
+TTTATGATGCTGACTGTGTGATTGGACTCATTGTCCTGCTGCAGAATTAATCTGGGACTG
+ATCAGACATCTCCCTGATTGTACTGACAAAGGATAAGAGCAAAAACCTGTAGACTGCCTA
+AAACTTCTGCACAGTACTGCACAATACTGTATGTATGTGTGATAATACTCAGAAGTGATA
+TAGAGTGGTTCAGGAGAAGCCTTAACTTACTTGTTCTTCTTTTCCCTATGATGCAATTTC
+TCTCCAAGCAAACAGTACATAATGAAATATGTCTAAGAAAACACTAGCTGTTTGTCTTTT
+TGAAACACATTTAATAATTCAGATTTAGCCACAAATTAAAAATGAGCTTATACTTTGAAC
+TTGCCCATTGGTTTTGATGTATGAAGCTGACAGATTTAGTCCACTGCATACTGCACTTTT
+TTGGATAGTGAAATAAATTAATTTATTATGCAGCATTTAAGCATATTGCTGTTATCTAGA
+ATTTTATATATTAATAGGTATATATTATATTAACTCTTCATTTGCTTAAATTTGGCCTGT
+ATATTCCTCCATTTTATACAACCTTTAGAAAACACTGGAGTGAACAAAAATGTGAGGTTC
+AAAAGTGAGAGGAAAGAAAAATCAGTGTGTGCAGCAAGACTGTAAGAGTCCCTGAACAAA
+AGTGTTGATTTATTGTTGGCTGTGAAAGTTTTTGCTGCAGGGGTTTTTGTAAACAGTGAC
+TCTTCTTTATGTCTTTGTTTCTATCTTTTTGTGTTTTCTTTTTTCATCTTATTCTATTTT
+TCTCTCTCTCTCTTCGGTCAGTTTCTCTTCTTCTCCTCCTCATACTCATGCTTCTCTTTT
+ACTCTAATGGAAAACATAGAATTGAGGTGCAGTATCACTGAGAACAGCCAATGCTGATAC
+TGTCATTTGTTATAGGATGTTTACTTAAGAAATGATTGTGGCCTTATTTGCCAAAGACGA
+TTAGGCCCTGAGCCATTTGTACAGCCAATGTGACACCTCCGTAACCATAAGAAAAATTAT
+GCTTCCACAAACAGAAAGAGAGACAAATACAGACAGTGAAAGCAAAACTATGAGAGAAGG
+GATAGCCATCTCAGCATTCAGCCAGTGTGTCACATGTCCAGAGGGCTGCAATATGAAGCC
+AATAAACTGAGAGAAAGGTGTGATTCCAGAGGGCTTTCCGGACTTTAAACTTTTCTCATT
+TTCACCTTCAGCTCGTTGTGAAGCCTTCAATTGTTCCTTGGTCACATGAAGCCCCCTGTG
+TGTAAAATTGACATTCAGCTTATTACTCTCATCTACATCTCTAAAGTTGCACATGACTGC
+CAGTAGAGGGTGCTCATGATTTGAGACAAGTAACTTTTCTGTGCTTGTGTCAACAGTTAA
+AAATTCCCTATGGATACTTGAAAGAAATGCACCAGTGTTTAAATTTAGACTCAGTCCAAG
+TAGGCTTTGCCATTTGCTTTACTGTTGTAATCAAATCAGTGCTCACAGTACATCAGTGGC
+AAAAGCAATTAGCTTAATTGAGTTAGTAGGGAGTGAAAAGATAGATCACTATTTCCTGGC
+AGCGATATATTTTTCTCAGTTAACCTTCTCACAGAAAATTAGTTAGATGAGTTTCTTATC
+TCATTAGAACCATTGTTGTTTATTATTTAAACCTGACCTTTATCCAGAGAATGTTTTTCA
+CAGTAAGCATGTGTTTCACTCCAGCTCATACAGACACACCTTGTGGCCAGTCAGGGAATG
+TGCATTAAAACTAATGTTCTCTCTGGTAGAGCCATTCTGCCTATTCTGTTATTCACCAAA
+ACTTTCCTGCCCAGATTTTTCCATCTAGTCAGGGGACTTTTTCCTCAGCTGAACTGTCAG
+TAGCCAGCTGCTCTGACCTTTACTCACCTCAGAGATTACTCATTCAAGTTATTTTACCAA
+TGATGGAATAAAGTGAATACACACATCGTGACTTCATCATACTTTCCCTCCTTTACCGTA
+CTTTCCTAACATCAGTTAGCAAATTATACACTTAAATATGCTAAAATAGAGATTTGTTTC
+AAATTGAAGAGCAACACAGGACACATTTGCTTACACAAGTGACTCTATCTTATTTTTTAA
+GTGGCTGTCATCCTCAATATCATCAATATTTTAGGCATGTGAATGTAGGTAATGAGTATT
+ACTAATTAATAATTGGATGAGTTTATGAATTCATCATTAAATAAGATTATTATGATAAAG
+CTACACATTATACTGCAATTCCGGGCCAACACTATTGTTTCGCCCTTACAGTACAGGACT
+GTACATATCACTGTCACTACAAATTGTTTCAGTGAGGCTCAGATTACAGCTCATCTTGCT
+TAGTCATTACGGCTCAGACCACCAGACAATGTCTTTACGTCAGAGAAAGTCTGAGTGAGA
+GCTGTCCTTAAAACCAAGTCCCATGAGGCAAGTAAAGAGGTGACTCGCTGAGAGGATCAG
+GGAGAGGGACAGAGAGATAAACAGACAGACATGGAAACAGAGGGACATAGAAAACAAGAC
+AGAGAGGGTGCTGCATTGAGTCGAGAGGTGTGAGGATGTTCGATAAGCCATTATCACTCT
+GCTCGGAGGACGTCAGGCCCTATCCTTTTTTCTTTGAGTCACCACTTTCTCACCACAGCC
+ATCCTTCTTCCTTTGTCTGTTTAATCTTTTGCAGCCAAACATTTGGTATGCAAACTATAG
+GAAGATATGGTCTGACACCGACTGATGTGATGCTAATGCCTTCTCTGTTTTATCCAATGA
+CTCCTCATTTATCAGGACCAATCCAGCTATTGTGTGCTATTGGCCCAACACAGCATTAAA
+CATGGTGACCAGAATAGCCACAGCAAAATAAATAACGGGCCTCTGTGACTATTGTATGTG
+CATTTCTTACAGCTGTCATTTTTCTTTTCTGTTAGCTTTCATTCTACTGTGCGTGCTCTC
+TATCTGCCTACGTTGTATCTGTGCCTTTTGTTAAATTCATTCAGCCTTTTATCTGTCTTG
+AATTTCTTTCTCTGTGTCCTCCTTTCCCTCTCTGTCTCAGCAGATCCGTCCCTTGTTTTT
+GCAGGAGAAGCGCTCTGCGTCATGCAAGGTCCATCTTCTGCGACGCACCATCAGCGTTCC
+AGTGGAAACACAGTTTCCAGAACTCCATAGCCAGCTGTCCACTGAGAGCGGTGAGTAGCC
+TGAGGACATGCCTCTGCTGTGATTAGCATGCATCATTATTTCCATACACACACTGGAAAT
+CTTTTAATCGTTTTTCTTGACACAATTTAATTAATTTAAATAATTAATAACATTGAAATC
+AACTGTTAAACACTTGTTCAACATGGTTGTGGACAAAATCATCATAATGACTGTGGAGAC
+TAAGGAGAAACAATGCTTTGTTAAAATCTTTGCTCTGGTTTTGGCTTTTTCTATATTCTA
+TTTGTGTGTGCAGTGCTGCTAAACATCATCTTAGTCAGAGTCAAACTTGAGCACTCATGC
+AGATGCTTGTTCTATTCAGTGGTCAAATGGGCAGTGTAGCTTAGGAGAAGCACTTCTTTC
+CGCTCCTCAGTGACATAACCAGTCACACACTCACACAGGCAAGTGAGCCTTTTAAAATTG
+CTGATACTATTTTTTTCTACTTCATATCCACTAGATGGAGAGCTTGGTGCTTTGTAGCAC
+TCCAGTGTACTTGGAATGTTTCATCATAACCACTAAGGCAGACATTGATAAAGGCTTCGG
+TCTCTTTCAAACTGCAGGTGTCATGTTGCACTCTCCCTATTGCTTTTATGAAAATGTAGT
+GCCGGTAATATAACACAGTTACTCTCTGCATATATCACTATGTACACTTACTTCTATGGA
+AAAGATGGAGCGCCACAGTGAAAACTGTTTTGAGTCTGTGAGGGGAAAACACAGCATCAG
+TCACAGTGAAACACTAGGTGGCACTCAGGTTTGACATTCAAGCATTTGTATCCCACAGTT
+ACTGTTGCTGGGTTGTTGGCTGGCATGCAACTTAATATGATCTATCTTTAAATCAGTGTG
+TGCAGTGGTTATTTAGTTTAAGTGCTTTTTAATGATGTCACAACATTATTTTGTCTACAC
+CCTGCATACAGCACAGTATATTAAATTTAGGTTTTATTAAGTTAAGTAATGTTCTGAGGT
+GGCATTGCCCTCAGGTATATATCCCTCAGGCAGTGTTACTGGACAGCATATAGATTGTAA
+TGTTGTGTAAGCAGTGTTGTGTAAGCTTTTTTAACCAAAATGCTCTCATGTTTCTTTGTT
+ACCACAGTGGTTTTAGTGATGTTTTGTGCTGTGAACAGAATCATGATTTCTGCAGACACT
+CCACATCTGTTTAAACAGTGATTTTCACATCTGTCTGTAACTGAGTCAGTCAGTTTGTGG
+TTGGATTGATGTGTAGTGGGATCTACAGATCATCAACCCTCGGGGAAGCCATTTAGTTCT
+GTGTTAAATAAAAATACAACTTTTGAGCACTGTTTTTTCATATTTTTCTTCATCCCTTAG
+TTGATATTAAAGGTGCTATATGTAGATTTTTGCTATCACTACATAGCCAATGTTAGGATT
+AAGAACCCCAGCAACCCGAATGTTAACTCGTACTTTGCTTCTATTTCTATTACATATTTT
+CTTCTATGGAAGTTAGGATGTTAACCAGCTAACCCCAGGTCATCTCATAATACCACTTGG
+CAATAGTCAGTCACTGTTGCATTCAGTCTGCCCCTCCAGCATGAAAGGATGAAGAAGTAC
+CGCTACCCAGAAGGCGTAGTCTAACCCCTTGTCTTGTAAACACAGCAATGGCTGAAGCTC
+TTGGTAAGTAAACAGCTGTTAATGTCAGTGTTGGCTACATAGCTAAAACTTACACATAGC
+ACCGTTAAAAAAATAAATGGTAAGTTTTTGTCCTTTTAGTTAAAGCATGTAAATGTCAGT
+TAAAACAATTTAGAAAATTTCTCATTCAAATAGTCATTTTATTTTGTGTGCTATAAATAC
+CTTCAGTTTTTTTTCTTGTACTTTATTTTAAACTCTTGTCTTTCTCTTATGCCCCTTATC
+TACCAGGAGAGGTCACACTCTTGTTGATAGCATGATAAGGAAATGAGCAGAGATGTCCTT
+ATTTCTCCTCAAAGTTATTCCCTGCATAGCACATATTTGACTTTAAAAATACAAAGACTA
+CAGGTGCTAAATCACACACACAACACCCAAAAGAATAGAGGACTTTTAAATATGTGCATC
+CCATTTTCTAATCTATATTCACCACTGATACAAGTGATGACACGGTGATGAGAAAATAAC
+GTAACATACATTATTATACAAGATTGGTATGATTGCTGTAGGTTGGTTTTGTTTATCTGA
+GAAGGGACAGAGGCTAAAAGAATAAACAAAGTCTGCCAGCTACTTCACTAATTACAGAGT
+ACCCCTGCAACTCTGCCAATGACATTCTGAAACTTTTCCATGACTATTATGTAAGATAAT
+TTTTGAATCACTGATTCAGATTTCCATAGCCAAGATACACTATTCTGCATGTTGGCTAGA
+ATACATTACAATACATTAATATATTACTGTAGTGGTTATTATGTCAGCCATTTAAACATA
+ATTTCATACTTTCAGCTGTTCGCAGGGCAAACTTTTTATTTTTGTCACCTGAATCCAGTT
+GCATTTGGATTTGAATTCAGTGGTGACTGCCAATGAAAAATAACTCACAGGGGCACTTAG
+AGATCTGAGGCGGCATTGACTGAACATCGAAGGGCTACTATTACAGAAATGCAAGTGGAA
+AAAGAATCTGATATGATACTTGCCAGTATGAAAAGCATAATTAGGACTTTAAATGCATGT
+TTTAAATGTTTTTGTGAACCATAATTTCAGTGTAAAAGTTCCAGTTATATTTTAAAAGGA
+ACTCCAAATATCCAGTGGTAGCATCAAGGTAACCTGAGATAAGTGAAAAGTAATTCTAAA
+TTAATCAGTATGTTGAAATATCAGACATTTGTGTGCATTATTGTTAGTGTGACCATGGTG
+GGATACTTCAAACACACTTGTTCATTGGCAAAATAATTGTCACATGAATTAACACAAGTG
+ACACTTTCAGTATCATACTGACAGAATGTTTGTTGTTAACTTTATCCCTGAAAACAAACA
+CTAATACATGTTCTTGTCGCCCCTTCAGTGCCTAACCTTTAAAATTGTGCTTGTGAGTGT
+GTGTATGTGAGCGCACCTGTATGGTTTTCAAATAATGTTCCACATCACAACACTACAAAC
+ACTCACATGGTCTATGTTTTACTAAATTATTCATTGGCGTAGGCCCCACCTGCTCTTGTC
+CTTGTGTGACACAGGCTCTAAATAAGCAGCATGATGAATAAAAATGACACTGAGATGAAT
+AGGAATCCACAGCAAATCAGAGAGCACTCTCATCTCGTCTCATCCTCCGACTGAATAGCG
+AGCGGCTGCCTCCTTTATTCTTTTGAACTCTTCGCGGTTTTGGCACAAACATGCCAGAGA
+CAGAGAGCGCTGTTACGCTCCCACCAGAGCAACTACGCTTAATTTTACTGAGGTGAAAGT
+TTTTTTTTTTTTTCTGGATAAAGCTTTGGAAAAGTTCTCAACTGTTGCTTCTTTAAAGAT
+GCTGGGGCATATTCTGCCCTATTTTCCAGTTTTTTACATCTCCCATAAATATTTTCACAA
+GCTGTAACATTTTAGACAGGATTAAATTGAACTAGATAACTGACCAAAGGCTGCTAAATT
+ATTTTTATGTGCCTTGTAGCACAAATACTGTCTCACATATATTTTAAGTATCTTAATATT
+CCCTCTGATGTTTAATTTAACAAAGCTGTCCTTCCCTCCATCTCTCTCCTCATAGTTTTT
+CATTACAATTAGCTCTCATTAGATAGAATTGTATTTGTTGTCTTTGTGCCAGTCACTCCA
+GTCTATTTTGCCAGCACACAACTAAATAATTGTTTTGCCTTGTCAGTGTCTTGTTTTACA
+GTTTTAATGATGAGCCCAAAACATGTCAAATATGAGGAACTATAACTTATCAAGAAAGTG
+GGGTAGTTGAGATAAAACTGTTTCCGAGGTGGAGGTTGGCTGAGCTCCATTTGGCCACAA
+AATGTAGCTGAAAGGGCAGAGAAACCCACTTTAATGGAGTACAGGTTGCATATGAGCTGG
+TAGGAAAGATATAGAATCATTATCAGCTGATAATCTAACAGTAGCAGTCAGTGTAGATGC
+TGTGCTAACGCAAAGTTGTGAAACTACTGTCTGTAAGCAACTCATCCAATTGTTATTGCT
+GCCAAGCTTAAGTATTTTAACAGCTTTTAGGTGTTGTTAGCACAGTACTCGTTTGGATCC
+GGCCATGACAAGAAATCTTTATCGGCCACTAATTTAATTAATCATCTTTTTTCAAGCAAA
+AATCACAAACTTTCTTTGGTTCCACTTTTTCTCATTGTAGATTAAATATCTTTTGGGTTT
+TGGCACAGGCTGGACAAAAAAACCTCTGAGACGCTGTGATAAGAATTTATTTTCACATTT
+TTTTTACTTTTCAGGGACTACACAATTATTTGGTGATGAAAATAATATTTTGTTGCAGCC
+CAAATGTTAACTTGCCACTCAAGCTGTCAATTCAAGAAGGCAAAAGCAACAAATACTGCT
+TTGCCGAGCTGAAATGAGAGTAGAAACCATGCCCGGGCCAGCTCAGCCTGGTCAGGTTTT
+TGAGTCCATCTATTGTTAACATTCAGGTTGCAGCACAAGGGAAGTTCCTAAATTCTTCTG
+GCATGTTAATGTTTTCCAAACTGATGTTACCAAGTCCTCGTTATGATGAGAAAAAAATAT
+GCTGAGAGTGAAATTGATCAAAGTGGAAACATTAAGCACTGCCACAGTCCCCTCCACCCA
+TCTTTCTCCCTCTCTCTCCACCGCAACGTGGAAACTGCTCCTCTCTCTCTCTCCCTCTCC
+CTCTCCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCCTCCCTCCCA
+TTCTGTGCTCCGGTATACTCGCTCTCTCACTCTCTCCCTCTCTCCCCACTCTCCAGAGAG
+GGGTTCAGTCAGACAGATGTAACACAGCAGTAGAAGCCTGAGCTGAGCTGGCAGGCTGCG
+GAGGCCAGACCAGAGCCAGCAGCTCTGACTGGAGAGAACAGCGAAGAGGTGACGGCAGCA
+GCGGCAGCACAGGGGATAAAACAGTAGTTGTAGTAGCAGTTTCAGTAGTTGTACTTCAGT
+TACAGAGCTGACTTTACCTCAGGATATGGGTGTGTTGATCTGGGCGCTCATCACCCTGTG
+AATTTAACATGGACCCTGACACCAGCACCCATCCAGAGACACAACATGGTGAGTGAGATT
+TGAAGGAGGAAAAGATTAGAAACAATGAGAGTGATACTGTGGGAAAAGTTGAGGAGCGTG
+TTAGTGAACAAGGGAGTCAGGTCACATGGTTTTCCCGTTAGGGTTGCTATTATGACTAGG
+CTCTCCATTTGGCTCTAAAGCTGTTGACTAGGGCCTCTGTGGTCAAATGAATAGGACTTC
+AGTCTGTTCTGTTGAGTAGGGGGTGAAGGGGTGAGGGGTGTTACATGGCAATGTGATGAA
+ATCAACTGCCTGCTTAAGACATTTTGCTCTAATGACCCTCTTGTCATTACTTTAACAGGG
+TTGTAAAGTTTTTTTTGCTTTTTTGTAGCTAAGAAAGTTGAGAATTGTTTTGTCTGAACT
+CTCTCTGGGATTTGTCTTGTCGGTTTTTGGCTGGTTTTTGGTGTGAGCTTCACAGAGCAG
+GAAGCTCTCCTCCTGCTCTTTGAATGGAATAATTAACTGTGAGGGCCGTGGGTGTACCAT
+TTCTGCTCAAAAGCAGCAAGATAATTTGATGGTTATGTGAATCTGTATATTTGTATGCTG
+TGTAGTGGTGCTGCATGTGGGTGTTTGTGTTAGAGACACAGAGGGGCACCAAAGAATGAA
+AGTGGGAGACAGAGGGAACGAGAAGGGGAGAGACCGAGAGAGAAGGACTTATGTACACAA
+ATAAATCCAGGGGGATCTAGACTGCACTGTAGGCCAGTGCGAATGCTCACTCTTTCTCTT
+CCCCCTCATTTTCCGCTGCCTCTTTTTTTTCCTCCACTGCTCCAAATGTTGGAGCCCAAA
+CTAGATAGTTAAAAGGCAGAAAAAAATGGTGTGTTATTAACTGGGCCAGAAAAGACGATG
+TTTTGTCTTCATGGCCGATGGGAAGGACTCTGCTGTGCTGCTGATGAAGAATGTGGTTAA
+CAGAATGAGTCAACAGAGAACATATTTCCAAGAGACTGTAGTTTCTCTTCGCCAGCGTCT
+AAGCCACATTGCTTTATGCACTGGGCTCTCTGCCATGACGGCGAAGGAGAGACAAAGAGA
+GGGGAAAGAGAATCGCTAAAGATAAAACTCTGTTTTTATCCATCTCCTGAGACACAAAAC
+TTCTGTTAGCAATCTAACCAAATAAGCGAGAACATTAAGCTTCTTCTCACCTTCCCAAAA
+TAAAATGTCAACTTCATGCAGTAATACTCACTCTCTTCTCTCAACCAGTCAGCCAGCCTC
+TTTCAGTGCATACAGCTTGAGGAGATCCCTTCTAAAGGTCCAATATAAATAGAAAAGTGG
+GAGTAGAAAGGGCAATAATCTGATATCATCTGATTACATTCACACCTCAGGCTTGCACGC
+TACAGGAAGAGTTCACGCTTCCCAAGGCTTGCAGGCATCACTTTTCACTCATTCTCAGAT
+AGACACACAAACACATGCACAGAAATATCATTGCTGTTGTTTGCAACAAATCCTGGAGTA
+GACTACTTTGCATTGAATTTCTATATGCATGTGTTTTCATATATTACACATTGCTTTTTG
+TACTTTGCATATAAAGTAGATGCTGATCTGCTATCTGCATATATAGTAGCTGCAGATAGC
+ACTGTAACTACATCTACATATTTCTTGTTTGTATCTACATCAAGCAGATAGTTGCTGATG
+CTGGACAACCTCTTCCGATATTCATTATTTTGGAAAAAAAAATATCAATGGCATTCCTAC
+CTTACAACTTAAATTAAAAGTGGTCACTTGAGTAACTGCAGAACATGTGTTCACCCAATA
+GTTTTTTTTAGAGAGTGTCACTCAAAGTATTCCTCCTTACAAGCACCCATGCCTAAATCA
diff -r 889682a276f6 -r 26c5f217aad7 test-data/small.fasta.align
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/small.fasta.align Wed May 02 20:17:55 2018 -0400
@@ -0,0 +1,104 @@
+18 0.00 0.00 0.00 scaffold_1 613 632 (13519) (GT)n#Simple_repeat 1 20 (0) m_b1s252i0 1
+
+ scaffold_1 613 GTGTGTGTGTGTGTGTGTGT 632
+
+ (GT)n#Simple_ 1 GTGTGTGTGTGTGTGTGTGT 20
+
+Matrix = Unknown
+Transitions / transversions = 1.00 (0/0)
+Gap_init rate = 0.00 (0 / 19), avg. gap size = 0.0 (0 / 0)
+
+
+16 18.30 2.22 2.22 scaffold_1 780 824 (13327) (ATAATA)n#Simple_repeat 1 45 (0) m_b1s252i1 2
+
+ scaffold_1 780 ATATTAAT-ATACTAAATAATGATAATATTAATTCTAATAATGATA 824
+ v - v - i v vv i
+ (ATAATA)n#Sim 1 ATAATAATAATAAT-AATAATAATAATAATAATAATAATAATAATA 45
+
+Matrix = Unknown
+Transitions / transversions = 0.40 (2/5)
+Gap_init rate = 0.05 (2 / 44), avg. gap size = 1.00 (2 / 2)
+
+
+12 23.88 4.55 0.00 scaffold_1 2231 2274 (11877) (CAGA)n#Simple_repeat 1 46 (0) m_b1s252i2 3
+
+ scaffold_1 2231 CAGA-AAACAGTCAGCCAATCAGA-GGACAGACTCAGAGACAGACA 2274
+ - i v v iv -i vv v
+ (CAGA)n#Simpl 1 CAGACAGACAGACAGACAGACAGACAGACAGACAGACAGACAGACA 46
+
+Matrix = Unknown
+Transitions / transversions = 0.50 (3/6)
+Gap_init rate = 0.05 (2 / 43), avg. gap size = 1.00 (2 / 2)
+
+
+15 18.42 10.20 0.00 scaffold_1 4853 4901 (9250) (TC)n#Simple_repeat 1 54 (0) m_b1s252i3 4
+
+ scaffold_1 4853 TCTATTTTTCTCTCTCTCTCT-TCGGTCAGTTTCTCT-TCT-TCTC-CTC 4898
+ v i i - vv vv i - - -
+ (TC)n#Simple_ 1 TCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTC 50
+
+ scaffold_1 4899 -CTC 4901
+ -
+ (TC)n#Simple_ 51 TCTC 54
+
+Matrix = Unknown
+Transitions / transversions = 0.60 (3/5)
+Gap_init rate = 0.10 (5 / 48), avg. gap size = 1.00 (5 / 5)
+
+
+13 19.07 1.82 7.69 scaffold_1 6230 6284 (7867) (TAATTAA)n#Simple_repeat 1 52 (0) m_b1s252i4 5
+
+ scaffold_1 6230 TAATGAGT-ATTACTAATTAATAATTGGATGAGTTTATGAATTCATCATT 6278
+ v i - v -i - i v - v v
+ (TAATTAA)n#Si 1 TAATTAATAATTAATAATTAATAATT-AAT-AATTAAT-AATTAATAATT 47
+
+ scaffold_1 6279 AAATAA 6284
+ -
+ (TAATTAA)n#Si 48 -AATAA 52
+
+Matrix = Unknown
+Transitions / transversions = 0.60 (3/5)
+Gap_init rate = 0.09 (5 / 54), avg. gap size = 1.00 (5 / 5)
+
+
+15 28.31 0.00 3.51 scaffold_1 6548 6606 (7545) (GACA)n#Simple_repeat 1 57 (0) m_b1s252i5 6
+
+ scaffold_1 6548 GACAGAGAGATAAACAGACAGACATGGAAACAGAGGGACATAGAAAACAA 6597
+ v i i viv i vi v -v i -
+ (GACA)n#Simpl 1 GACAGACAGACAGACAGACAGACAGACAGACAGACAGACAGA-CAGAC-A 48
+
+ scaffold_1 6598 GACAGAGAG 6606
+ v
+ (GACA)n#Simpl 49 GACAGACAG 57
+
+Matrix = Unknown
+Transitions / transversions = 0.86 (6/7)
+Gap_init rate = 0.03 (2 / 58), avg. gap size = 1.00 (2 / 2)
+
+
+67 2.94 1.43 0.00 scaffold_1 11981 12050 (2170) (CT)n#Simple_repeat 1 71 (0) c_b1s251i0 7
+
+ scaffold_1 11981 CTCTCTCTCTCTCCCTCTCCCTCTC-CTCTCTCTCTCTCTCTCTCTCTCT 12029
+ i i -
+ (CT)n#Simple_ 1 CTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCT 50
+
+ scaffold_1 12030 CTCTCTCTCTCTCTCTCTCTC 12050
+
+ (CT)n#Simple_ 51 CTCTCTCTCTCTCTCTCTCTC 71
+
+Matrix = Unknown
+Transitions / transversions = 1.00 (2/0)
+Gap_init rate = 0.01 (1 / 69), avg. gap size = 1.00 (1 / 1)
+
+
+19 15.37 2.78 0.00 scaffold_1 12078 12113 (2107) (CT)n#Simple_repeat 1 37 (0) m_b1s252i6 8
+
+ scaffold_1 12078 CTCGCTCTCTCACTCTCTCCCTCTCTC-CCCACTCTC 12113
+ v v i - i v
+ (CT)n#Simple_ 1 CTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTC 37
+
+Matrix = Unknown
+Transitions / transversions = 0.67 (2/3)
+Gap_init rate = 0.03 (1 / 35), avg. gap size = 1.00 (1 / 1)
+
+
diff -r 889682a276f6 -r 26c5f217aad7 test-data/small.fasta.cat
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/small.fasta.cat Wed May 02 20:17:55 2018 -0400
@@ -0,0 +1,103 @@
+18 0.00 0.00 0.00 scaffold_1 613 632 (13519) (GT)n#Simple_repeat 1 20 (0) m_b1s252i0
+
+ scaffold_1 613 GTGTGTGTGTGTGTGTGTGT 632
+
+ (GT)n#Simple_ 1 GTGTGTGTGTGTGTGTGTGT 20
+
+Matrix = Unknown
+Transitions / transversions = 1.00 (0/0)
+Gap_init rate = 0.00 (0 / 19), avg. gap size = 0.0 (0 / 0)
+
+16 18.30 2.22 2.22 scaffold_1 780 824 (13327) (ATAATA)n#Simple_repeat 1 45 (0) m_b1s252i1
+
+ scaffold_1 780 ATATTAAT-ATACTAAATAATGATAATATTAATTCTAATAATGATA 824
+ v - v - i v vv i
+ (ATAATA)n#Sim 1 ATAATAATAATAAT-AATAATAATAATAATAATAATAATAATAATA 45
+
+Matrix = Unknown
+Transitions / transversions = 0.40 (2/5)
+Gap_init rate = 0.05 (2 / 44), avg. gap size = 1.00 (2 / 2)
+
+12 23.88 4.55 0.00 scaffold_1 2231 2274 (11877) (CAGA)n#Simple_repeat 1 46 (0) m_b1s252i2
+
+ scaffold_1 2231 CAGA-AAACAGTCAGCCAATCAGA-GGACAGACTCAGAGACAGACA 2274
+ - i v v iv -i vv v
+ (CAGA)n#Simpl 1 CAGACAGACAGACAGACAGACAGACAGACAGACAGACAGACAGACA 46
+
+Matrix = Unknown
+Transitions / transversions = 0.50 (3/6)
+Gap_init rate = 0.05 (2 / 43), avg. gap size = 1.00 (2 / 2)
+
+15 18.42 10.20 0.00 scaffold_1 4853 4901 (9250) (TC)n#Simple_repeat 1 54 (0) m_b1s252i3
+
+ scaffold_1 4853 TCTATTTTTCTCTCTCTCTCT-TCGGTCAGTTTCTCT-TCT-TCTC-CTC 4898
+ v i i - vv vv i - - -
+ (TC)n#Simple_ 1 TCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTC 50
+
+ scaffold_1 4899 -CTC 4901
+ -
+ (TC)n#Simple_ 51 TCTC 54
+
+Matrix = Unknown
+Transitions / transversions = 0.60 (3/5)
+Gap_init rate = 0.10 (5 / 48), avg. gap size = 1.00 (5 / 5)
+
+13 19.07 1.82 7.69 scaffold_1 6230 6284 (7867) (TAATTAA)n#Simple_repeat 1 52 (0) m_b1s252i4
+
+ scaffold_1 6230 TAATGAGT-ATTACTAATTAATAATTGGATGAGTTTATGAATTCATCATT 6278
+ v i - v -i - i v - v v
+ (TAATTAA)n#Si 1 TAATTAATAATTAATAATTAATAATT-AAT-AATTAAT-AATTAATAATT 47
+
+ scaffold_1 6279 AAATAA 6284
+ -
+ (TAATTAA)n#Si 48 -AATAA 52
+
+Matrix = Unknown
+Transitions / transversions = 0.60 (3/5)
+Gap_init rate = 0.09 (5 / 54), avg. gap size = 1.00 (5 / 5)
+
+15 28.31 0.00 3.51 scaffold_1 6548 6606 (7545) (GACA)n#Simple_repeat 1 57 (0) m_b1s252i5
+
+ scaffold_1 6548 GACAGAGAGATAAACAGACAGACATGGAAACAGAGGGACATAGAAAACAA 6597
+ v i i viv i vi v -v i -
+ (GACA)n#Simpl 1 GACAGACAGACAGACAGACAGACAGACAGACAGACAGACAGA-CAGAC-A 48
+
+ scaffold_1 6598 GACAGAGAG 6606
+ v
+ (GACA)n#Simpl 49 GACAGACAG 57
+
+Matrix = Unknown
+Transitions / transversions = 0.86 (6/7)
+Gap_init rate = 0.03 (2 / 58), avg. gap size = 1.00 (2 / 2)
+
+67 2.94 1.43 0.00 scaffold_1 11981 12050 (2170) (CT)n#Simple_repeat 1 71 (0) c_b1s251i0
+
+ scaffold_1 11981 CTCTCTCTCTCTCCCTCTCCCTCTC-CTCTCTCTCTCTCTCTCTCTCTCT 12029
+ i i -
+ (CT)n#Simple_ 1 CTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCT 50
+
+ scaffold_1 12030 CTCTCTCTCTCTCTCTCTCTC 12050
+
+ (CT)n#Simple_ 51 CTCTCTCTCTCTCTCTCTCTC 71
+
+Matrix = Unknown
+Transitions / transversions = 1.00 (2/0)
+Gap_init rate = 0.01 (1 / 69), avg. gap size = 1.00 (1 / 1)
+
+19 15.37 2.78 0.00 scaffold_1 12078 12113 (2107) (CT)n#Simple_repeat 1 37 (0) m_b1s252i6
+
+ scaffold_1 12078 CTCGCTCTCTCACTCTCTCCCTCTCTC-CCCACTCTC 12113
+ v v i - i v
+ (CT)n#Simple_ 1 CTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTC 37
+
+Matrix = Unknown
+Transitions / transversions = 0.67 (2/3)
+Gap_init rate = 0.03 (1 / 35), avg. gap size = 1.00 (1 / 1)
+
+## Total Sequences: 1
+## Total Length: 14220
+## Total NonMask ( excluding >20bp runs of N/X bases ): 14220
+## Total NonSub ( excluding all non ACGT bases ):14220
+RepeatMasker version open-4.0.7 , default mode
+run with rmblastn version 2.2.27+
+RepeatMasker Combined Database: Dfam_Consensus-20170127
diff -r 889682a276f6 -r 26c5f217aad7 test-data/small.fasta.gff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/small.fasta.gff Wed May 02 20:17:55 2018 -0400
@@ -0,0 +1,11 @@
+##gff-version 2
+##date 2018-04-21
+##sequence-region dataset_12.dat
+scaffold_1 RepeatMasker similarity 613 632 0.0 + . Target "Motif:(GT)n" 1 20
+scaffold_1 RepeatMasker similarity 780 824 18.3 + . Target "Motif:(ATAATA)n" 1 45
+scaffold_1 RepeatMasker similarity 2231 2274 23.9 + . Target "Motif:(CAGA)n" 1 46
+scaffold_1 RepeatMasker similarity 4853 4901 18.4 + . Target "Motif:(TC)n" 1 54
+scaffold_1 RepeatMasker similarity 6230 6284 19.1 + . Target "Motif:(TAATTAA)n" 1 52
+scaffold_1 RepeatMasker similarity 6548 6606 28.3 + . Target "Motif:(GACA)n" 1 57
+scaffold_1 RepeatMasker similarity 11981 12050 2.9 + . Target "Motif:(CT)n" 1 71
+scaffold_1 RepeatMasker similarity 12078 12113 15.4 + . Target "Motif:(CT)n" 1 37
diff -r 889682a276f6 -r 26c5f217aad7 test-data/small.fasta.log
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/small.fasta.log Wed May 02 20:17:55 2018 -0400
@@ -0,0 +1,10 @@
+SW score % div. % del. % ins. query sequence pos in query: begin end (left) repeat class/family pos in repeat: begin end (left) ID
+
+18 0.0 0.0 0.0 scaffold_1 613 632 (13588) (GT)n Simple_repeat 1 20 (0) 1
+16 18.3 2.2 2.2 scaffold_1 780 824 (13396) (ATAATA)n Simple_repeat 1 45 (0) 2
+12 23.9 4.5 0.0 scaffold_1 2231 2274 (11946) (CAGA)n Simple_repeat 1 46 (0) 3
+15 18.4 10.2 0.0 scaffold_1 4853 4901 (9319) (TC)n Simple_repeat 1 54 (0) 4
+13 19.1 1.8 7.7 scaffold_1 6230 6284 (7936) (TAATTAA)n Simple_repeat 1 52 (0) 5
+15 28.3 0.0 3.5 scaffold_1 6548 6606 (7614) (GACA)n Simple_repeat 1 57 (0) 6
+67 2.9 1.4 0.0 scaffold_1 11981 12050 (2170) (CT)n Simple_repeat 1 71 (0) 7
+19 15.4 2.8 0.0 scaffold_1 12078 12113 (2107) (CT)n Simple_repeat 1 37 (0) 8
diff -r 889682a276f6 -r 26c5f217aad7 test-data/small.fasta.masked
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/small.fasta.masked Wed May 02 20:17:55 2018 -0400
@@ -0,0 +1,286 @@
+>scaffold_1
+TGCTTTTCTGAGATTTATGTCAGCTCCCCATTGGGAGATACAGGAGAATC
+CAATATATTCCTGTCTCGCTTCTTTTATATTTATCCTTTCTACACCTGAC
+ATCCTCAGTGATTGAAGTGACAAAAAGTGGAGCGCACGCAGTGGTCATTA
+CCCTCCAATGGTACTTCTAATTAAGGAAAGATTTTTTGCATTCACTGAGC
+AAAACACTTATTTGCATGAATGGAAAATCATAAATGAGGGGTCCATTAAA
+CAAATTTCCTAATTGTTTGCTTTTTTTTCTTCCTACTTCACCATCCCTCT
+AAAGCTATTACTCTCTATTCTACCCCATTATCGAGTGCACAAACACCAGC
+CCCAAATTGTCTTATCTCTGCTTTGATAAATGATATTTTTTTCTCTTATA
+ATTGTGTTTCTCTCTAGATGTGCGGTGTCCATCAAGACACTGGATGTCAC
+GTGGTCACTCCTGTGAAGAGCGAACTGTGTGGAACCCGAAGTACTGTGTG
+GTTGCTGACTGTCAGATGCTGCTTCTGAATGAGGAGGAGGTGGTGAGAGC
+AGACAGCACAATCTCTTGTCTGGCATGTTCCTCTGTGTCACCATTGTCTC
+TCTCATCTGCTCNNNNNNNNNNNNNNNNNNNNCCTTGTCAATGTCATTAC
+ACAATTTATGTTGGTGCACTGCATGTCAGAGTCTGAACTTTGTTGGACAT
+CTACTTTCTGTCACCTGATACCTCATACTTTACACTCTAATCCCTTTTTC
+CTTTCTAACTGCTGCTGTGTTAAGCTGTCNNNNNNNNNNNNNNNNNNNNN
+NNNNNNNNNNNNNNNNNNNNNNNNGTGAATGGAGATTCACAATGAAGAAA
+CACAAGGTCCAGACTGAACCCCTGTGCTGTGTGAAGAGTTCACTCTACAT
+TTACATTCATCCCACATCAGAGACCAGCAATAGCCAGGTTAAGCAGAGCA
+AGGCTGAGTCTGGCTCTTTGCCTCTGTTGTTTTGATTAGTGTCACACTGG
+ATTATGCTAGTTTGTGTGAGATTAGAGGTCCTGTTGTTACGAGCAAATCA
+GCAGTCAGCAGGGTAATCTAAATTACATTGTTCTGTCGGCAATATCCTCT
+CCTCGCTCAACAGCTTTGTGTGAGCTCATATTTAAAGCCCCCACAGTAGT
+GCAGTGCATAAAATCATGCAGATACAGATCAGAAGCTTCAGGTAATGTTT
+ACATCAAACATCAGGGGGAAAATGTGATCTCAGTGCCTCTGACCGTGGTG
+TGATTGTTGGTGCCGGACAGGCTGGTTTGAGTATTTCTAAAACTGCTGAT
+CTCCTGGGATTTTCACACACGGCATTCTCTAGAGTTTACTCAGAACGGTG
+TGGAAAGCAAAAAAACATCCCGCGAGCTGCAATCCTGCGGATGGAAACAC
+CTTGTTGATGGGATATGTCAGAGGAATGGCCAGGCTGGATCAATCTGACA
+GAAAGGCGGTAACTCAGATAAGCACTCTCTACAACTGTGGTGAGCAGAAA
+AGCGTTCTCAGAATGCACAACACGTTCAACCTTGAGGAAGATGTTGCTAC
+AGCAGCAGATGAAGACCACGTCTGGTTCCACTCCTGTCAGCCAAGAACAT
+CTCAGACTGCACAGGACACCAAAACAAAAACACATCCTGTTTTCTACTGG
+TGGTAGAGTCACAATTTGGCAATAAGATAAATCCATGGACCCAACTTGCC
+TTGTGTCAATAGACCAAGCTGCTGGTGGTCTTGGGGAATGTTTTCTTTAC
+ACTTTCACACTATCGGCCTATATAAAATCCTATTATAAACTGCTGTACAG
+TGCATTGGGTTTGATAAGCCCTCTAAGTCTGTATATCATGATCTCATTGA
+TACCTGCGGCAATACACCCCCACAAACGCAGCTCCCTGCATTTTAAGTAT
+TATAGAGAGTAATTTCACTGTCCATGTCTTTTTTGATCATAAAGCAGGTC
+TAGGTGCTGTATACAACACTGTATTGAAATGCTGAAGCAGGTCTAGGTGC
+TGTATACAACACTGTATTGAAATGCTGAAGCCAATATATCAATCTATCTG
+TCTATATTTTATGAAATATCAGAGCATTTTAGTCCAAATTTGTCTGTTTT
+GTTCATTGCAATGCTGACTGCTTAACATTTTCCTCAGTGGTGGCCATCAC
+CACAGCATTTACTGGTGAGTTTTACCAAGCTACAGTGGGCCACAATGAGT
+TACCTGTTATTGGCCTGGCTCTATGGCATGNNNNNNNNNNNNNNNNNNNN
+NNNNNNNNNNNNNNNNNNNNNNNNCAAAGTGCCCTGTTCTTGTTAGAGCA
+GAGATAAATGAGACAGAGGAGATGTAAAACTATACTGAGATGGTTTTTTG
+GTTCTTAAAACCACAAATATATTGTATTACGGATATCAAAACTTCAAATA
+AAACCAGTAAAGTGTAAAACATGGGACCTCTAAATGAAGGGCTGTTTTGT
+TTCGTAGTTCTAGATTATGTCACTATGTGGCCTCGGTCTCTGTCTGCGTA
+AAGCGGCTACATGTAGAATTTGACCCACTTTGGTGCCCACATATGGTAAC
+TAAAACACTACAGACAGTATGCACTCCAACCCTATATAATTTATGTCCTT
+CAGTGAAGCCTACAAAATGTGCAGCATGATTTGCTATGATTAATACCTAG
+AATTATATTAAATTTTAGAAGTTTAGAGAGATGGCTTATACCTTTTTCTG
+AGCATGGAGTCATCTCATGTAATTTGTCACATACCTTTGGCCAGCTTAAA
+CCTGGTCATTCCAGTGAGAGCTGCTCACCCAAATGTTTCTGTATGCACCT
+CCTGCTGTGGGTGCCAATAGCTCATGCAAGTTGGTGTCTTTCAACTAAGG
+CCACTATGTGAGGACCATCAGCAGCAAATTAAATTAGAAGTGCCTTGGAG
+TTTCTCAGGCCCTCTTCTATGATCATTAAGGTCTCAGTGACAGAACAGTG
+CCCCTTTGAGGGACTATGGCATCTTGAGCACTTAAGTTGGCCGAATGTTT
+GATCTCAAATATGAGTGCACTGTTTCAAAGTCACAAAAGCCTCTGGACAA
+GGCATAGTTACTGGGCTTGGTTAACCTTTTTTTCATACCGGCGTGACTGC
+TGGAACTTGGAACATGTAGCCTAAGTTTCCCTTTGTCTGCAATTACTGAG
+GTATGCCATGTTGAAATAGAACAATAATTGCAGGGAGGAATTATTCCAAT
+CGACCCATCGGCAGGCTTTCCAATACAGTGCTTTTTGTTTCACAGCAACA
+AAGAACAAGAGCTTTTAAATGCATCCATCTGGACCCTGACTATGAAAGGT
+CATTGGTAACGCTGCTGGATTTCTGTTATGTCAGCAAACTGCAGGTCAAA
+GCGATGATACAGTCTTATAATGGCTTTCTCCAAGTGAAGGTGGGATAACA
+TGGTTTAAACAAGCTCAGTTAAATGGATCAGAGCATCAACTGCTGTGAAC
+AAGCAATCACACGGTCAAGGTCAAACATTTACACTTCTGAGAGATCTGGA
+GAGTATGTCATGGCAGTATTGCTTTTCAGTTATTTCAGTAACTGATTACG
+CCTTGTACTTAGTCTCAGAATTAGTGATTTGATTCAAAGTGTTTTATATA
+TGTATATTTCAAAGCAAAAATACAGCTTAGGTAAAGCTCCTTAGACTCAT
+GCAGCCTAATTTACTGTAGACATTCCTCCATGTACAGTACTGTGCAAATG
+TTTTAGGCAGTTTTAGGCACTAAAGGTGAACTGAGGATGCAGTCCCACGA
+TTAATTTTTATTCATCAGTTAACCTCATGTGAAGTGTAGTAAACAGAAAA
+AACCTAAATCAGATCAGTATTTCTTATGACCCCCCTCCCCTACCACCCAT
+CTTTAAAACAGCTCCAGTTCTCCTCAATCCCCCTGTACTTAGGTAGTTTT
+TTTCTAGCGTCTTGGAGAAGTTGCCTCAGTTCTTCTGTGGATTTTAGGCT
+GTCTCTGTGTCTTCTGTCTCCTCATGTATTCTCAGACTGACTCCATGATG
+TTGAGATCAGGGCTCTGTGGTGGGGGGGTCAGACCATCTGTTGCGGGACT
+CCTTGTTCTTCTTGTCTCTGAGGATAGTTCTTTATGATGCTGACTGTGTG
+ATTGGACTCATTGTCCTGCTGCAGAATTAATCTGGGACTGATCAGACATC
+TCCCTGATTGTACTGACAAAGGATAAGAGCAAAAACCTGTAGACTGCCTA
+AAACTTCTGCACAGTACTGCACAATACTGTATGTATGTGTGATAATACTC
+AGAAGTGATATAGAGTGGTTCAGGAGAAGCCTTAACTTACTTGTTCTTCT
+TTTCCCTATGATGCAATTTCTCTCCAAGCAAACAGTACATAATGAAATAT
+GTCTAAGAAAACACTAGCTGTTTGTCTTTTTGAAACACATTTAATAATTC
+AGATTTAGCCACAAATTAAAAATGAGCTTATACTTTGAACTTGCCCATTG
+GTTTTGATGTATGAAGCTGACAGATTTAGTCCACTGCATACTGCACTTTT
+TTGGATAGTGAAATAAATTAATTTATTATGCAGCATTTAAGCATATTGCT
+GTTATCTAGAATTTTATATATTAATAGGTATATATTATATTAACTCTTCA
+TTTGCTTAAATTTGGCCTGTATATTCCTCCATTTTATACAACCTTTAGAA
+AACACTGGAGTGAACAAAAATGTGAGGTTCAAAAGTGAGAGGAAAGAAAA
+ATCAGTGTGTGCAGCAAGACTGTAAGAGTCCCTGAACAAAAGTGTTGATT
+TATTGTTGGCTGTGAAAGTTTTTGCTGCAGGGGTTTTTGTAAACAGTGAC
+TCTTCTTTATGTCTTTGTTTCTATCTTTTTGTGTTTTCTTTTTTCATCTT
+ATNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNN
+NATACTCATGCTTCTCTTTTACTCTAATGGAAAACATAGAATTGAGGTGC
+AGTATCACTGAGAACAGCCAATGCTGATACTGTCATTTGTTATAGGATGT
+TTACTTAAGAAATGATTGTGGCCTTATTTGCCAAAGACGATTAGGCCCTG
+AGCCATTTGTACAGCCAATGTGACACCTCCGTAACCATAAGAAAAATTAT
+GCTTCCACAAACAGAAAGAGAGACAAATACAGACAGTGAAAGCAAAACTA
+TGAGAGAAGGGATAGCCATCTCAGCATTCAGCCAGTGTGTCACATGTCCA
+GAGGGCTGCAATATGAAGCCAATAAACTGAGAGAAAGGTGTGATTCCAGA
+GGGCTTTCCGGACTTTAAACTTTTCTCATTTTCACCTTCAGCTCGTTGTG
+AAGCCTTCAATTGTTCCTTGGTCACATGAAGCCCCCTGTGTGTAAAATTG
+ACATTCAGCTTATTACTCTCATCTACATCTCTAAAGTTGCACATGACTGC
+CAGTAGAGGGTGCTCATGATTTGAGACAAGTAACTTTTCTGTGCTTGTGT
+CAACAGTTAAAAATTCCCTATGGATACTTGAAAGAAATGCACCAGTGTTT
+AAATTTAGACTCAGTCCAAGTAGGCTTTGCCATTTGCTTTACTGTTGTAA
+TCAAATCAGTGCTCACAGTACATCAGTGGCAAAAGCAATTAGCTTAATTG
+AGTTAGTAGGGAGTGAAAAGATAGATCACTATTTCCTGGCAGCGATATAT
+TTTTCTCAGTTAACCTTCTCACAGAAAATTAGTTAGATGAGTTTCTTATC
+TCATTAGAACCATTGTTGTTTATTATTTAAACCTGACCTTTATCCAGAGA
+ATGTTTTTCACAGTAAGCATGTGTTTCACTCCAGCTCATACAGACACACC
+TTGTGGCCAGTCAGGGAATGTGCATTAAAACTAATGTTCTCTCTGGTAGA
+GCCATTCTGCCTATTCTGTTATTCACCAAAACTTTCCTGCCCAGATTTTT
+CCATCTAGTCAGGGGACTTTTTCCTCAGCTGAACTGTCAGTAGCCAGCTG
+CTCTGACCTTTACTCACCTCAGAGATTACTCATTCAAGTTATTTTACCAA
+TGATGGAATAAAGTGAATACACACATCGTGACTTCATCATACTTTCCCTC
+CTTTACCGTACTTTCCTAACATCAGTTAGCAAATTATACACTTAAATATG
+CTAAAATAGAGATTTGTTTCAAATTGAAGAGCAACACAGGACACATTTGC
+TTACACAAGTGACTCTATCTTATTTTTTAAGTGGCTGTCATCCTCAATAT
+CATCAATATTTTAGGCATGTGAATGTAGGNNNNNNNNNNNNNNNNNNNNN
+NNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNGATTATTATGATAAAG
+CTACACATTATACTGCAATTCCGGGCCAACACTATTGTTTCGCCCTTACA
+GTACAGGACTGTACATATCACTGTCACTACAAATTGTTTCAGTGAGGCTC
+AGATTACAGCTCATCTTGCTTAGTCATTACGGCTCAGACCACCAGACAAT
+GTCTTTACGTCAGAGAAAGTCTGAGTGAGAGCTGTCCTTAAAACCAAGTC
+CCATGAGGCAAGTAAAGAGGTGACTCGCTGAGAGGATCAGGGAGAGGNNN
+NNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNN
+NNNNNNGGTGCTGCATTGAGTCGAGAGGTGTGAGGATGTTCGATAAGCCA
+TTATCACTCTGCTCGGAGGACGTCAGGCCCTATCCTTTTTTCTTTGAGTC
+ACCACTTTCTCACCACAGCCATCCTTCTTCCTTTGTCTGTTTAATCTTTT
+GCAGCCAAACATTTGGTATGCAAACTATAGGAAGATATGGTCTGACACCG
+ACTGATGTGATGCTAATGCCTTCTCTGTTTTATCCAATGACTCCTCATTT
+ATCAGGACCAATCCAGCTATTGTGTGCTATTGGCCCAACACAGCATTAAA
+CATGGTGACCAGAATAGCCACAGCAAAATAAATAACGGGCCTCTGTGACT
+ATTGTATGTGCATTTCTTACAGCTGTCATTTTTCTTTTCTGTTAGCTTTC
+ATTCTACTGTGCGTGCTCTCTATCTGCCTACGTTGTATCTGTGCCTTTTG
+TTAAATTCATTCAGCCTTTTATCTGTCTTGAATTTCTTTCTCTGTGTCCT
+CCTTTCCCTCTCTGTCTCAGCAGATCCGTCCCTTGTTTTTGCAGGAGAAG
+CGCTCTGCGTCATGCAAGGTCCATCTTCTGCGACGCACCATCAGCGTTCC
+AGTGGAAACACAGTTTCCAGAACTCCATAGCCAGCTGTCCACTGAGAGCG
+GTGAGTAGCCTGAGGACATGCCTCTGCTGTGATTAGCATGCATCATTATT
+TCCATACACACACTGGAAATCTTTTAATCGTTTTTCTTGACACAATTTAA
+TTAATTTAAATAATTAATAACATTGAAATCAACTGTTAAACACTTGTTCA
+ACATGGTTGTGGACAAAATCATCATAATGACTGTGGAGACTAAGGAGAAA
+CAATGCTTTGTTAAAATCTTTGCTCTGGTTTTGGCTTTTTCTATATTCTA
+TTTGTGTGTGCAGTGCTGCTAAACATCATCTTAGTCAGAGTCAAACTTGA
+GCACTCATGCAGATGCTTGTTCTATTCAGTGGTCAAATGGGCAGTGTAGC
+TTAGGAGAAGCACTTCTTTCCGCTCCTCAGTGACATAACCAGTCACACAC
+TCACACAGGCAAGTGAGCCTTTTAAAATTGCTGATACTATTTTTTTCTAC
+TTCATATCCACTAGATGGAGAGCTTGGTGCTTTGTAGCACTCCAGTGTAC
+TTGGAATGTTTCATCATAACCACTAAGGCAGACATTGATAAAGGCTTCGG
+TCTCTTTCAAACTGCAGGTGTCATGTTGCACTCTCCCTATTGCTTTTATG
+AAAATGTAGTGCCGGTAATATAACACAGTTACTCTCTGCATATATCACTA
+TGTACACTTACTTCTATGGAAAAGATGGAGCGCCACAGTGAAAACTGTTT
+TGAGTCTGTGAGGGGAAAACACAGCATCAGTCACAGTGAAACACTAGGTG
+GCACTCAGGTTTGACATTCAAGCATTTGTATCCCACAGTTACTGTTGCTG
+GGTTGTTGGCTGGCATGCAACTTAATATGATCTATCTTTAAATCAGTGTG
+TGCAGTGGTTATTTAGTTTAAGTGCTTTTTAATGATGTCACAACATTATT
+TTGTCTACACCCTGCATACAGCACAGTATATTAAATTTAGGTTTTATTAA
+GTTAAGTAATGTTCTGAGGTGGCATTGCCCTCAGGTATATATCCCTCAGG
+CAGTGTTACTGGACAGCATATAGATTGTAATGTTGTGTAAGCAGTGTTGT
+GTAAGCTTTTTTAACCAAAATGCTCTCATGTTTCTTTGTTACCACAGTGG
+TTTTAGTGATGTTTTGTGCTGTGAACAGAATCATGATTTCTGCAGACACT
+CCACATCTGTTTAAACAGTGATTTTCACATCTGTCTGTAACTGAGTCAGT
+CAGTTTGTGGTTGGATTGATGTGTAGTGGGATCTACAGATCATCAACCCT
+CGGGGAAGCCATTTAGTTCTGTGTTAAATAAAAATACAACTTTTGAGCAC
+TGTTTTTTCATATTTTTCTTCATCCCTTAGTTGATATTAAAGGTGCTATA
+TGTAGATTTTTGCTATCACTACATAGCCAATGTTAGGATTAAGAACCCCA
+GCAACCCGAATGTTAACTCGTACTTTGCTTCTATTTCTATTACATATTTT
+CTTCTATGGAAGTTAGGATGTTAACCAGCTAACCCCAGGTCATCTCATAA
+TACCACTTGGCAATAGTCAGTCACTGTTGCATTCAGTCTGCCCCTCCAGC
+ATGAAAGGATGAAGAAGTACCGCTACCCAGAAGGCGTAGTCTAACCCCTT
+GTCTTGTAAACACAGCAATGGCTGAAGCTCTTGGTAAGTAAACAGCTGTT
+AATGTCAGTGTTGGCTACATAGCTAAAACTTACACATAGCACCGTTAAAA
+AAATAAATGGTAAGTTTTTGTCCTTTTAGTTAAAGCATGTAAATGTCAGT
+TAAAACAATTTAGAAAATTTCTCATTCAAATAGTCATTTTATTTTGTGTG
+CTATAAATACCTTCAGTTTTTTTTCTTGTACTTTATTTTAAACTCTTGTC
+TTTCTCTTATGCCCCTTATCTACCAGGAGAGGTCACACTCTTGTTGATAG
+CATGATAAGGAAATGAGCAGAGATGTCCTTATTTCTCCTCAAAGTTATTC
+CCTGCATAGCACATATTTGACTTTAAAAATACAAAGACTACAGGTGCTAA
+ATCACACACACAACACCCAAAAGAATAGAGGACTTTTAAATATGTGCATC
+CCATTTTCTAATCTATATTCACCACTGATACAAGTGATGACACGGTGATG
+AGAAAATAACGTAACATACATTATTATACAAGATTGGTATGATTGCTGTA
+GGTTGGTTTTGTTTATCTGAGAAGGGACAGAGGCTAAAAGAATAAACAAA
+GTCTGCCAGCTACTTCACTAATTACAGAGTACCCCTGCAACTCTGCCAAT
+GACATTCTGAAACTTTTCCATGACTATTATGTAAGATAATTTTTGAATCA
+CTGATTCAGATTTCCATAGCCAAGATACACTATTCTGCATGTTGGCTAGA
+ATACATTACAATACATTAATATATTACTGTAGTGGTTATTATGTCAGCCA
+TTTAAACATAATTTCATACTTTCAGCTGTTCGCAGGGCAAACTTTTTATT
+TTTGTCACCTGAATCCAGTTGCATTTGGATTTGAATTCAGTGGTGACTGC
+CAATGAAAAATAACTCACAGGGGCACTTAGAGATCTGAGGCGGCATTGAC
+TGAACATCGAAGGGCTACTATTACAGAAATGCAAGTGGAAAAAGAATCTG
+ATATGATACTTGCCAGTATGAAAAGCATAATTAGGACTTTAAATGCATGT
+TTTAAATGTTTTTGTGAACCATAATTTCAGTGTAAAAGTTCCAGTTATAT
+TTTAAAAGGAACTCCAAATATCCAGTGGTAGCATCAAGGTAACCTGAGAT
+AAGTGAAAAGTAATTCTAAATTAATCAGTATGTTGAAATATCAGACATTT
+GTGTGCATTATTGTTAGTGTGACCATGGTGGGATACTTCAAACACACTTG
+TTCATTGGCAAAATAATTGTCACATGAATTAACACAAGTGACACTTTCAG
+TATCATACTGACAGAATGTTTGTTGTTAACTTTATCCCTGAAAACAAACA
+CTAATACATGTTCTTGTCGCCCCTTCAGTGCCTAACCTTTAAAATTGTGC
+TTGTGAGTGTGTGTATGTGAGCGCACCTGTATGGTTTTCAAATAATGTTC
+CACATCACAACACTACAAACACTCACATGGTCTATGTTTTACTAAATTAT
+TCATTGGCGTAGGCCCCACCTGCTCTTGTCCTTGTGTGACACAGGCTCTA
+AATAAGCAGCATGATGAATAAAAATGACACTGAGATGAATAGGAATCCAC
+AGCAAATCAGAGAGCACTCTCATCTCGTCTCATCCTCCGACTGAATAGCG
+AGCGGCTGCCTCCTTTATTCTTTTGAACTCTTCGCGGTTTTGGCACAAAC
+ATGCCAGAGACAGAGAGCGCTGTTACGCTCCCACCAGAGCAACTACGCTT
+AATTTTACTGAGGTGAAAGTTTTTTTTTTTTTTCTGGATAAAGCTTTGGA
+AAAGTTCTCAACTGTTGCTTCTTTAAAGATGCTGGGGCATATTCTGCCCT
+ATTTTCCAGTTTTTTACATCTCCCATAAATATTTTCACAAGCTGTAACAT
+TTTAGACAGGATTAAATTGAACTAGATAACTGACCAAAGGCTGCTAAATT
+ATTTTTATGTGCCTTGTAGCACAAATACTGTCTCACATATATTTTAAGTA
+TCTTAATATTCCCTCTGATGTTTAATTTAACAAAGCTGTCCTTCCCTCCA
+TCTCTCTCCTCATAGTTTTTCATTACAATTAGCTCTCATTAGATAGAATT
+GTATTTGTTGTCTTTGTGCCAGTCACTCCAGTCTATTTTGCCAGCACACA
+ACTAAATAATTGTTTTGCCTTGTCAGTGTCTTGTTTTACAGTTTTAATGA
+TGAGCCCAAAACATGTCAAATATGAGGAACTATAACTTATCAAGAAAGTG
+GGGTAGTTGAGATAAAACTGTTTCCGAGGTGGAGGTTGGCTGAGCTCCAT
+TTGGCCACAAAATGTAGCTGAAAGGGCAGAGAAACCCACTTTAATGGAGT
+ACAGGTTGCATATGAGCTGGTAGGAAAGATATAGAATCATTATCAGCTGA
+TAATCTAACAGTAGCAGTCAGTGTAGATGCTGTGCTAACGCAAAGTTGTG
+AAACTACTGTCTGTAAGCAACTCATCCAATTGTTATTGCTGCCAAGCTTA
+AGTATTTTAACAGCTTTTAGGTGTTGTTAGCACAGTACTCGTTTGGATCC
+GGCCATGACAAGAAATCTTTATCGGCCACTAATTTAATTAATCATCTTTT
+TTCAAGCAAAAATCACAAACTTTCTTTGGTTCCACTTTTTCTCATTGTAG
+ATTAAATATCTTTTGGGTTTTGGCACAGGCTGGACAAAAAAACCTCTGAG
+ACGCTGTGATAAGAATTTATTTTCACATTTTTTTTACTTTTCAGGGACTA
+CACAATTATTTGGTGATGAAAATAATATTTTGTTGCAGCCCAAATGTTAA
+CTTGCCACTCAAGCTGTCAATTCAAGAAGGCAAAAGCAACAAATACTGCT
+TTGCCGAGCTGAAATGAGAGTAGAAACCATGCCCGGGCCAGCTCAGCCTG
+GTCAGGTTTTTGAGTCCATCTATTGTTAACATTCAGGTTGCAGCACAAGG
+GAAGTTCCTAAATTCTTCTGGCATGTTAATGTTTTCCAAACTGATGTTAC
+CAAGTCCTCGTTATGATGAGAAAAAAATATGCTGAGAGTGAAATTGATCA
+AAGTGGAAACATTAAGCACTGCCACAGTCCCCTCCACCCATCTTTCTCCC
+TCTCTCTCCACCGCAACGTGGAAACTGCTCNNNNNNNNNNNNNNNNNNNN
+NNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNN
+CTCCCTCCCATTCTGTGCTCCGGTATANNNNNNNNNNNNNNNNNNNNNNN
+NNNNNNNNNNNNNCAGAGAGGGGTTCAGTCAGACAGATGTAACACAGCAG
+TAGAAGCCTGAGCTGAGCTGGCAGGCTGCGGAGGCCAGACCAGAGCCAGC
+AGCTCTGACTGGAGAGAACAGCGAAGAGGTGACGGCAGCAGCGGCAGCAC
+AGGGGATAAAACAGTAGTTGTAGTAGCAGTTTCAGTAGTTGTACTTCAGT
+TACAGAGCTGACTTTACCTCAGGATATGGGTGTGTTGATCTGGGCGCTCA
+TCACCCTGTGAATTTAACATGGACCCTGACACCAGCACCCATCCAGAGAC
+ACAACATGGTGAGTGAGATTTGAAGGAGGAAAAGATTAGAAACAATGAGA
+GTGATACTGTGGGAAAAGTTGAGGAGCGTGTTAGTGAACAAGGGAGTCAG
+GTCACATGGTTTTCCCGTTAGGGTTGCTATTATGACTAGGCTCTCCATTT
+GGCTCTAAAGCTGTTGACTAGGGCCTCTGTGGTCAAATGAATAGGACTTC
+AGTCTGTTCTGTTGAGTAGGGGGTGAAGGGGTGAGGGGTGTTACATGGCA
+ATGTGATGAAATCAACTGCCTGCTTAAGACATTTTGCTCTAATGACCCTC
+TTGTCATTACTTTAACAGGGTTGTAAAGTTTTTTTTGCTTTTTTGTAGCT
+AAGAAAGTTGAGAATTGTTTTGTCTGAACTCTCTCTGGGATTTGTCTTGT
+CGGTTTTTGGCTGGTTTTTGGTGTGAGCTTCACAGAGCAGGAAGCTCTCC
+TCCTGCTCTTTGAATGGAATAATTAACTGTGAGGGCCGTGGGTGTACCAT
+TTCTGCTCAAAAGCAGCAAGATAATTTGATGGTTATGTGAATCTGTATAT
+TTGTATGCTGTGTAGTGGTGCTGCATGTGGGTGTTTGTGTTAGAGACACA
+GAGGGGCACCAAAGAATGAAAGTGGGAGACAGAGGGAACGAGAAGGGGAG
+AGACCGAGAGAGAAGGACTTATGTACACAAATAAATCCAGGGGGATCTAG
+ACTGCACTGTAGGCCAGTGCGAATGCTCACTCTTTCTCTTCCCCCTCATT
+TTCCGCTGCCTCTTTTTTTTCCTCCACTGCTCCAAATGTTGGAGCCCAAA
+CTAGATAGTTAAAAGGCAGAAAAAAATGGTGTGTTATTAACTGGGCCAGA
+AAAGACGATGTTTTGTCTTCATGGCCGATGGGAAGGACTCTGCTGTGCTG
+CTGATGAAGAATGTGGTTAACAGAATGAGTCAACAGAGAACATATTTCCA
+AGAGACTGTAGTTTCTCTTCGCCAGCGTCTAAGCCACATTGCTTTATGCA
+CTGGGCTCTCTGCCATGACGGCGAAGGAGAGACAAAGAGAGGGGAAAGAG
+AATCGCTAAAGATAAAACTCTGTTTTTATCCATCTCCTGAGACACAAAAC
+TTCTGTTAGCAATCTAACCAAATAAGCGAGAACATTAAGCTTCTTCTCAC
+CTTCCCAAAATAAAATGTCAACTTCATGCAGTAATACTCACTCTCTTCTC
+TCAACCAGTCAGCCAGCCTCTTTCAGTGCATACAGCTTGAGGAGATCCCT
+TCTAAAGGTCCAATATAAATAGAAAAGTGGGAGTAGAAAGGGCAATAATC
+TGATATCATCTGATTACATTCACACCTCAGGCTTGCACGCTACAGGAAGA
+GTTCACGCTTCCCAAGGCTTGCAGGCATCACTTTTCACTCATTCTCAGAT
+AGACACACAAACACATGCACAGAAATATCATTGCTGTTGTTTGCAACAAA
+TCCTGGAGTAGACTACTTTGCATTGAATTTCTATATGCATGTGTTTTCAT
+ATATTACACATTGCTTTTTGTACTTTGCATATAAAGTAGATGCTGATCTG
+CTATCTGCATATATAGTAGCTGCAGATAGCACTGTAACTACATCTACATA
+TTTCTTGTTTGTATCTACATCAAGCAGATAGTTGCTGATGCTGGACAACC
+TCTTCCGATATTCATTATTTTGGAAAAAAAAATATCAATGGCATTCCTAC
+CTTACAACTTAAATTAAAAGTGGTCACTTGAGTAACTGCAGAACATGTGT
+TCACCCAATAGTTTTTTTTAGAGAGTGTCACTCAAAGTATTCCTCCTTAC
+AAGCACCCATGCCTAAATCA
diff -r 889682a276f6 -r 26c5f217aad7 test-data/small.fasta.poly
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/small.fasta.poly Wed May 02 20:17:55 2018 -0400
@@ -0,0 +1,2 @@
+18 0.0 0.0 0.0 scaffold_1 613 632 (13588) (GT)n Simple_repeat 1 20 (0)
+67 2.9 1.4 0.0 scaffold_1 11981 12050 (2170) (CT)n Simple_repeat 1 71 (0)
diff -r 889682a276f6 -r 26c5f217aad7 test-data/small.fasta.stats
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/small.fasta.stats Wed May 02 20:17:55 2018 -0400
@@ -0,0 +1,51 @@
+==================================================
+file name: dataset_12.dat
+sequences: 1
+total length: 14220 bp (14220 bp excl N/X-runs)
+GC level: 39.94 %
+bases masked: 378 bp ( 2.66 %)
+==================================================
+ number of length percentage
+ elements* occupied of sequence
+--------------------------------------------------
+SINEs: 0 0 bp 0.00 %
+ ALUs 0 0 bp 0.00 %
+ MIRs 0 0 bp 0.00 %
+
+LINEs: 0 0 bp 0.00 %
+ LINE1 0 0 bp 0.00 %
+ LINE2 0 0 bp 0.00 %
+ L3/CR1 0 0 bp 0.00 %
+
+LTR elements: 0 0 bp 0.00 %
+ ERVL 0 0 bp 0.00 %
+ ERVL-MaLRs 0 0 bp 0.00 %
+ ERV_classI 0 0 bp 0.00 %
+ ERV_classII 0 0 bp 0.00 %
+
+DNA elements: 0 0 bp 0.00 %
+ hAT-Charlie 0 0 bp 0.00 %
+ TcMar-Tigger 0 0 bp 0.00 %
+
+Unclassified: 0 0 bp 0.00 %
+
+Total interspersed repeats: 0 bp 0.00 %
+
+
+Small RNA: 0 0 bp 0.00 %
+
+Satellites: 0 0 bp 0.00 %
+Simple repeats: 8 378 bp 2.66 %
+Low complexity: 0 0 bp 0.00 %
+==================================================
+
+* most repeats fragmented by insertions or deletions
+ have been counted as one element
+
+
+The query species was assumed to be homo
+RepeatMasker Combined Database: Dfam_Consensus-20170127
+
+run with rmblastn version 2.2.27+
+The query was compared to unclassified sequences in ".../dataset_2.dat"
+