# HG changeset patch
# User greg
# Date 1488382194 18000
# Node ID ef6cd36613a839e67157d815c4b8d11e0657ceb8
Uploaded
diff -r 000000000000 -r ef6cd36613a8 kaks_analysis.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/kaks_analysis.xml Wed Mar 01 10:29:54 2017 -0500
@@ -0,0 +1,156 @@
+
+ and inferred maximum likelihood phylogenies
+
+ plant_tribes_kaks_analysis
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+This tool is part of the PlantTribes collection of automated modular analysis pipelines that utilize objective classifications of
+complete protein sequences from sequenced plant genomes to perform comparative evolutionary studies. It performs orthologous or paralogous Ks
+analyses of coding sequences and amino acid sequences.
+
+-----
+
+**Options**
+
+ * **Required options**
+
+ - **Select gene family clusters** - Sequences classified into gene family clusters, optionally including corresponding coding sequences.
+ - **Orthogroups or gene families proteins scaffold** - PlantTribes scaffolds data.
+ - **Protein clustering method** - One of GFam (domain architecture based clustering), OrthoFinder (broadly defined clusters) or OrthoMCL (narrowly defined clusters).
+
+ * **Multiple sequence alignments options**
+
+ - **Select method for multiple sequence alignments** - Method used for setting multiple sequence alignments.
+ - **Input sequences include corresponding coding sequences?** - Selecting 'Yes' for this option requires that the selected input data format is 'ptorthocs'.
+ - **Construct orthogroup multiple codon alignments?** - Construct orthogroup multiple codon alignments.
+ - **Sequence type used in the phylogenetic inference** - Sequence type (DNA or amino acid) used in the phylogenetic inference.
+ - **Use corresponding coding sequences?** - Selecting 'Yes' for this option requires that the selected input data format is 'ptorthocs' or this tool will produce an error.
+
+ * **Phylogenetic trees options**
+
+ - **Phylogenetic trees inference method** - Phylogenetic trees inference method.
+ - **Select rooting order configuration for rooting trees?** - If 'No' is selected, trees will be rooted using the most distant taxon present in the orthogroup.
+ - **Number of replicates for rapid bootstrap analysis and search for the best-scoring ML tree** - Number of replicates for rapid bootstrap analysis and search for the best-scoring ML tree.
+ - **Maximum number of sequences in orthogroup alignments** - Maximum number of sequences in orthogroup alignments.
+ - **Minimum number of sequences in orthogroup alignments** - Minimum number of sequences in orthogroup alignments.
+
+ * **MSA quality control options**
+
+ - **Remove sequences with gaps of** - Removes gappy sequences in alignments (i.e., 0.5 removes sequences with 50% gaps).
+ - **Select process used for gap trimming** - Either nucleotide based trimming, or trimming using trimAl's ML heuristic trimming approach.
+ - **Remove sites in alignments with gaps of** - If the process used for gap trimming is nucleotide based, this is the gap value used when removing gappy sites in alignments (i.e., 0.1 removes sites with 90% gaps).
+
+
+
+
+ @unpublished{None,
+ author = {Eric Wafula},
+ title = {None},
+ year = {None},
+ url = {https://github.com/dePamphilis/PlantTribes}
+ }
+
+ 10.1186/1471-2105-10-421
+ 10.1093/molbev/msm088
+ 10.18637/jss.v004.i02
+
+
diff -r 000000000000 -r ef6cd36613a8 plant_tribes_scaffolds.loc.sample
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/plant_tribes_scaffolds.loc.sample Wed Mar 01 10:29:54 2017 -0500
@@ -0,0 +1,4 @@
+## Plant Tribes scaffolds
+#Value Name Path Description
+#22Gv1.0 22Gv1.0 /plant_tribes/scaffolds/22Gv1.0 22 plant genomes (Angiosperms clusters, version 1.0; 22Gv1.0)
+#22Gv1.1 22Gv1.1 /plant_tribes/scaffolds/22Gv1.1 22 plant genomes (Angiosperms clusters, version 1.1; 22Gv1.1)
diff -r 000000000000 -r ef6cd36613a8 test-data/species1.faa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/species1.faa Wed Mar 01 10:29:54 2017 -0500
@@ -0,0 +1,16 @@
+>species1_11
+MGVSMGQGNPMGMHLLPSGSSSPRTSPSLRDPPLSLPVLPNSDLSVSLPDLHKLRRNEPVTSGILHVRDLSFLRPRSHNGDDDEETEEMTREQEEKYLQWRSSLVEKLAGIELNLERVKFRMSVEIPPSDDFRAMKKSWENFYASELLSSRNPVRKIAKRPDTILVRGVPSRWFAETRISSKASTLVTHTIIESC
+>species1_12
+MSAAAAALRPTEPLPLPSGLSLAPRLKLLLTFFRADLSVRPVDEWQLKTALLAFLRDPPLSLPVLPDSDLSVRTLPDLHKRRRDEPVASGVLHVRDLSFLRPRRRNGDDEEEEAEEMTREQEEEKYFQWRSSLVEKLAGIELNLEGVKFRMSVEIPPSDDFRAMKKSWENFYASELLSSRNPVRKIAKRPDTILVRGVPSRWFAETRISSKASTLVTHTIFSALGKIRNLNISSDDEWGAKQDGTNKEIISGLNCKVWVQFENYDDFNSAMQALCGRSLEKEGSRLKVDYEVTWDHEGFFRNAQYEPVRSNLEERNSSAHGRKKHYTSRIESDHRKRFRD
+>species1_15
+MKDGLSLSFALISSSPDSKCELLNSRPSCRAARRGESGLLIRRSYLRPCQCPFGDRMSEQQDSTSKSSSSSISSSTQESEEEVSITIGSLLAQAKNNSGHSLGRRLSQLGSIPHTPRVNGKIPNLDNATLDHERLSERLGNYGLAEFQIEGDGNCQFRALADQIFRNPDYHKHVRKLVMKQLKEFRKQYESYVPMEYKVYLKKMKRSGEWGDHLTLQAAADRFGAKICLLTSFRDTCLIEIVPRDVTPTRELWLSFWCEVHYNSLYATDDLLTRKTKKKHWLF
+>species1_16
+MSEQQDHASKSSCSSLSTSTQESEEDVTVGTLLTEAKNSGRSLGKRLSHLDSIPHTPRVNGQIPDVNNATIDHETLLERLGTYGLAEFQIEGDGNCQFRALADQIFRNPDYHKHVRKSVVKQLKEFRKHYEGYVPMEYKVYLKKMKRSGEWGDHVTLQAAADRFAAKICLLTSFRDTCLIEIVPRGATPTKELWLSFWSEVHYNSLYATEDLPNRKTRKKHWLF
+>species1_21
+MAGAGAGESLDLPVVDLASSDLAAAAKSVRKACVEYGFFYVVNHGAEGLAEKVFGESSKFFEQPLGEKMALLRNRNYLGYTPLGADKLDASSKFKGDLNENYCIGPIRKEGYQNDANQWPSEENFPCWKETMKLYHETALATGKRILSLIALSLNLDVEFFDCPVAFLRLLHYPGEANESDDGNYGASAHSDYGVLTLVATDGTPGLQICREKDRCPQLWEDVHHIEGALIVNIGDLLQRWTNCVFRSTLHRVVAVGKERYSVAFFLHTNPDLVVQCLESCCSEACPPRFPPIRSGDYLEDRLRARYK
+>species1_22
+MWGPHIILYLQPFFLLPSSHMSCVLGRPSAPSLDHPQQPNPPPVAPEKPPAVAKKAAEEEEEKKPPKQARRERHAWSSRSAAAEAVGLGLGGSFANRARGEQVAAGWPAWLSAVVGEAIDGWTLRRADSFEKIDKVRTPALALAIVGGGGRELSSSVLSVAQIGQGTYINVYKARDTVTGKIVALKKMGQVCFLLCKPSYRGDTAAGGRGGRRRQQQQTAALAEEESGMAGGGGGGNRLDLPVVDLASSDPRAAAESIRKACVESGFFYVVNHGVEEGLLKRLFAESSKFFELPMEEKIALRRNSNHRGYTPPYAEKLDPSSKFEGDLKESFYIGPIGDEGLQNDANQWPSEERLPSRRETIKMYHASALSTGKRILSLIALSLNLDAEFFENIGAFSCPSAFLRLLHYPGEVDDSDDGNYGASAHSDYGMITLLATDGTPGLQICREKNRNPQLWEDVHHIDGALIVNIGDLLERWTNCIYRSTVHRVVAVGKERYSAAFFLDPNPDLVVQCLESCCSESCPPRFSPIKSGDYLKERLSATYK
+>species1_35
+MAAATTSRRGPGAMDDENLTFETSPGVEVISSFDQMGIRDDLLRGIYAYGFEKPSAIQQRAVLPIISGRDVIAQAQSGTGKTSMISLSVCQIVDTAVREVQALILSPTRELAAQTERVMLAIGDFINIQVHACIGGKSIGEDIRKLEHGVHVVSGTPGRVCDMIKRRTLRTRAIKLLILDEADEMLGRGFKDQIYDVYRYLPPELQVCLISATLPHEILEMTSKFMTDPVRILVKRDELTLEGIKQFFVAVEKEEWKFDTLCDLYDTLTITQAVIFCNTKRKVDWLTERMRSNNFTVSAMHGDMPQKERDAIMGEFRSGATRVLITTDVWARGLDVQQVSLVINYDLPNNRELYIHRIGRSGRFGRKGVAINFVKKEDIRILRDIEQYYSTQIDEMPMNVADLI
+>species1_36
+MAAATTSRRGPGAMDDENLTFETSPGVEVISSFDQMGIREDLLRGIYAYGFEKPSAIQQRAVLPIISGRDVIAQAQSGTGKTSMISLSVCQIVDTAVREVQALILSPTRELAAQTERVMLAIGDYINIQVHACIGGKSIGEDIRKLEHGVHVVSGTPGRVCDMIKRRTLRTRAIKLLILDEADEMLGRGFKDQIYDVYRYLPPELQVCLISATLPHEILEMTSKFMTDPVRILVKRDELTLEGIKQFFVAVEKEEWKFDTLCDLYDTLTITQAVIFCNTKRKVDWLTERMRSNNFTVSAMHGDMPQKERDAIMGEFRSGATRVLITTDVWARGLDVQQVSLVINYDLPNNRELYIHRIGRSGRFGRKGVAINFVKKEDIRILRDIEQYYSTQIDEMPMNVADLI
diff -r 000000000000 -r ef6cd36613a8 test-data/species1.fna
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/species1.fna Wed Mar 01 10:29:54 2017 -0500
@@ -0,0 +1,16 @@
+>species1_11
+ATGGGTGTGAGTATGGGGCAAGGAAACCCAATGGGTATGCACTTGTTGCCATCTGGCAGCTCAAGTCCGCGCACCTCGCCTTCCCTCCGCGACCCGCCCCTCTCCCTCCCCGTCCTTCCCAACTCCGACCTCTCCGTGTCCCTCCCCGACCTGCATAAGCTTCGCCGCAATGAGCCCGTCACTTCGGGCATCCTCCACGTCCGCGACCTCTCATTCCTCCGCCCCCGCAGCCACAACGGGGATGATGATGAGGAGACCGAGGAGATGACCCGTGAGCAGGAGGAGAAGTACTTGCAGTGGAGGAGCTCCCTGGTCGAGAAGCTGGCCGGGATCGAGCTCAACCTCGAGAGGGTTAAGTTTCGGATGAGCGTCGAAATCCCGCCCTCCGATGACTTCAGGGCAATGAAGAAGTCTTGGGAGAATTTCTACGCCTCCGAGCTCCTCAGTAGCAGGAATCCTGTGAGGAAGATAGCGAAAAGGCCAGACACAATTCTTGTCCGTGGTGTGCCATCCAGGTGGTTTGCGGAGACGAGGATATCATCGAAAGCCTCCACACTGGTCACACACACTATCATCGAAAGCTGC
+>species1_12
+ATGTCCGCCGCCGCCGCCGCCCTCCGGCCGACCGAGCCGCTCCCCCTCCCGAGCGGCCTCTCCCTCGCGCCGCGCCTCAAGCTGCTCCTCACCTTCTTCCGCGCCGACCTCTCCGTCCGCCCCGTCGACGAGTGGCAGCTCAAGACCGCGCTCCTCGCCTTCCTCCGCGACCCGCCCCTCTCCCTCCCCGTCCTCCCCGACTCCGACCTCTCCGTGCGCACCCTCCCCGACCTGCATAAGCGCCGCCGCGACGAGCCCGTCGCCTCGGGCGTCCTCCACGTCCGCGACCTCTCCTTCCTCCGCCCACGCCGCCGCAACGGGGATGATGAGGAGGAGGAGGCCGAGGAGATGACCCGTGAGCAGGAGGAGGAGAAGTACTTCCAGTGGAGGAGCTCCCTGGTCGAGAAGCTGGCCGGGATCGAGCTCAACCTCGAGGGGGTTAAGTTTCGGATGAGCGTCGAGATCCCGCCCTCCGATGACTTCAGGGCAATGAAGAAGTCTTGGGAGAATTTCTACGCCTCCGAGCTCCTCAGTAGCAGGAATCCTGTGAGGAAGATAGCGAAAAGGCCAGACACCATTCTTGTCCGGGGTGTGCCATCCAGGTGGTTTGCGGAGACGAGGATATCATCGAAAGCCTCCACGCTGGTCACACACACTATTTTCTCGGCACTTGGTAAAATAAGGAACCTTAATATTTCTAGTGATGATGAATGGGGAGCAAAACAAGACGGAACCAATAAGGAGATTATATCTGGACTAAATTGCAAAGTGTGGGTGCAATTTGAGAACTACGACGATTTCAACAGTGCAATGCAGGCATTATGTGGACGTTCATTAGAAAAAGAAGGATCACGGTTGAAGGTAGACTATGAAGTAACTTGGGATCATGAAGGTTTCTTCCGCAATGCACAATACGAGCCTGTTCGCAGCAATTTAGAAGAGAGAAATTCATCGGCTCATGGAAGGAAGAAACATTACACATCGCGAATTGAGTCAGATCATAGAAAGAGATTTAGGGAT
+>species1_15
+ATGAAAGATGGCCTTTCTCTCTCCTTCGCTCTCATCAGCTCGAGCCCCGACAGCAAGTGTGAGCTACTGAACTCGAGACCCTCCTGTCGCGCGGCGCGGCGCGGCGAGAGTGGCCTTTTGATCCGACGAAGCTATCTAAGACCCTGCCAATGTCCATTTGGAGATAGGATGTCGGAACAGCAGGATAGTACTAGTAAAAGCTCTAGCTCAAGCATCAGCAGCAGTACACAGGAGAGCGAGGAGGAGGTATCTATAACAATAGGTAGCCTCCTCGCCCAAGCAAAGAACAACAGTGGGCATAGTCTTGGAAGGCGCCTCTCTCAATTGGGTTCAATCCCGCACACTCCTCGAGTTAATGGAAAAATCCCTAATCTTGATAATGCAACTTTGGATCATGAAAGATTGTCGGAAAGGTTGGGAAATTATGGTTTGGCCGAGTTTCAAATAGAGGGTGATGGAAATTGTCAGTTCCGAGCTTTGGCAGACCAGATATTTCGCAACCCCGATTATCACAAACATGTGAGAAAGTTAGTCATGAAACAGCTAAAGGAATTCAGAAAACAGTATGAAAGCTATGTACCTATGGAATATAAAGTCTACTTGAAGAAAATGAAAAGATCTGGGGAATGGGGGGATCATCTGACTTTACAAGCAGCTGCAGACAGGTTTGGTGCCAAAATTTGTTTGCTGACGTCATTCAGAGACACCTGCCTAATTGAGATAGTCCCCAGGGATGTGACTCCCACAAGGGAGTTGTGGCTAAGCTTCTGGTGTGAAGTGCACTACAATTCCTTGTACGCAACTGACGATCTCCTAACCCGCAAAACCAAGAAGAAGCATTGGTTGTTC
+>species1_16
+ATGTCTGAACAACAGGATCATGCTAGCAAAAGTTCTTGCTCAAGTCTTAGCACCAGTACTCAGGAGAGTGAGGAGGATGTGACAGTTGGTACCCTTTTAACTGAAGCAAAGAACAGTGGACGGAGTCTTGGAAAACGCCTTTCCCACTTAGATTCTATCCCGCACACTCCTCGAGTTAATGGGCAAATTCCTGATGTTAATAATGCAACAATAGACCATGAAACATTACTGGAAAGATTGGGCACTTATGGCTTAGCTGAATTCCAAATTGAAGGAGACGGAAATTGTCAGTTCCGAGCTTTGGCAGATCAGATATTCCGCAATCCTGACTATCACAAACATGTGAGGAAGTCAGTCGTGAAGCAGCTAAAGGAATTCAGGAAACACTATGAAGGCTATGTACCGATGGAATATAAGGTGTACTTGAAGAAAATGAAAAGATCTGGAGAATGGGGAGATCATGTGACCTTACAAGCGGCTGCAGACCGGTTTGCTGCCAAGATTTGCCTGCTGACATCATTTAGAGACACATGCCTAATCGAGATAGTCCCCAGAGGTGCCACTCCCACAAAAGAGCTTTGGTTAAGCTTCTGGAGTGAGGTGCACTACAATTCCTTGTATGCAACTGAAGATCTTCCAAATCGCAAGACCAGAAAGAAGCACTGGCTGTTC
+>species1_21
+ATGGCCGGCGCCGGCGCCGGCGAGAGCCTGGACCTCCCCGTGGTGGACCTAGCGTCCTCCGACCTCGCCGCCGCCGCCAAATCCGTCCGAAAGGCTTGCGTGGAGTACGGATTCTTCTACGTGGTCAACCATGGAGCCGAGGGATTGGCGGAGAAGGTGTTCGGGGAGAGCAGCAAGTTTTTCGAGCAGCCGCTGGGGGAGAAGATGGCGCTGCTGAGGAACAGAAACTACCTGGGGTACACCCCGCTTGGCGCCGATAAGCTCGACGCCTCGTCCAAATTCAAAGGAGATCTCAATGAAAATTACTGTATCGGACCTATCAGAAAAGAAGGTTATCAGAATGATGCTAACCAATGGCCTTCTGAAGAGAATTTCCCATGTTGGAAGGAGACAATGAAGCTATACCATGAAACTGCACTTGCTACTGGTAAAAGGATACTCTCTCTAATTGCTCTGAGTTTGAATCTCGACGTTGAATTCTTTGACTGCCCAGTGGCCTTTCTTCGGTTATTGCACTACCCAGGTGAAGCTAACGAGTCCGATGATGGCAATTATGGTGCATCAGCTCACTCAGACTATGGAGTACTAACACTTGTAGCAACAGATGGCACTCCTGGGCTGCAGATATGCAGGGAGAAGGATAGGTGCCCCCAGCTTTGGGAAGACGTTCATCACATTGAAGGGGCCCTGATTGTTAATATCGGCGATTTGCTACAAAGGTGGACTAATTGTGTTTTCAGGTCTACACTGCATCGCGTTGTTGCAGTTGGTAAAGAGCGATACTCTGTGGCTTTCTTTCTTCACACAAACCCTGATTTAGTGGTTCAATGCTTGGAAAGCTGCTGCAGTGAGGCATGCCCACCGAGGTTCCCACCTATAAGGAGCGGCGACTATTTGGAAGACCGATTGAGGGCTAGATACAAA
+>species1_22
+ATGTGGGGCCCACATATCATCCTCTATCTCCAACCCTTCTTCCTCCTCCCTTCCTCTCACATGAGCTGCGTCCTCGGCCGCCCCTCCGCCCCCTCCCTCGACCACCCCCAGCAGCCCAACCCCCCGCCCGTCGCCCCGGAGAAGCCGCCCGCCGTCGCCAAGAAGGCGGCCGAGGAGGAGGAGGAGAAGAAGCCGCCGAAGCAGGCTAGGAGGGAGAGGCACGCATGGTCGTCGCGGTCTGCCGCCGCCGAGGCGGTCGGCCTGGGGCTCGGGGGGAGCTTCGCCAACAGGGCGCGCGGGGAGCAGGTGGCGGCCGGCTGGCCCGCCTGGCTCTCCGCCGTCGTCGGCGAGGCCATCGACGGCTGGACCCTGCGCCGCGCCGACTCCTTCGAGAAGATCGACAAGGTACGTACTCCTGCCCTCGCGCTCGCCATTGTTGGTGGTGGGGGAAGGGAACTGAGCTCATCGGTCTTGTCGGTGGCGCAGATCGGGCAGGGGACGTACATCAACGTGTACAAGGCGCGGGACACGGTGACGGGCAAGATCGTGGCGCTCAAGAAGATGGGCCAAGTTTGCTTCCTTCTCTGTAAGCCCAGTTACCGTGGGGATACAGCCGCCGGCGGACGCGGAGGGCGGCGGCGGCAGCAGCAGCAAACCGCCGCTTTGGCAGAAGAGGAATCCGGGATGGCCGGCGGCGGCGGCGGCGGGAATCGCCTGGACCTCCCCGTGGTGGACCTCGCGTCCTCCGACCCCCGAGCCGCCGCCGAGTCCATCCGAAAGGCGTGCGTGGAGTCCGGATTCTTCTACGTGGTCAACCATGGGGTGGAGGAGGGATTGCTGAAGAGGTTGTTCGCGGAGAGCTCGAAGTTCTTCGAGCTGCCGATGGAGGAGAAGATAGCGCTGCGGAGGAACAGCAACCACCGGGGATACACCCCGCCCTACGCCGAGAAGCTCGATCCCTCGTCCAAATTCGAAGGAGACCTCAAGGAAAGTTTCTATATTGGGCCTATTGGAGATGAAGGTTTGCAGAATGATGCTAACCAGTGGCCTTCTGAAGAGCGCTTACCAAGTCGGAGGGAGACAATTAAGATGTACCATGCAAGTGCACTGTCTACTGGCAAAAGGATACTCTCTCTAATCGCTCTGAGTTTGAATCTTGACGCTGAATTCTTTGAGAACATTGGTGCCTTCAGCTGCCCATCAGCATTTCTTCGATTATTGCACTACCCAGGTGAAGTAGACGACTCTGATGATGGCAATTATGGTGCATCAGCTCACTCTGATTATGGAATGATAACCCTCCTAGCAACAGACGGCACTCCTGGGCTACAGATATGCAGGGAAAAGAATAGGAATCCCCAGCTCTGGGAAGATGTTCATCACATTGATGGGGCCCTGATTGTTAACATTGGCGATTTGCTAGAAAGGTGGACGAATTGTATTTACAGGTCTACAGTGCACCGTGTTGTTGCAGTTGGTAAAGAGCGATATTCTGCGGCTTTTTTTCTTGACCCAAACCCTGATTTAGTGGTTCAGTGTTTGGAAAGCTGTTGCAGCGAGTCATGCCCACCGAGGTTCTCACCTATAAAGAGTGGCGACTATTTGAAAGAGCGATTGAGCGCTACATACAAA
+>species1_35
+ATGGCGGCGGCCACCACGTCGCGGCGCGGCCCGGGCGCCATGGACGACGAGAACCTCACCTTCGAGACCTCCCCGGGGGTCGAGGTCATCAGCAGCTTCGACCAGATGGGGATCCGCGACGACCTCCTCCGCGGCATCTACGCCTACGGCTTCGAGAAGCCCTCCGCCATCCAGCAGCGCGCCGTCCTCCCCATCATCAGCGGCCGCGACGTCATCGCCCAGGCCCAGTCCGGGACCGGCAAGACCTCCATGATCTCGCTCTCCGTCTGCCAGATCGTAGACACCGCCGTCCGTGAGGTGCAGGCTTTAATACTGTCACCAACTAGAGAACTTGCTGCACAAACAGAAAGAGTTATGCTGGCTATCGGTGACTTCATCAATATCCAAGTGCATGCTTGTATTGGTGGCAAAAGTATTGGTGAGGATATTAGAAAGCTTGAGCACGGAGTGCATGTGGTGTCAGGAACACCTGGCAGAGTCTGTGATATGATCAAGAGAAGGACCTTGCGTACAAGAGCCATTAAGCTCCTAATTCTGGATGAAGCTGATGAGATGTTGGGCAGAGGCTTTAAGGATCAGATATATGATGTGTACAGATACCTCCCTCCAGAACTCCAGGTTTGCTTGATCTCCGCAACTCTGCCTCACGAGATCTTGGAAATGACCAGCAAGTTCATGACTGATCCAGTTCGGATCCTTGTGAAGCGTGATGAATTGACTCTAGAGGGCATCAAACAATTCTTTGTTGCTGTTGAGAAAGAAGAATGGAAGTTTGACACGCTTTGTGATCTTTATGATACACTGACAATCACCCAAGCTGTCATTTTCTGCAACACAAAGAGAAAGGTTGATTGGCTTACGGAAAGAATGCGCAGCAATAACTTCACAGTATCAGCTATGCATGGCGACATGCCTCAAAAGGAAAGGGATGCCATTATGGGTGAATTCAGGTCTGGTGCAACCCGTGTTCTAATCACGACAGATGTGTGGGCTCGAGGCCTCGATGTTCAGCAGGTCTCTCTTGTCATAAATTATGATCTCCCAAATAATCGTGAACTTTACATCCATCGCATTGGTCGCTCTGGACGTTTTGGTCGCAAGGGTGTGGCCATCAATTTTGTCAAAAAGGAAGACATCCGTATCCTGAGAGATATCGAGCAGTACTACAGCACGCAGATTGATGAAATGCCAATGAATGTTGCTGATCTAATT
+>species1_36
+ATGGCGGCGGCCACCACGTCCCGGCGCGGCCCCGGCGCCATGGACGACGAGAACCTCACCTTCGAGACCTCCCCCGGGGTCGAGGTCATCAGCAGCTTCGACCAGATGGGGATCCGCGAGGACCTCCTCCGCGGCATCTACGCCTACGGCTTCGAGAAGCCCTCCGCCATCCAGCAGCGCGCCGTCCTCCCCATCATCAGCGGCCGCGACGTCATCGCCCAGGCCCAGTCCGGAACCGGCAAGACCTCCATGATCTCGCTCTCCGTCTGCCAGATCGTCGACACCGCCGTCCGAGAGGTTCAGGCCTTGATACTCTCACCAACTAGAGAACTTGCTGCACAAACAGAAAGAGTTATGCTGGCCATTGGTGATTACATCAATATCCAAGTGCATGCTTGTATTGGTGGCAAAAGTATTGGTGAGGATATTAGAAAGCTTGAGCATGGAGTGCATGTTGTGTCAGGAACACCTGGCAGAGTCTGTGATATGATCAAGAGAAGGACCTTGCGTACAAGAGCCATTAAGCTCCTAATTCTGGATGAAGCCGATGAGATGTTGGGCAGAGGCTTTAAGGATCAGATATATGATGTCTACAGATATCTACCCCCAGAGCTCCAGGTTTGCTTGATCTCCGCAACTCTGCCACATGAGATCTTGGAAATGACCAGCAAGTTCATGACTGACCCAGTCCGGATCCTTGTAAAGCGTGATGAATTGACCCTAGAGGGCATCAAACAATTCTTTGTTGCTGTTGAGAAAGAAGAATGGAAGTTTGATACTCTTTGTGATCTTTATGATACACTGACAATCACCCAAGCTGTCATTTTCTGCAACACGAAGAGAAAGGTTGATTGGCTTACAGAAAGAATGCGCAGCAATAACTTCACGGTATCAGCTATGCATGGTGACATGCCTCAAAAGGAAAGGGATGCCATTATGGGTGAATTCAGGTCTGGTGCAACCCGTGTTCTAATTACGACAGATGTGTGGGCTCGAGGCCTGGATGTTCAGCAGGTCTCTCTTGTCATAAACTATGATCTTCCAAATAATCGTGAACTTTACATCCATCGCATTGGTCGCTCTGGACGTTTTGGTCGCAAGGGTGTGGCCATCAATTTTGTCAAAAAGGAAGACATCCGTATCCTGAGAGATATTGAGCAGTACTACAGCACACAGATTGATGAAATGCCAATGAATGTTGCTGATCTAATT
diff -r 000000000000 -r ef6cd36613a8 test-data/species2.faa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/species2.faa Wed Mar 01 10:29:54 2017 -0500
@@ -0,0 +1,8 @@
+>species2_5
+MESQSAVVPLIAELPEKRGGKTLVEEVWEESKKLWEVTGPAAFTGMVLYSMTIVSQAFAGHLGDRHLAAFSIANTVISGLNFGILLGMASALETLCGQAYGAKQYSMMGTYLQRSWLVLLAFAVLLAPTYIFSGQLLMVLGQPAELSREAGLLGMYLLPLHLMFAIQLPLNKFLQCQRKNWVIALSSVLGFPVHVVATWLLAQRFQLGVLGAAMSLNLSWALITGLQLAYAVGGGCPETWRGFSSSAFMGLKDFVSLSVASGVMTCLESWYYRLLIFLTAYAKNAELAVDALSICLSWAGWEMMIHFGFLAGTGVRVANELGANNGRAAKFATIVSTTTSFLICLLISSLALIFHDKLAILFTSSEAVIDAVDGISVLLALTILLNGIQPVLSGVAVGSGWQALVAYVNIGSYYIIGVPFGVLLAWGFHYGVLGIWVGMIGGTMVQTLILSFITLRCDWNEEALKASSRMRTWSSSK
+>species2_6
+MEENRSDIPLISGSELPDRRGGGKISELAKEVWGESKKLWVVAGPAAFTRLTFYGMTVVSQAFAGHIGDLELAAFSIATTVISGLSFGFFVGMASAMETLCGQAYGAKQYHMMGIYLQRSWLILLSFAVLLTPTYIFSEQLLTALGQPAELSRQAGLVSLYMLPLHFVYAIVLPLNKFLQCQRKNWVAAVTTAAAFPVHVVATWLLVRCFRLGVFGAAMALTLSWALATVGLLSYALGGGCPETWRGFSASAFVDLKDFIKLSAASGVMLCLENWYYRILVFLTGYVKNAELAVDALSICISYAGWEMMIHLGFLAGTGVRVANELGAANGARARFATIVSMTTSFLISLFISLLILIFHDKLGMIFSSSQAVIDAVDNISFLLALTILLNGIQPVLSGVAVGSGWQALVAYVNIGSYYLIGVPFGFLLGWGLHYGVQGIWVGMIVGTMVQTLILAYITLRCDWNEEALKASTRMRRWSNSK
+>species2_9
+MGTLGGHVAPGAFFFLIGLWHLFGHSRLFLLQRGSYVAPVWFPVPGVRHIELIMIIIGSVISVSMELVIVQPKHQPFDDDGTIPSVHLHNFEHASISLAWLVFAAATIHMDRVRAPMRDAVSQLAAAAAFAQQLLIFHFHSADHAGVQGRYHRLLEMVVAVTLAASLLLIPYQRSIALSLVRSASLVFQGVWFTVMGVMMWTPALVPKGCFMNDEDGLQVVRCRTDEALDRAKSLVNLQFNWYLTGTVAFVVVFYLQMAKQYQEQPQYAPLVKGGRGSDGRCTIGEVNDDEDDLEASKGGLGYIEIER
+>species2_10
+MGTLVGHVAPGAGFLLIGLWQLFSHIRLFLLRPSSYSAPVWFPAPGVRHLELILIIIGAAMSILMELVIGPAKHQPFDDDGTIPSDHLHNFEHASISLALLVFAAVTIHLDRVKAPLRDAVSQLVAAAAFAQQLLIFHLHSADHMGVEGQFHWLLQTVIAVTLATTLLGIPYPRSIVVSLVRSASLVLQGVWFVVMGVMLWTPALIPKGCFLNLEEGHDVVRCRTDEALDRAKSLVNLQFSWYLTGTVVFVVLFYLQMAKLYPEEPQYLPLVKGGGGGGDDRDSRFSIGDDDHDDEDDVEAAKRGFGHVVSGTKPVEIER
diff -r 000000000000 -r ef6cd36613a8 test-data/species2.fna
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/species2.fna Wed Mar 01 10:29:54 2017 -0500
@@ -0,0 +1,8 @@
+>species2_5
+ATGGAGAGTCAGAGCGCCGTCGTCCCGCTCATTGCCGAGCTCCCGGAGAAGCGGGGAGGCAAAACCCTGGTGGAGGAGGTATGGGAGGAGTCCAAGAAGCTGTGGGAAGTCACCGGCCCGGCCGCCTTTACGGGGATGGTACTCTACAGCATGACCATCGTCAGCCAGGCCTTCGCCGGCCACCTTGGTGACCGCCATCTCGCCGCTTTCTCCATCGCCAACACCGTCATATCTGGCCTTAACTTTGGCATTTTGCTTGGCATGGCGAGTGCGCTGGAGACATTATGCGGCCAAGCCTACGGTGCAAAGCAGTACTCGATGATGGGCACCTATCTCCAGCGCTCATGGCTCGTCCTCCTCGCCTTCGCGGTGCTCCTTGCTCCGACGTACATCTTCAGCGGGCAGCTGCTCATGGTCCTGGGCCAGCCCGCCGAGCTGTCTCGCGAGGCGGGCTTGCTCGGCATGTACCTGCTCCCGCTGCACCTCATGTTTGCCATCCAGCTGCCGCTCAACAAGTTCTTGCAGTGCCAGCGCAAGAACTGGGTCATCGCGCTGTCCTCGGTGCTGGGTTTCCCGGTGCACGTCGTGGCGACCTGGCTGCTGGCGCAGCGCTTTCAGCTTGGCGTCCTGGGCGCAGCGATGTCACTCAACCTGTCCTGGGCGCTCATCACGGGCCTGCAGCTCGCGTACGCTGTTGGCGGTGGGTGCCCAGAGACGTGGAGAGGGTTCTCGTCGTCGGCATTCATGGGCTTGAAGGACTTCGTCAGCTTGTCCGTCGCGTCGGGAGTCATGACGTGCTTGGAGAGTTGGTACTACCGGTTATTGATTTTCCTAACGGCGTACGCGAAGAACGCAGAATTGGCTGTGGATGCACTGTCTATCTGCTTGAGTTGGGCTGGATGGGAGATGATGATTCATTTCGGGTTCTTAGCAGGCACTGGGGTGAGGGTTGCCAATGAGCTAGGCGCCAATAATGGACGAGCTGCAAAGTTTGCGACGATCGTGTCCACGACGACATCATTCCTGATCTGCCTCTTAATTAGTTCACTCGCACTCATTTTCCATGACAAACTCGCAATACTGTTCACGTCTAGTGAGGCTGTGATCGATGCAGTTGACGGTATTTCTGTTCTGCTAGCCCTCACCATCCTCCTCAATGGCATCCAACCTGTGCTATCCGGAGTTGCCGTTGGTTCAGGGTGGCAAGCGCTAGTTGCGTATGTGAACATTGGGAGCTACTACATTATCGGTGTTCCTTTCGGTGTTCTGCTAGCATGGGGTTTCCACTACGGGGTCCTTGGCATTTGGGTTGGAATGATCGGTGGCACGATGGTGCAAACTCTGATTCTTTCATTTATCACCTTACGATGCGACTGGAATGAAGAGGCACTGAAAGCTTCTAGCAGAATGCGGACATGGAGCAGCTCCAAG
+>species2_6
+ATGGAGGAGAATCGGAGCGATATCCCGCTCATCTCCGGCTCCGAGCTGCCGGACAGGAGGGGAGGAGGCAAGATCTCCGAGCTTGCGAAGGAGGTATGGGGAGAGTCCAAGAAGCTGTGGGTGGTCGCCGGCCCGGCCGCGTTCACGAGGCTGACATTCTATGGCATGACCGTGGTCAGCCAGGCCTTTGCCGGGCACATCGGTGACCTCGAGCTCGCCGCCTTCTCCATAGCCACCACCGTCATTTCTGGTCTCAGCTTTGGCTTCTTTGTTGGCATGGCGAGTGCAATGGAGACGCTGTGCGGCCAAGCCTACGGTGCAAAGCAGTACCACATGATGGGCATCTACCTGCAGCGCTCGTGGCTCATCCTCCTCAGCTTCGCCGTGCTTCTTACTCCGACCTACATCTTCAGCGAGCAGCTGCTCACCGCGCTGGGCCAGCCCGCCGAGCTGTCGCGCCAGGCGGGCTTGGTCAGCCTGTACATGCTCCCGCTGCACTTCGTCTACGCCATCGTCCTGCCGCTCAACAAGTTCCTGCAGTGCCAGCGCAAGAACTGGGTCGCCGCGGTCACCACGGCCGCGGCGTTCCCCGTTCACGTCGTCGCCACCTGGCTGCTGGTGCGTTGCTTCCGGCTCGGGGTCTTTGGAGCAGCGATGGCGCTCACCCTGTCCTGGGCACTCGCCACGGTGGGTCTCCTCTCGTATGCCTTGGGCGGCGGGTGCCCGGAGACGTGGAGGGGATTCTCAGCTTCTGCCTTCGTGGACTTGAAGGACTTCATCAAGTTGTCCGCGGCGTCTGGTGTCATGCTCTGCTTGGAGAATTGGTACTACCGGATCTTGGTTTTCCTGACGGGCTATGTGAAGAACGCTGAACTGGCTGTCGATGCACTGTCCATCTGTATAAGTTATGCTGGATGGGAGATGATGATTCATTTGGGATTCTTAGCAGGCACTGGGGTGAGGGTGGCTAATGAGCTCGGTGCAGCCAACGGAGCACGAGCGAGATTTGCGACAATTGTGTCGATGACGACATCATTTCTGATCAGCCTATTCATTAGTTTGCTCATCCTGATTTTCCATGACAAACTCGGAATGATCTTCTCGTCGAGTCAGGCTGTGATTGATGCAGTAGACAACATTTCCTTTCTGCTGGCCCTCACCATCCTCCTCAACGGAATCCAACCTGTGCTCTCTGGAGTTGCTGTTGGCTCAGGGTGGCAGGCATTGGTTGCTTATGTCAACATTGGGAGCTATTACTTGATTGGTGTTCCTTTCGGTTTTCTGCTAGGATGGGGCTTGCATTATGGGGTTCAAGGAATTTGGGTCGGAATGATCGTTGGCACAATGGTGCAAACTCTAATACTGGCATATATCACTCTACGGTGTGATTGGAATGAAGAGGCATTGAAAGCTAGTACCCGAATGCGGAGATGGAGCAACTCCAAG
+>species2_9
+ATGGGCACACTAGGCGGGCACGTCGCGCCGGGCGCCTTCTTCTTCCTCATCGGCCTGTGGCATCTGTTCGGCCACAGCCGCCTGTTCTTGCTACAGCGGGGCTCCTACGTGGCTCCGGTGTGGTTCCCGGTGCCGGGCGTCCGTCACATCGAGCTCATAATGATAATAATCGGCTCGGTGATCTCCGTCTCGATGGAGCTCGTCATCGTGCAGCCGAAGCACCAGCCGTTCGACGACGACGGCACCATCCCCAGCGTCCACCTGCACAACTTCGAGCACGCGTCCATCTCGCTGGCGTGGCTCGTCTTCGCCGCCGCCACCATCCACATGGACAGGGTCCGGGCGCCGATGCGGGACGCGGTGTCGCAGCTGGCGGCCGCGGCCGCGTTCGCGCAGCAGCTGCTCATCTTCCACTTCCACTCCGCGGACCACGCGGGCGTGCAGGGGCGGTACCACCGTCTGCTGGAGATGGTGGTCGCCGTCACGCTCGCCGCCTCGCTGCTCTTGATCCCCTACCAACGGAGCATCGCGCTGAGCCTGGTCCGCTCGGCCAGCCTCGTGTTCCAGGGCGTCTGGTTCACCGTCATGGGCGTCATGATGTGGACGCCGGCGCTCGTCCCCAAAGGCTGCTTCATGAACGACGAAGATGGCCTCCAAGTCGTCCGGTGCCGCACCGACGAGGCGCTCGACCGCGCCAAGTCGCTCGTCAACCTGCAGTTCAACTGGTACCTGACCGGCACCGTGGCGTTCGTCGTCGTGTTCTACCTCCAGATGGCCAAGCAGTACCAGGAGCAGCCGCAGTACGCTCCGCTGGTGAAGGGAGGGAGAGGCAGCGATGGCCGGTGCACCATCGGAGAGGTCAATGACGACGAGGATGACCTTGAGGCCTCCAAAGGAGGCTTAGGATATATCGAAATTGAGAGG
+>species2_10
+ATGGGCACTCTCGTCGGGCACGTCGCGCCGGGCGCCGGCTTCCTCCTCATCGGCCTGTGGCAGCTATTCAGCCACATCCGCCTGTTCCTGCTGCGCCCGAGCTCGTACTCTGCTCCGGTCTGGTTCCCGGCGCCGGGCGTGCGCCACCTCGAGCTCATACTCATCATCATCGGCGCGGCGATGTCCATCCTGATGGAGCTCGTCATCGGCCCCGCGAAGCACCAGCCGTTCGACGACGACGGCACCATCCCGTCAGACCACCTCCACAACTTCGAGCACGCGTCCATCTCGCTGGCGCTGCTCGTCTTCGCCGCGGTCACCATCCACCTCGACAGGGTAAAGGCGCCCCTGCGTGACGCCGTGTCGCAGCTCGTCGCCGCCGCGGCGTTCGCGCAGCAGCTGCTCATCTTCCACCTCCACTCGGCGGACCACATGGGCGTGGAGGGGCAGTTCCACTGGCTGCTGCAGACGGTCATCGCCGTCACGCTCGCCACCACGCTGCTCGGGATCCCTTACCCGCGGAGCATCGTGGTGAGCCTTGTCCGGTCGGCCAGCCTCGTGCTCCAGGGCGTCTGGTTCGTCGTCATGGGCGTCATGCTGTGGACGCCGGCGCTCATACCCAAGGGCTGCTTCCTCAACCTCGAGGAAGGGCACGACGTCGTCCGGTGCCGCACCGACGAGGCGCTCGACCGCGCCAAGTCGCTCGTCAACCTGCAGTTCAGCTGGTACCTCACCGGCACGGTGGTGTTCGTCGTCCTGTTCTACCTCCAGATGGCGAAGCTCTACCCCGAGGAGCCGCAGTATTTGCCGCTGGTGAAGGGAGGAGGCGGCGGCGGCGATGACCGCGATAGCCGGTTCAGCATCGGAGACGATGATCACGACGATGAGGACGATGTCGAGGCTGCAAAACGTGGCTTCGGACACGTGGTTAGCGGCACAAAGCCTGTCGAAATCGAGAGG
diff -r 000000000000 -r ef6cd36613a8 tool_data_table_conf.xml.sample
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_data_table_conf.xml.sample Wed Mar 01 10:29:54 2017 -0500
@@ -0,0 +1,6 @@
+
+
+ value, name, path, description
+
+
+