# HG changeset patch # User galaxyp # Date 1505420096 14400 # Node ID 8eb27726271529fba0a82cd5a37c23155adb3c70 planemo upload commit dd9bf5d878d54362e928a834956feedf082960f3 diff -r 000000000000 -r 8eb277262715 test-data/fastaFilteringTest_IN.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/fastaFilteringTest_IN.fasta Thu Sep 14 16:14:56 2017 -0400 @@ -0,0 +1,84 @@ +>MCHU - Calmodulin - Human, rabbit, bovine, rat, and chicken +ADQLTEEQIAEFKEAFSLFDKDGDGTITTKELGTVMRSLGQNPTEAELQDMINEVDADGNGTID +FPEFLTMMARKMKDTDSEEEIREAFRVFDKDGNGYISAAELRHVMTNLGEKLTDEEVDEMIREA +DIDGDGQVNYEEFVQMMTAK* +>gi||||5524211gbAAD44166.1 cytochrome b [Elephas maximus maximus] +LCLYTHIGRNIYYGSYLYSETWNTGIMLLLITMATAFMGYVLPWGQMSFWGATVITNLFSAIPYIGTNLV +EWIWGGFSVDKATLNRFFAFHFILPFTMVALAGVHLTFLHETGSNNPLGLTSDSDKIPFHPYYTIKDFLG +LLILILLLLLLALLSPDMLGDPDNHMPADPLNTPLHIKPEWYFLFAYAILRSVPNKLGGVLALFLSIVIL +GLMPFLHTSKHRSMMLRPLSQALFWTLTMDLLTLTWIGSQPVEYPYTIIGQMASILYFSIILAFLPIAGX +IENY +>gi||||5523211gbAAD44166.1 cytochrome b [Elephas maximus maximus] +LCLYTHIGRNIYYGSYLYSETWNTGIMLLLITMATAFMGYVLPWGQMSFWGATVITNLFSAIPYIGTNLV +EWIWGGFSVDKATLNRFFAFHFILPFTMVALAGVHLTFLHETGSNNPLGLTSDSDKIPFHPYYTIKDFLG +LLILILLLLLLALLSPDMLGDPDNHMPADPLNTPLHIKPEWYFLFAYAILRSVPNKLGGVLALFLSIVIL +GLMPFLHTSKHRSMMLRPLSQALFWTLTMDLLTLTWIGSQPVEYPYTIIGQMASILYFSIILAFLPIAGX +IENY +>gi||||5524201gbAAD44166.1 cytochrome b [Elephas maximus maximus] +LCLYTHIGRNIYYGSYLYSETWNTGIMLLLITMATAFMGYVLPWGQMSFWGATVITNLFSAIPYIGTNLV +EWIWGGFSVDKATLNRFFAFHFILPFTMVALAGVHLTFLHETGSNNPLGLTSDSDKIPFHPYYTIKDFLG +LLILILLLLLLALLSPDMLGDPDNHMPADPLNTPLHIKPEWYFLFAYAILRSVPNKLGGVLALFLSIVIL +GLMPFLHTSKHRSMMLRPLSQALFWTLTMDLLTLTWIGSQPVEYPYTIIGQMASILYFSIILAFLPIAGX +IENY +>gi||||5524212gbAAD44166.1 cytochrome b [Elephas maximus maximus] +LCLYTHIGRNIYYGSYLYSETWNTGIMLLLITMATAFMGYVLPWGQMSFWGATVITNLFSAIPYIGTNLV +EWIWGGFSVDKATLNRFFAFHFILPFTMVALAGVHLTFLHETGSNNPLGLTSDSDKIPFHPYYTIKDFLG +LLILILLLLLLALLSPDMLGDPDNHMPADPLNTPLHIKPEWYFLFAYAILRSVPNKLGGVLALFLSIVIL +GLMPFLHTSKHRSMMLRPLSQALFWTLTMDLLTLTWIGSQPVEYPYTIIGQMASILYFSIILAFLPIAGX +IENY +>gi||||5523511gbAAD44166.1 cytochrome b [Elephas maximus maximus] +LCLYTHIGRNIYYGSYLYSETWNTGIMLLLITMATAFMGYVLPWGQMSFWGATVITNLFSAIPYIGTNLV +EWIWGGFSVDKATLNRFFAFHFILPFTMVALAGVHLTFLHETGSNNPLGLTSDSDKIPFHPYYTIKDFLG +LLILILLLLLLALLSPDMLGDPDNHMPADPLNTPLHIKPEWYFLFAYAILRSVPNKLGGVLALFLSIVIL +GLMPFLHTSKHRSMMLRPLSQALFWTLTMDLLTLTWIGSQPVEYPYTIIGQMASILYFSIILAFLPIAGX +IENY +>gi||||5524299gbAAD44166.1 cytochrome b [Elephas maximus maximus] +LCLYTHIGRNIYYGSYLYSETWNTGIMLLLITMATAFMGYVLPWGQMSFWGATVITNLFSAIPYIGTNLV +EWIWGGFSVDKATLNRFFAFHFILPFTMVALAGVHLTFLHETGSNNPLGLTSDSDKIPFHPYYTIKDFLG +LLILILLLLLLALLSPDMLGDPDNHMPADPLNTPLHIKPEWYFLFAYAILRSVPNKLGGVLALFLSIVIL +GLMPFLHTSKHRSMMLRPLSQALFWTLTMDLLTLTWIGSQPVEYPYTIIGQMASILYFSIILAFLPIAGX +IENY +>gi||||5524871gbAAD44166.1 cytochrome b [Elephas maximus maximus] +LCLYTHIGRNIYYGSYLYSETWNTGIMLLLITMATAFMGYVLPWGQMSFWGATVITNLFSAIPYIGTNLV +EWIWGGFSVDKATLNRFFAFHFILPFTMVALAGVHLTFLHETGSNNPLGLTSDSDKIPFHPYYTIKDFLG +LLILILLLLLLALLSPDMLGDPDNHMPADPLNTPLHIKPEWYFLFAYAILRSVPNKLGGVLALFLSIVIL +GLMPFLHTSKHRSMMLRPLSQALFWTLTMDLLTLTWIGSQPVEYPYTIIGQMASILYFSIILAFLPIAGX +IENY +>gi||||5524741gbAAD44166.1 cytochrome b [Elephas maximus maximus] +LCLYTHIGRNIYYGSYLYSETWNTGIMLLLITMATAFMGYVLPWGQMSFWGATVITNLFSAIPYIGTNLV +EWIWGGFSVDKATLNRFFAFHFILPFTMVALAGVHLTFLHETGSNNPLGLTSDSDKIPFHPYYTIKDFLG +LLILILLLLLLALLSPDMLGDPDNHMPADPLNTPLHIKPEWYFLFAYAILRSVPNKLGGVLALFLSIVIL +GLMPFLHTSKHRSMMLRPLSQALFWTLTMDLLTLTWIGSQPVEYPYTIIGQMASILYFSIILAFLPIAGX +IENY +>sp|Q01912|1A1C_VIGRR 1-aminocyclopropane-1-carboxylate synthase (Fragment) OS=Vigna radiata var. radiata GN=ACS5 PE=2 SV=1 +QMGLAENQLTSDLVEDWILNNPEASICTPEGINDFRAIANFQDYHGLAEFRNAVAKFMAR +TRGNRITFDPDRIVMSGGATGAHEVTAFCLADPGEAFLVPIPYYPGFDRDLRWRTGVKLV +PVMCDSSNNFVLTKEALEDAYEKAREDNIRVKGLLITNPSNPLGTIMDRKTLRTVVSFIN +EKRIHLVCDEIYAATVFSQPGFISIAEILEDETDIECDRNLVHIVYSLSKDMGFPGFRVG +IIYSYNDAVVNCARKMSSFGLVSTQTQYLLASMLNDDEFVERFLAESAKRLAQRFRVFTG +GLAKVGIKCLQSNAGLFVWMDLRQLLKKPTFDSETELWKVIIHEVKINVSPGYSFHCTEP +GWFRVCFA +>sp|B9K206|1A1D_AGRVS 1-aminocyclopropane-1-carboxylate deaminase OS=Agrobacterium vitis (strain S4 / ATCC BAA-846) GN=acdS PE=3 SV=1 +MLDAFDRYPLTFGPTPIEKLERLTDHLGGKVQLYAKREDCNSGLAFGGNKLRKLEYIIPD +AIASGADTLVSIGGVQSNHTRMVAAVAAKIGFKCRLVQEAWVPHEDAVYDRVGNIMLSRI +MGADVRLVDDGFDIGIRRSWEEAIEEVKAAGGKPYAIPAGASVHKYGGLGYVGFAEEVRA +QEAALGFAFDYIVVCTVTGSSHAGMAVGFAKDGRADHVIGIDASFTPDQTRAQVLEIAQR +TADLVKLGREMRPEDIVLVEDYAYPVYGVPSEETKDAIRLVGRLEGMITDPVYEGKSMQG +MIDLVKKGYFPEGSKVLYAHLGGAPALNGYGYAFRNG +>sp|A3ME84|1A1D_BURM7 1-aminocyclopropane-1-carboxylate deaminase OS=Burkholderia mallei (strain NCTC 10247) GN=acdS PE=3 SV=1 +MNLQKFSRYPLTFGPTPIQPLKRLSAHLGGKVELYAKRDDCNSGLAFGGNKTRKLEYLIP +DALAQGCDTLVSIGGIQSNQTRQVAAVAAHLGMKCVLVQENWVNYHDAVYDRVGNIQMSR +MMGADVRLVPDGFDIGFRKSWEDALADVRARGGKPYAIPAGCSDHPLGGLGFVGFAEEVR +AQEAELGFQFDYVVVCSVTGSTQAGMVVGFAADGRADRVIGVDASAKPAQTREQILRIAK +HTADRVELGRDITSADVVLDERFGGPEYGLPNEGTLEAIRLCAKLEGVLTDPVYEGKSMH +GMIEKVRLGEFPAGSKVLYAHLGGVPALNAYSFLFRDG +>sp|Q62CE3|1A1D_BURMA 1-aminocyclopropane-1-carboxylate deaminase OS=Burkholderia mallei (strain ATCC 23344) GN=acdS PE=3 SV=1 +MNLQKFSRYPLTFGPTPIQPLKRLSAHLGGKVELYAKRDDCNSGLAFGGNKTRKLEYLIP +DALAQGCDTLVSIGGIQSNQTRQVAAVAAHLGMKCVLVQENWVNYHDAVYDRVGNIQMSR +MMGADVRLVPDGFDIGFRKSWEDALADVRARGGKPYAIPAGCSDHPLGGLGFVGFAEEVR +AQEAELGFQFDYVVVCSVTGSTQAGMVVGFAADGRADRVIGVDASAKPAQTREQILRIAK +HTADRVELGRDITSADVVLDERFGGPEYGLPNEGTLEAIRLCAKLEGVLTDPVYEGKSMH +GMIEKVRLGEFPAGSKVLYAHLGGVPALNAYSFLFRDG +>BAB62851.1 bcr/abl e8a2 fusion protein, partial [Homo sapiens] from GenBank +LLYKPVDRVTRSTLVLHDLLKHTPASHPDHPLLQDALRISQNFLSSINEEITPRRQSMTVKKGEGEDRMK +ASSTRKRLLLMEEALQRPVASDFEPQGLSEAARWNSKENLLAGPSENDPNLFVALYDFVASGDNTLSITK \ No newline at end of file diff -r 000000000000 -r 8eb277262715 test-data/fastaFilteringTest_OUT1.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/fastaFilteringTest_OUT1.fasta Thu Sep 14 16:14:56 2017 -0400 @@ -0,0 +1,36 @@ +>MCHU - Calmodulin - Human, rabbit, bovine, rat, and chicken +ADQLTEEQIAEFKEAFSLFDKDGDGTITTKELGTVMRSLGQNPTEAELQDMINEVDADGNGTID +FPEFLTMMARKMKDTDSEEEIREAFRVFDKDGNGYISAAELRHVMTNLGEKLTDEEVDEMIREA +DIDGDGQVNYEEFVQMMTAK* +>sp|Q01912|1A1C_VIGRR 1-aminocyclopropane-1-carboxylate synthase (Fragment) OS=Vigna radiata var. radiata GN=ACS5 PE=2 SV=1 +QMGLAENQLTSDLVEDWILNNPEASICTPEGINDFRAIANFQDYHGLAEFRNAVAKFMAR +TRGNRITFDPDRIVMSGGATGAHEVTAFCLADPGEAFLVPIPYYPGFDRDLRWRTGVKLV +PVMCDSSNNFVLTKEALEDAYEKAREDNIRVKGLLITNPSNPLGTIMDRKTLRTVVSFIN +EKRIHLVCDEIYAATVFSQPGFISIAEILEDETDIECDRNLVHIVYSLSKDMGFPGFRVG +IIYSYNDAVVNCARKMSSFGLVSTQTQYLLASMLNDDEFVERFLAESAKRLAQRFRVFTG +GLAKVGIKCLQSNAGLFVWMDLRQLLKKPTFDSETELWKVIIHEVKINVSPGYSFHCTEP +GWFRVCFA +>sp|B9K206|1A1D_AGRVS 1-aminocyclopropane-1-carboxylate deaminase OS=Agrobacterium vitis (strain S4 / ATCC BAA-846) GN=acdS PE=3 SV=1 +MLDAFDRYPLTFGPTPIEKLERLTDHLGGKVQLYAKREDCNSGLAFGGNKLRKLEYIIPD +AIASGADTLVSIGGVQSNHTRMVAAVAAKIGFKCRLVQEAWVPHEDAVYDRVGNIMLSRI +MGADVRLVDDGFDIGIRRSWEEAIEEVKAAGGKPYAIPAGASVHKYGGLGYVGFAEEVRA +QEAALGFAFDYIVVCTVTGSSHAGMAVGFAKDGRADHVIGIDASFTPDQTRAQVLEIAQR +TADLVKLGREMRPEDIVLVEDYAYPVYGVPSEETKDAIRLVGRLEGMITDPVYEGKSMQG +MIDLVKKGYFPEGSKVLYAHLGGAPALNGYGYAFRNG +>sp|A3ME84|1A1D_BURM7 1-aminocyclopropane-1-carboxylate deaminase OS=Burkholderia mallei (strain NCTC 10247) GN=acdS PE=3 SV=1 +MNLQKFSRYPLTFGPTPIQPLKRLSAHLGGKVELYAKRDDCNSGLAFGGNKTRKLEYLIP +DALAQGCDTLVSIGGIQSNQTRQVAAVAAHLGMKCVLVQENWVNYHDAVYDRVGNIQMSR +MMGADVRLVPDGFDIGFRKSWEDALADVRARGGKPYAIPAGCSDHPLGGLGFVGFAEEVR +AQEAELGFQFDYVVVCSVTGSTQAGMVVGFAADGRADRVIGVDASAKPAQTREQILRIAK +HTADRVELGRDITSADVVLDERFGGPEYGLPNEGTLEAIRLCAKLEGVLTDPVYEGKSMH +GMIEKVRLGEFPAGSKVLYAHLGGVPALNAYSFLFRDG +>sp|Q62CE3|1A1D_BURMA 1-aminocyclopropane-1-carboxylate deaminase OS=Burkholderia mallei (strain ATCC 23344) GN=acdS PE=3 SV=1 +MNLQKFSRYPLTFGPTPIQPLKRLSAHLGGKVELYAKRDDCNSGLAFGGNKTRKLEYLIP +DALAQGCDTLVSIGGIQSNQTRQVAAVAAHLGMKCVLVQENWVNYHDAVYDRVGNIQMSR +MMGADVRLVPDGFDIGFRKSWEDALADVRARGGKPYAIPAGCSDHPLGGLGFVGFAEEVR +AQEAELGFQFDYVVVCSVTGSTQAGMVVGFAADGRADRVIGVDASAKPAQTREQILRIAK +HTADRVELGRDITSADVVLDERFGGPEYGLPNEGTLEAIRLCAKLEGVLTDPVYEGKSMH +GMIEKVRLGEFPAGSKVLYAHLGGVPALNAYSFLFRDG +>BAB62851.1 bcr/abl e8a2 fusion protein, partial [Homo sapiens] from GenBank +LLYKPVDRVTRSTLVLHDLLKHTPASHPDHPLLQDALRISQNFLSSINEEITPRRQSMTVKKGEGEDRMK +ASSTRKRLLLMEEALQRPVASDFEPQGLSEAARWNSKENLLAGPSENDPNLFVALYDFVASGDNTLSITK diff -r 000000000000 -r 8eb277262715 test-data/fastaFilteringTest_OUT2.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/fastaFilteringTest_OUT2.fasta Thu Sep 14 16:14:56 2017 -0400 @@ -0,0 +1,48 @@ +>gi||||5524211gbAAD44166.1 cytochrome b [Elephas maximus maximus] +LCLYTHIGRNIYYGSYLYSETWNTGIMLLLITMATAFMGYVLPWGQMSFWGATVITNLFSAIPYIGTNLV +EWIWGGFSVDKATLNRFFAFHFILPFTMVALAGVHLTFLHETGSNNPLGLTSDSDKIPFHPYYTIKDFLG +LLILILLLLLLALLSPDMLGDPDNHMPADPLNTPLHIKPEWYFLFAYAILRSVPNKLGGVLALFLSIVIL +GLMPFLHTSKHRSMMLRPLSQALFWTLTMDLLTLTWIGSQPVEYPYTIIGQMASILYFSIILAFLPIAGX +IENY +>gi||||5523211gbAAD44166.1 cytochrome b [Elephas maximus maximus] +LCLYTHIGRNIYYGSYLYSETWNTGIMLLLITMATAFMGYVLPWGQMSFWGATVITNLFSAIPYIGTNLV +EWIWGGFSVDKATLNRFFAFHFILPFTMVALAGVHLTFLHETGSNNPLGLTSDSDKIPFHPYYTIKDFLG +LLILILLLLLLALLSPDMLGDPDNHMPADPLNTPLHIKPEWYFLFAYAILRSVPNKLGGVLALFLSIVIL +GLMPFLHTSKHRSMMLRPLSQALFWTLTMDLLTLTWIGSQPVEYPYTIIGQMASILYFSIILAFLPIAGX +IENY +>gi||||5524201gbAAD44166.1 cytochrome b [Elephas maximus maximus] +LCLYTHIGRNIYYGSYLYSETWNTGIMLLLITMATAFMGYVLPWGQMSFWGATVITNLFSAIPYIGTNLV +EWIWGGFSVDKATLNRFFAFHFILPFTMVALAGVHLTFLHETGSNNPLGLTSDSDKIPFHPYYTIKDFLG +LLILILLLLLLALLSPDMLGDPDNHMPADPLNTPLHIKPEWYFLFAYAILRSVPNKLGGVLALFLSIVIL +GLMPFLHTSKHRSMMLRPLSQALFWTLTMDLLTLTWIGSQPVEYPYTIIGQMASILYFSIILAFLPIAGX +IENY +>gi||||5524212gbAAD44166.1 cytochrome b [Elephas maximus maximus] +LCLYTHIGRNIYYGSYLYSETWNTGIMLLLITMATAFMGYVLPWGQMSFWGATVITNLFSAIPYIGTNLV +EWIWGGFSVDKATLNRFFAFHFILPFTMVALAGVHLTFLHETGSNNPLGLTSDSDKIPFHPYYTIKDFLG +LLILILLLLLLALLSPDMLGDPDNHMPADPLNTPLHIKPEWYFLFAYAILRSVPNKLGGVLALFLSIVIL +GLMPFLHTSKHRSMMLRPLSQALFWTLTMDLLTLTWIGSQPVEYPYTIIGQMASILYFSIILAFLPIAGX +IENY +>gi||||5523511gbAAD44166.1 cytochrome b [Elephas maximus maximus] +LCLYTHIGRNIYYGSYLYSETWNTGIMLLLITMATAFMGYVLPWGQMSFWGATVITNLFSAIPYIGTNLV +EWIWGGFSVDKATLNRFFAFHFILPFTMVALAGVHLTFLHETGSNNPLGLTSDSDKIPFHPYYTIKDFLG +LLILILLLLLLALLSPDMLGDPDNHMPADPLNTPLHIKPEWYFLFAYAILRSVPNKLGGVLALFLSIVIL +GLMPFLHTSKHRSMMLRPLSQALFWTLTMDLLTLTWIGSQPVEYPYTIIGQMASILYFSIILAFLPIAGX +IENY +>gi||||5524299gbAAD44166.1 cytochrome b [Elephas maximus maximus] +LCLYTHIGRNIYYGSYLYSETWNTGIMLLLITMATAFMGYVLPWGQMSFWGATVITNLFSAIPYIGTNLV +EWIWGGFSVDKATLNRFFAFHFILPFTMVALAGVHLTFLHETGSNNPLGLTSDSDKIPFHPYYTIKDFLG +LLILILLLLLLALLSPDMLGDPDNHMPADPLNTPLHIKPEWYFLFAYAILRSVPNKLGGVLALFLSIVIL +GLMPFLHTSKHRSMMLRPLSQALFWTLTMDLLTLTWIGSQPVEYPYTIIGQMASILYFSIILAFLPIAGX +IENY +>gi||||5524871gbAAD44166.1 cytochrome b [Elephas maximus maximus] +LCLYTHIGRNIYYGSYLYSETWNTGIMLLLITMATAFMGYVLPWGQMSFWGATVITNLFSAIPYIGTNLV +EWIWGGFSVDKATLNRFFAFHFILPFTMVALAGVHLTFLHETGSNNPLGLTSDSDKIPFHPYYTIKDFLG +LLILILLLLLLALLSPDMLGDPDNHMPADPLNTPLHIKPEWYFLFAYAILRSVPNKLGGVLALFLSIVIL +GLMPFLHTSKHRSMMLRPLSQALFWTLTMDLLTLTWIGSQPVEYPYTIIGQMASILYFSIILAFLPIAGX +IENY +>gi||||5524741gbAAD44166.1 cytochrome b [Elephas maximus maximus] +LCLYTHIGRNIYYGSYLYSETWNTGIMLLLITMATAFMGYVLPWGQMSFWGATVITNLFSAIPYIGTNLV +EWIWGGFSVDKATLNRFFAFHFILPFTMVALAGVHLTFLHETGSNNPLGLTSDSDKIPFHPYYTIKDFLG +LLILILLLLLLALLSPDMLGDPDNHMPADPLNTPLHIKPEWYFLFAYAILRSVPNKLGGVLALFLSIVIL +GLMPFLHTSKHRSMMLRPLSQALFWTLTMDLLTLTWIGSQPVEYPYTIIGQMASILYFSIILAFLPIAGX +IENY diff -r 000000000000 -r 8eb277262715 test-data/geneticFiltering.in --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/geneticFiltering.in Thu Sep 14 16:14:56 2017 -0400 @@ -0,0 +1,8 @@ +>generic|001 +ACTGACTG +>generic|002 +ACUGACUG +>generic|003 +MKMMMMM +>generic|004 +MKMMMMMX \ No newline at end of file diff -r 000000000000 -r 8eb277262715 test-data/geneticFilteringBad.out --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/geneticFilteringBad.out Thu Sep 14 16:14:56 2017 -0400 @@ -0,0 +1,6 @@ +>generic|001 +ACTGACTG +>generic|002 +ACUGACUG +>generic|004 +MKMMMMMX \ No newline at end of file diff -r 000000000000 -r 8eb277262715 test-data/geneticFilteringGood.out --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/geneticFilteringGood.out Thu Sep 14 16:14:56 2017 -0400 @@ -0,0 +1,2 @@ +>generic|003 +MKMMMMM \ No newline at end of file diff -r 000000000000 -r 8eb277262715 test-data/length5Filtering.in --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/length5Filtering.in Thu Sep 14 16:14:56 2017 -0400 @@ -0,0 +1,6 @@ +>generic|001 +MMMMMMMMMM +>generic|002 +MMMMM +>generic|003 +MMMM \ No newline at end of file diff -r 000000000000 -r 8eb277262715 test-data/length5FilteringBad.out --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/length5FilteringBad.out Thu Sep 14 16:14:56 2017 -0400 @@ -0,0 +1,2 @@ +>generic|003 +MMMM \ No newline at end of file diff -r 000000000000 -r 8eb277262715 test-data/length5FilteringGood.out --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/length5FilteringGood.out Thu Sep 14 16:14:56 2017 -0400 @@ -0,0 +1,4 @@ +>generic|001 +MMMMMMMMMM +>generic|002 +MMMMM \ No newline at end of file diff -r 000000000000 -r 8eb277262715 validate_fasta_database.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/validate_fasta_database.xml Thu Sep 14 16:14:56 2017 -0400 @@ -0,0 +1,106 @@ + + + validate-fasta-database + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +sw|" or ">SW|") + * NCBI (starts with ">gi|" or ">GI|") + * Halobacterium from Max Planck (starts with "OE") + * H Influenza, from Novartis (starts with ">hflu_") + * C Trachomatis (starts with ">C.tr\_" or "C\_trachomatis\_") + * M Tuberculosis (starts with ">M. tub") + * Saccharomyces Genome Database (contains "SGDID") + * Genome translation (ex. ">dm345\_3L-sense [2343534-234353938]") + * Genome Annotation Framework for Flexible Analysis (GAFFA) (starts with ">GAFFA") + * UPS (contains "\_HUMAN\_UPS") + +Many sequences are reported as Generic, which may or may not allow for extraction of the accession number. +]]> + + + + @misc{fastaValidationTool, + author = {The GalaxyP Team}, + date = {22 June 2017}, + title = {FASTA Database Validation Tool} + } + + +