diff test-data/AASequences.fasta @ 25:ea9ae5b25ce1 draft default tip

planemo upload for repository https://github.com/iracooke/protk-galaxytools/blob/master/omssa/.shed.yml commit 24e0fef2496984648a8a5cd5bff4d6b9b634a302-dirty
author iracooke
date Tue, 20 Oct 2015 20:31:23 -0400
parents
children
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/AASequences.fasta	Tue Oct 20 20:31:23 2015 -0400
@@ -0,0 +1,204 @@
+>tr|O70238|O70238_MOUSE Homeobox protein PSX OS=Mus musculus GN=Rhox6 PE=2 SV=2
+METPQDSRQSIQKPPSPAAEEDKEEQPGGNAVVSGAPEERIDKKELVLNWLAQGEFDQGE
+GAQGEVAGGEQAQEEPAPLSPAQEATGGEEEGENKEGEMEGRHAGDGASSSEDDSILEEG
+GENIDQQPPQQEAASPDSIRNPHVLNRLAQLRYRRTRFTHSQLHDLERLFQETRYPSLRA
+RRDLARWMGVDECDVQNWFRMRRALFQRNRRVLMFCELPPLPQSDSP
+>sp|P20269|HM05_CAEEL Homeobox protein ceh-5 OS=Caenorhabditis elegans GN=ceh-5 PE=2 SV=4
+MPSADTEFIRVIRIKSANGSEKMLEIPAKLDLERPKRPRTVFTDEQLEKLEESFNTSGYL
+SGSTRAKLAESLGLSDNQVKVWFQNRRTKQKKIDSRDPIKPETLKPAENYQNVYQNYQNY
+WTAAAFLSNNVISS
+>sp|P34663|HM23_CAEEL Homeobox protein ceh-23 OS=Caenorhabditis elegans GN=ceh-23 PE=2 SV=1
+MDTHLPFQTLPVSTPLPVSSSSLTDVLQTIAALQACPTSCIPSTSTGMLSPNLPFSATIP
+RVNLFPPSQPANSLILPTIPAQPFIPNPSLLQANPSAVEALANALFATTSRRASCPEPPA
+SSQATVTLQVPSTGSPERRRYSETNMEVLLREQLAQLMPPTSQLPGMPGCYYQHVPAAGT
+SGIQGSLDAALMGAVPLAMNSMAHSRRAANHRKARTIYGTTQTQQLEDMFKGQMYVVGAE
+RENLAQRLGLSPSQVRIWFQNRRSKHRRKQQEEQQSTTLEEKSEEIGKDEEEDDEEDEDD
+VKVLN
+>sp|P52955|LBX1_MOUSE Transcription factor LBX1 OS=Mus musculus GN=Lbx1 PE=1 SV=2
+MTSKEDGKAAPGEERRRSPLDHLPPPANSNKPLTPFSIEDILNKPSVRRSYSLCGAAHLL
+AAADKHAPGGLPLAGRALLSQTSPLCALEELASKTFKGLEVSVLQAAEGRDGMTIFGQRQ
+TPKKRRKSRTAFTNHQIYELEKRFLYQKYLSPADRDQIAQQLGLTNAQVITWFQNRRAKL
+KRDLEEMKADVESAKKLGPSGQMDIVALAELEQNSEASGGGGGGGCGRAKSRPGSPALPP
+GAPQAPGGGPLQLSPASPLTDQRASSQDCSEDEEDEEIDVDD
+>sp|Q26604|SMOX5_SCHMA Homeobox protein SMOX-5 OS=Schistosoma mansoni GN=SMOX-5 PE=2 SV=1
+MTTSTMQQLKHDGDFSDELNETSTIQFYNKVSQQRKRRKTRTTFSNCQLNELENNFNRQR
+YLTPTDRDRIAKHLGLTNTQVITWFQNRRAKLKREAEELERDVMALRKQKQQKFTCLSLS
+DHDHEETQIDDENEQGDNNNDDDGDDNDVEEDDGEEQEKNHTKYLTQPPSISNILPSSLK
+HFPSSTLNTLEIDNKHETLNMNLFINPFSNEKCLKRNKDLIRQQCYLFNHHINNYCTVNN
+DNNINNNNNNNNRKNSIDGMNKGRSIKKGNKIWCPALELEQEIH
+>tr|O77024|O77024_EPHMU EmH-3 (Fragment) OS=Ephydatia muelleri GN=EmH-3 PE=3 SV=1
+MDNCRGDKKPLLSTNQQSFRIDNLLTRKVIEQQQQPDHYTMYPPSKVENHDILSLTTGPS
+HDDMISDGTEIYEQGRESTSSTSGNDAEDDLLTRRKKARTAFSREQVAELEKKFQDKKYL
+SSAERGELAEKLKLSDMQVKTWFQNRRMKYKRQSEETEMEMKSPKY
+>sp|O93367|TLX3_CHICK T-cell leukemia homeobox protein 3 OS=Gallus gallus GN=TLX3 PE=2 SV=1
+MEPAAGAQGPHQHEPISFGIDQILSGPEQDGAPPPPPPPPPPPPPPPPPPRGPDGAAFLG
+GPRGGAPYPALPGPFPAIAAPFEESGPYGVNLSLAPGGVIRVPAHRPIPGAVPPPVPSAI
+PAVPGLGGLSFPWMESSRRFVKERFTAAAALTPFTVTRRIGHPYQNRTPPKRKKPRTSFS
+RVQICELEKRFHRQKYLASAERAALAKSLKMTDAQVKTWFQNRRTKWRRQTAEEREAERQ
+QASRLMLQLQHDAFQKSLNESIQPDPLCLHNSSLFALQNLQPWEEESAKIPPVTSLV
+>sp|P56407|HM09_CAEEL Homeobox protein ceh-9 OS=Caenorhabditis elegans GN=ceh-9 PE=4 SV=2
+METDLLFQLLQPYFALLTSDVKPQRRTSHLIKDILDLPTVNGEIDEFGRCKSSLDQAKES
+PIEKCQKTKRKKARTTFSGKQVFELEKQFEAKKYLSSSDRSELAKRLDVTETQVKIWFQN
+RRTKWKKIESEKERSGEIPDDQIVKPQ
+>tr|Q24786|Q24786_9METZ Homeobox-containing protein (Fragment) OS=Ephydatia fluviatilis GN=prox1 PE=3 SV=1
+NSDEDKDRYASDLDTDRASSAGGALQMSRHKKRRPRALFSHAQVYELERRFAVQKYLTAH
+EQSKLATVLHLTETQVKIWFQNRRYKSKRQQIEQTRVSPKVVKTSRMVRCSSGYITAI
+>sp|O35767|NKX25_RAT Homeobox protein Nkx-2.5 OS=Rattus norvegicus GN=Nkx2-5 PE=2 SV=1
+MFPSPALTHTPFSVKDILNLEQQQRSLAAGDLSARLEATLAPASCMLAAFKPDGYSGPEA
+AAPGLAELRAELGPAPSPPKCSPAFPTAPTFYPRAYGDPDPAKDPRADKKELCALQKAVE
+LDKAETDGAERRRPRRRRKPRVLFSQAQVYELERRFKQQRYLSPAERDQLASVLKLTSTQ
+VKIWFQNRRYKCKRQRQDQTLELLGPPPPPARRIAVPVLVRDGKPCLGDSAAYAPAYGLG
+LNAYGYNAYPYPGYGGAACSPAYSCAAYPAAPPAAHAPAASANSNFVNFGVGDLNTVQSP
+GMPQGNSGVSTLHGIRAW
+>tr|Q9YH59|Q9YH59_CHICK Homeodomain protein NKx2.1 OS=Gallus gallus GN=NKx2.1 PE=2 SV=1
+MSMSPKHTTPFSVSDILSPWEESYKKVGMEGSNLGAPLSAYRQSQVSQPAMQQHPMGHNG
+TVTAAYHMTAAGVPQLSHATMGGYCNGNLGNMSELPPYQDTMRNSASATGWYGTNPDPRF
+SSISRFMAPSSGMNMGGMGGLSSLGDVSKSMAPLQSTPRRKRRVLFSQAQVYELERRFKQ
+QKYLSAPEREHLASMIHLTPTQVKIWFQNHRYKMKRQAKDKAAHEMQQENGSCQQQQSPR
+RVAVPVLVKDGKPCQAGSNTPTAAIQSHPQQAATTITVATNGNSLGQHQSHQTNSAGQSP
+DMGQHSASPSSLQSQVSSLSHLNSSTSDYGTAMSCSTLLYGRTW
+>tr|O35455|O35455_MOUSE Homeobox protein Nkx2.6 (Fragment) OS=Mus musculus GN=Nkx2-6 PE=2 SV=1
+VGAPGRQSWRWARILWGSHVKTPPGTISRLGARNPMTDRGVGNLSGDMRRGGPVSTRTRP
+QRKSRVLFSQAQVLALERRFKQQRYLTAPEREHLASALQLTSTQVKIWFQNRRYKSKSQR
+QDQNLELAGHPLAPRPGSSASTGTGRQPLPGSDVAAFLVPTKPPRPIPASVATRALPTTL
+AMRAAAPAPAPAPGRSHHWPALASAQVAKVRLRRAICPLRLRESRPGEKPELTYCHSVPD
+AWSPPLPAGGRGAGKHCPPY
+>sp|P22711|TIN_DROME Muscle-specific homeobox protein tinman OS=Drosophila melanogaster GN=tin PE=2 SV=2
+MLQHHQQQAQSGGYYDHYTQSPSPGSLTNADALNTTPFSVKDILNMVNQTEAYEGSYGHI
+DGAATASALFAAGEYQNPHQYLNHQQHQQSELPIPQQQLHHQHLDDGATTSSSLSPLLPP
+PPHQLYGGYQDYGMPAHMFQHHHGHPHQSFQHSASAYNMSASQFYAGASATAYQTPATYN
+YNYAGSGEVYGGATPSAVGIKSEYIPTPYVTPSPTLDLNSSAEVDSLQAPTQKLCVNPLS
+QRLMETASNSSSLRSIYGSDEGAKKKDNSQVTSSRSELRKNSISGNSNPGSNSGSTKPRM
+KRKPRVLFSQAQVLELECRFRLKKYLTGAEREIIAQKLNLSATQVKIWFQNRRYKSKRGD
+IDCEGIAKHLKLKSEPLDSPTSLPPPIPNHVMWPPTMQQSQQQQQHHAQQQQMQHM
+>tr|O16132|O16132_HYDVU NK-2 class homeobox transcription factor OS=Hydra vulgaris GN=CnNK-2 PE=2 SV=1
+MDFSILPVNSSFLVDDILRRKHYENKIHQSNFSQFSVLSDEISIKTRLSAFPIYNKGMHK
+NKELVNKPFQMNDKNITETERDFNKSSISFDMTSNVEYSFGDKRMNNRHSFQGLSCRVAE
+AEMYARGKREDNSSDENSPKCESPSLTAKTEYHNASGDAMHVTSESLIQQNLLNIKSSRK
+KPRILFSQSQVMELGKKFKDQKYLSASERDQIANKLNLTPTQVKIWFQNKRYKCKKQTIE
+SRTRPPPYEWLHFQHRNVPVLVQNNQVSSDVCLPYCNRPTYLPSNSPVDMNYPPFYPDPY
+NGHNHHYSNSYNTPSQTSTYPNSWPFYK
+>sp|O93590|ZAX_XENLA Homeobox protein zampogna OS=Xenopus laevis GN=zax PE=2 SV=1
+MSLTSFSIQDILARTGGNRGKDTRTDGNNISPPPSPSADEGHNEWPRAENPPLTPEKEKT
+DTDSGTEDFHWERDTETANNGAFTDPSSGDRLADSPKSSKKRSRAAFSHAQVYELERRFS
+LQRYLSGPERADLAASLKLTETQVKIWFQNRRYKTKRKLIATQTAPKSSLVPTRKVAVRV
+LVKDDQRQYCPEDMLSPSLLSLYHAYQYYPYMYCLPAWVPHLPL
+>tr|Q90853|Q90853_CHICK Homeobox protein OS=Gallus gallus GN=GH6 PE=2 SV=1
+MAQDRECLCSAGFQRGDYTQGNTDRSTAAGNCRRRGSGEPRSHPPAEADPPSRSCFTDDA
+GRSDGKRRLHICPRLVLFHRGPAGHRSGGGTRRAAAGGGGGRRTSRCGPHSPLRLGASGC
+PLRDAAVGWYRRAFLGCAAPTPATGTRRSCPEDTERAGGGGRAAGGAAGGRQSSGGREEE
+EERGEEAGEAEQRAAGRKKKTRTVFSRSQVFQLESTFDVKRYLSSSERAGLAASLHLTET
+QVKIWFQNRRNKWKRHVAADLEAANLSHAAQRIVRVPILYHENSPASALGFGLPHMSPPL
+VGFSGGVSYPPGHLPRRLPSLPSLADDGTRLSAHLCRDRGPEPPPLASSFTLGLFLSTFT
+IFRFSTFI
+>tr|O97671|O97671_RABIT Homeobox protein (Fragment) OS=Oryctolagus cuniculus GN=HEX PE=2 SV=1
+GKPLLWSPFLQRPLHKRKGGQVRFSNDQTIELEKKFETQKYLSPPERKRLAKMLQLSERQ
+VKTWFQNRRAKWRRLKQENPQSGKKEQENLDSSCEQRPDLPGDQHKGASLDSSQCSQSPA
+SQEDLESEISEDSDQEVD
+>tr|Q9YHC2|Q9YHC2_CHICK Homeodomain protein (Fragment) OS=Gallus gallus GN=Nkx-6.1 PE=2 SV=1
+PPWRDARIGCAPHQGSILLDKDGKRKHTRPTFSGQQIFALEKTFEQTKYLAGPERARLAY
+SLGMTESQVKVWFQNRRTKWRKKHAAEMATAKKKQDSETERLKGASDNEDDDDDYNKPLD
+PNSDDEKIAQLLKKHKPGAGGLLPHPAEGEASA
+>sp|P28468|HOX1_HALRO Homeobox protein AHox1 OS=Halocynthia roretzi GN=AHOX1 PE=2 SV=1
+MEKMHSKSVSPVPFNNSNNTSLGGLRKSSSIPTLAVPECESMGNKHIEEERTNNITTMAM
+KRRLLDPQNKKKQNRFERYSSSNHAQEQSSEENFCRSKKDSTVLKFGIDSILKNKNAEKV
+PKGISNAGRIQDERFTEACTNTSSNVNPLSKYFKPSSNDQLGARRTATSFSSSSEASDSK
+SCCTNNNEEARYKYRVIDKRKSADSDWSEDATGNEADDPDDHINQDNCDLASTLEQSRIV
+ALEILKNKRLRLDSSEALNDLTPYDQLSRTEDQQISRRVEMMNHQAFARENNEWPRSFSS
+GLQDPFAKNLPNAFLPFYMQPYLRAYYNIQKYIYHKKLLNRNDRFYREANVENDNYKTEE
+SLRSPSETKQYSPDASTFYPIRTEDSNGSRNLKVDVEEGDKEANKLFKDLCVSVGDRLSN
+ALSYGRKDYNGLSTSQTSGNRFLNFSDKGIQAGSYYQTGERNDSLAGPLKNSGMSFDFPP
+KFGSNNSSTDKPEQEDNNPQTIGSEYQINTQRSMKDNLLTAKLLENEAKLRYGNIVTQYP
+RPFSWPFAASVRKSYDPALRSYFSRFNNSDAPHYGAAQVNPTAGNNFKSMLPGNFENPYF
+FNELNTLDTTGFLSRQYGHMSSSQNPHSETQNRSEEVRGTVKKRRKWNRAVFSLMQRRGL
+EKSFQSQKYVAKPERRKLADALSLTDAQVKIWFQNRRMKWRQEIKMKNRGLVPVHILGQD
+HEIEKEKTQTPSDEGEVINVD
+>sp|O88181|BARH2_RAT BarH-like 2 homeobox protein OS=Rattus norvegicus GN=Barhl2 PE=2 SV=1
+MTAMEGASGSSFGIDTILSGAGSGSPGMMNGDFRSLGEARTTDFRSQATPSPCSEIDTVG
+TAPSSPISVTLEPPEPHLVTDGPQHHHHLHHGQQPPPPSAPPAQSLQPSPQQQPPPQPQS
+AAQQLGSAAAAPRTSTSSFLIKDILGDSKPLAACAPYSTSVSSPHHTPKQECNAAHESFR
+PKLEQEDSKTKLDKREDSQSDIKCHGTKEEGDREITSSRESPPVRAKKPRKARTAFSDHQ
+LNQLERSFERQKYLSVQDRMDLAAALNLTDTQVKTWYQNRRTKWKRQTAVGLELLAEAGN
+YSALQRMFPSPYFYHPSLLGSMDSTTAAAAAAAMYSSMYRTPPAPHPQLQRPLVPRVLIH
+GLGPGGQPALNPLSNPIPGTPHPR
+>sp|Q24255|BARH1_DROME Homeobox protein B-H1 OS=Drosophila melanogaster GN=B-H1 PE=2 SV=2
+MKDSMSILTQTPSEPNAAHPQLHHHLSTLQQQHHQHHLHYGLQPPAVAHSIHSTTTMSSG
+GSTTTASGIGKPNRSRFMINDILAGSAAAAFYKQQQHHQQLHHHNNNNNSGSSGGSSPAH
+SNNNNNINGDNCEASNVAGVGVLPSALHHPQPHPPTHPHTHPHALMHPHGKLGHFPPTAG
+GNGLNVAQYAAAMQQHYAAAAAAAAARNNAAAAAAAAAAAAAAGVAAPPVDGGVDGGVGL
+APPAGGDLDDSSDYHEENEDCDSGNMDDHSVCSNGGKDDDGNSVKSGSTSDMSGLSKKQR
+KARTAFTDHQLQTLEKSFERQKYLSVQERQELAHKLDLSDCQVKTWYQNRRTKWKRQTAV
+GLELLAEAGNFAAFQRLYGGSPYLGAWPYAAAAGAAHGATPHTNIDIYYRQAAAAAAMQK
+PLPYNLYAGVPSVGVGVGVGVGPAPFSHLSASSSLSSLSSYYQSAAAAASAANPGGPHPV
+APPPSVGGGSPPSGLVKPIPAHSASASPPPRPPSTPSPTLNPGSPPGRSVDSCSQSDDED
+QIQV
+>sp|Q22909|HM30_CAEEL Homeobox protein ceh-30 OS=Caenorhabditis elegans GN=ceh-30 PE=2 SV=2
+MSLLDPRQFLLPAFYLDPTTQALLAQAASTSPCNKISSSSSFRISDILEQSPNNSSHSND
+HDPSPQSIKSDFSTSPRASSPGGDRMGSPGSCKKSRKARTIFTDKQLQELENTFEKQKYL
+SVQDRMDLAHRMGLTDTQVKTWYQNRRTKWKRQATSGMDLLSEPGNLSAVQNLIRSSPYW
+ANYITALPMGTQLPMMGLPMSMIVPPAHAFQPSSSSNSPSTHISSESPQLDVSSNSE
+>sp|P26797|HM19_CAEEL Homeobox protein ceh-19 OS=Caenorhabditis elegans GN=ceh-19 PE=2 SV=2
+MAFNIESLLEKKSNPVEEGNDFEEENDSEKNGEEDEEEEEKNVIDGWTNMATSQLAMFAI
+ANDLRTPTLVELQMLLGVSARKHDYKRSRKSVCERKPRQAYSARQLDRLETEFQTDKYLS
+VNKRIQLSQTLNLTETQIKTWFQNRRTKWKKQLTSSIRQMVKDAPTSTSVGVPFQSLLTP
+PTPPTTLACHVNSLFACEQ
+>sp|P22807|SLOU_DROME Homeobox protein slou OS=Drosophila melanogaster GN=slou PE=2 SV=1
+MVMLQSPAQKASDSASAQNTAVGGLMSPNSNPDSPKSNTSPDVASADSVVSGTGGGSTPP
+AAKIPKFIISANGAAVAGKQEQELRYSLERLKQMSSESGSLLSRLSPLQEDSQDKEKPNH
+NNNNSLTNHNANSNTRRSQSPPASVGSVSFSSPAQQRKLLELNAVRHLARPEPLQHPHAA
+LLQQHPHLLQNPQFLAAAQQHMHHHQHQHHQHPAHPHSHQHPHPHPHPHPHPHPSAVFHL
+RAPSSSSTAPPSPATSPLSPPTSPAMHSDQQMSPPIAPPQNPPHSSQPPQQQQVAAPSDM
+DLERIKLVAAVAARTTQASSTSALASASNSVSNASISISNSSSGSPSGRDLSDYGFRIQL
+GGLAAAAAAAAATSRQIAAATYARSDTSEELNVDGNDEDSNDGSHSTPSVCPVDLTRSVN
+SSAAANPSSASTSASSDRDAATKRLAFSVENILDPNKFTGNKLPSGPFGHPRQWSYERDE
+EMQERLDDDQSEDMSAQDLNDMDQDDMCDDGSDIDDPSSETDSKKGGSRNGDGKSGGGGG
+GGSKPRRARTAFTYEQLVSLENKFKTTRYLSVCERLNLALSLSLTETQVKIWFQNRRTKW
+KKQNPGMDVNSPTIPPPGGGSFGPGAYASGLLYSHAVPYPPYGPYFHPLGAHHLSHSHS
+>sp|Q04787|BSH_DROME Brain-specific homeobox protein OS=Drosophila melanogaster GN=bsh PE=2 SV=5
+MAMLNEASLSPADAHAHANATTPTHSKAAAMASATTMLTTKTPFSIEHILFQNLNSASNN
+NNSSDTNGIAANTNNYAPKSSRNAVKSARSAFAHDNNPHKHPSQHSHPPQSHPPASASAS
+ATATARSNQAASGYAGEDYGKSMHSTPRSNHHSRHGTSHYNGDQISQQLGSGAAQHPPVP
+TTQPQPPPPPPLNGGSGASNGVLYPNAPYTDHGFLQMTLGYLSPSSGTYKSVDPYFLSQA
+SLFGGAPFFGAPGCVPELALGLGMGVNALRHCRRRKARTVFSDPQLSGLEKRFEGQRYLS
+TPERVELATALGLSETQVKTWFQNRRMKHKKQLRRRDNANEPVDFSRSEPGKQPGEATSS
+SGDSKHGKLNPGSVGGTPTQPTSEQQLQMCLMQQGYSTDDYSDLEADSGDEDNSSDVDIV
+GDAKLYQLT
+>sp|O08686|BARX2_MOUSE Homeobox protein BarH-like 2 OS=Mus musculus GN=Barx2 PE=2 SV=2
+MHCHAELRLSSPGQLKAARRRYKTFMIDEILSKETCDYFEKLSLYSVCPSLVVRPKPLHS
+CTGSPSLRAYPLLSVITRQPTVISHLVPTGSGLTPVLTRHPVAAAEAAAAAAETPGGEAL
+ASSESETEQPTPRQKKPRRSRTIFTELQLMGLEKKFQKQKYLSTPDRLDLAQSLGLTQLQ
+VKTWYQNRRMKWKKMVLKGGQEAPTKPKGRPKKNSIPTSEEIEAEEKMNSQAQSQELLES
+SERQEEPCDTQEPKACLVPLEVAEPIHQPQELSEASSEPPPLS
+>tr|Q23819|Q23819_HYDVD Cnox3 protein (Fragment) OS=Hydra viridissima GN=cnox3 PE=2 SV=1
+NLYPILNTDQNHCTYAKEDSLIPEVEEPSTYLQLKQNNAKGSGIKCRKPRTVFSDLQLMV
+LEREFNNRKYLSTPQRTNLADRLGLNQTQVKTWYQNRRMKWKKETFESEDKEPKIS
+>sp|Q01702|DLX3B_DANRE Homeobox protein Dlx3b OS=Danio rerio GN=dlx3b PE=2 SV=1
+MSGPTYDRKIPGISTDLSGSMSCHPTSKDSPTLPESSATDMGYYSSHHEYYQSPPYPQQM
+NSYHQFNLSGMGATPGAYPTKTEYPYNTYRQYGHFNRDLQTPPQSAVKEEPETEVRMVNG
+KPKKIRKPRTIYSSYQLAALQRRFQKAQYLALPERAELAAQLGLTQTQVKIWFQNRRSKF
+KKLYKNGEVPLEHSPNASDSMACNSPPSPAVWDNNAHSSQVNRGQIPQPPLSSTPPYMED
+YSNHWYQQGSHLQHPVHHPGPPQSVGAVY
+>sp|Q18273|HM43_CAEEL Homeobox protein ceh-43 OS=Caenorhabditis elegans GN=ceh-43 PE=2 SV=1
+MDPSKGFEYVAGDYYQTSGVAPPTSNGAGSNVSPYFPYHAYPTSSTNGATGGSMYGTPQQ
+TSAYAMYPPGPGSSPEEAFPEHTTTKIVEGCEAKYNVKGKKMRKPRTIYNSSQLQMLQKK
+FQKTQYLALPDRAALAHELGLSQTQVKIWFQNRRSKQKKQKGGSSDHASDEEDDDTEESK
+PESPPMGESVMIQESSEPRTLVSSSIKTEMKEEYPPMTLNEQYASPYLYGSDFSTILPPS
+QGFPNNALYNTAGAYPSIDYTNGVYQNTLYKYV
+>tr|Q23824|Q23824_HYDVD Msh protein (Fragment) OS=Hydra viridissima GN=msh PE=2 SV=1
+EFQFDLSKCFLRKHKANRKPRTPFSVNQLLTLEQKFKRKQYLSISERAELSELLRLTETQ
+IKIWFQNRRAKQKRSKEAEIEESVRNRLPLSAADYRSLDHLTLLSSFIAFIPIEYEVKIF
+MNVQRGIE
+>tr|Q24785|Q24785_9METZ Homeobox-containing protein (Fragment) OS=Ephydatia fluviatilis GN=prox3 PE=3 SV=1
+PHSSGSNASTINKQKKDRKPRTPFTSTQLIALERKFRQQKYLSVAERAEFAEYLKLTETQ
+VKIWFQNRRAKEKRLHEAEAERAARSLGFHFHMPMQSKMNTFRHPYCNSQYQTLCLCQFR
+HKIGIGTFPARTTDSISSNSSQPTLPWFLTCNSSTPL
+>sp|P70354|MSX3_MOUSE Homeobox protein MSX-3 OS=Mus musculus GN=Msx3 PE=1 SV=1
+MARATFDMNAAGLEARGGGHTEHGPLPFSVESLLEAERVPGSESGELGVERPLGASKPGA
+WPPPVAHSCPPRAPSPPPCTLRKHKTNRKPRTPFTTAQLLALERKFHQKQYLSIAERAEF
+SSSLSLTETQVKIWFQNRRAKAKRLQEAELEKLKLAAKPLLPAAFALPFPLGTQLHSSAA
+TFGGNAVPGILAGPVAAYGMYYLS
+>tr|Q90263|Q90263_DANRE Empty spiracles homeobox 3 OS=Danio rerio GN=emx3 PE=2 SV=1
+MFQHNKKCFTIESLVGKDSNSSNAAADEPIRPTALRFTESIHPSPFGSCFQNSGRTLYSS
+SPEMMFTDPSTHSTNSGLSLRHLQIPTQPFFSPHQRDTLNFYPWVLRNRYLGHRFQGDDS
+SPENLLLHGPFSRKPKRIRTAFSPSQLLRLERAFEKNHYVVGAERKQLANGLCLTETQVK
+VWFQNRRTKHKRQKLEEESPDPQQKRKGSQHVSRWRVATQQGSPEDIDVISED