Mercurial > repos > rnateam > targetfinder
comparison TargetFinder.xml @ 1:c69fbd1f8c69 draft default tip
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/targetfinder/ commit fe9dd99a14770b6c5f26e24893599acb577e304f"
| author | rnateam |
|---|---|
| date | Thu, 25 Mar 2021 19:52:04 +0000 |
| parents | 48aeeeff1977 |
| children |
comparison
equal
deleted
inserted
replaced
| 0:48aeeeff1977 | 1:c69fbd1f8c69 |
|---|---|
| 1 <tool id="targetfinder" name="Plant small RNA target prediction tool" version="1.7.0"> | 1 <tool id='targetfinder' name='TargetFinder' version='1.7.0+galaxy1' profile='20.01'> |
| 2 <requirements> | 2 <description>plant small RNA target prediction tool</description> |
| 3 <requirement type="package" version="1.7">targetfinder</requirement> | 3 <macros> |
| 4 </requirements> | 4 <import>macros.xml</import> |
| 5 </macros> | |
| 6 <expand macro='edam' /> | |
| 7 <expand macro='requirements' /> | |
| 5 <stdio> | 8 <stdio> |
| 6 <exit_code range="1:" /> | 9 <exit_code range='1:' /> |
| 7 </stdio> | 10 </stdio> |
| 8 <command><![CDATA[ | 11 <command><![CDATA[ |
| 9 targetfinder_threads.pl | 12 targetfinder_threads.pl |
| 10 -f $f | 13 -f '$f' |
| 11 -d $d | 14 -d '$d' |
| 12 -c $c | 15 -c $c |
| 16 -p $output_format | |
| 13 -t "\${GALAXY_SLOTS:-12}" | 17 -t "\${GALAXY_SLOTS:-12}" |
| 14 $r | 18 $r |
| 15 -o $output1 | 19 -o '$output_file' |
| 20 | |
| 16 ]]></command> | 21 ]]></command> |
| 17 <inputs> | 22 <inputs> |
| 18 <param label="Input small RNA sequences file" help="(-f) FASTA-format" name="f" type="data" format="fasta" /> | 23 <param argument='-f' type='data' format='fasta' label='Input small RNA sequences file' help='FASTA-format' /> |
| 19 <param label="Target sequence database file" help="(-d) FASTA-format" name="d" type="data" format="fasta" /> | 24 <param argument='-d' type='data' format='fasta' label='Target sequence database file' help='FASTA-format' /> |
| 20 <param label="Prediction score cutoff value" help="(-c) DEFAULT = 4" name="c" type="float" value="4.0" /> | 25 <param argument='-c' type='float' value='4.0' label='Prediction score cutoff value' help='Predicted targets are printed out if they are equal to or lower than the cutoff score specified. DEFAULT = 4' /> |
| 21 <param label="Search reverse strand for targets?" help="(-r) Use this option if the database is genomic DNA." name="r" type="boolean" falsevalue="" truevalue="-r" checked="false" /> | 26 <param argument='-c' type='float' value='4.0' label='Prediction score cutoff value' help='Predicted targets are printed out if they are equal to or lower than the cutoff score specified. DEFAULT = 4' /> |
| 27 <param argument='-r' type='boolean' falsevalue='' truevalue='-r' checked='false' label='Search reverse strand for targets?' help='Use this option if the database is genomic DNA.' /> | |
| 28 <param name='output_format' argument='-p' type='select' label='Output format' help='Output format for small RNA-target pairs (Default = classic).' > | |
| 29 <option value='classic'>Original TargetFinder base-pair format</option> | |
| 30 <option value='gff'>GFF</option> | |
| 31 <option value='json'>JavaScript Object Notation (JSON)</option> | |
| 32 <option value='table'>Tab-delimited format</option> | |
| 33 </param> | |
| 22 </inputs> | 34 </inputs> |
| 23 <outputs> | 35 <outputs> |
| 24 <data name="output1" format="data"/> | 36 <data name='output_file' format='txt'> |
| 37 <change_format> | |
| 38 <when input="output_format" value="gff" format="gff" /> | |
| 39 <when input="output_format" value="json" format="json" /> | |
| 40 <when input="output_format" value="table" format="tabular" /> | |
| 41 </change_format> | |
| 42 </data> | |
| 25 </outputs> | 43 </outputs> |
| 26 <tests> | 44 <tests> |
| 27 <test> | 45 <test> |
| 28 <param name="f" value="ath_miRNAs_test.fa"/> | 46 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/> |
| 29 <param name="d" value="Antirrhinum_majus.mRNA.EST.fasta"/> | 47 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/> |
| 30 <param name="r" value=""/> | 48 <param name='r' value='false'/> |
| 31 <param name="c" value="4.0"/> | 49 <param name='c' value='4.0'/> |
| 32 <param name="t" value="1"/> | 50 <param name='output_format' value='classic'/> |
| 33 <output name="output1" file="ath_miRNAs_predicted_targets.txt" compare="contains"/> | 51 <output name='output_file' file='targetfinder_test_01.txt' compare='contains'/> |
| 52 </test> | |
| 53 <test> | |
| 54 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/> | |
| 55 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/> | |
| 56 <param name='r' value='true'/> | |
| 57 <param name='c' value='4.0'/> | |
| 58 <param name='output_format' value='classic'/> | |
| 59 <output name='output_file' file='targetfinder_test_02.txt' compare='contains'/> | |
| 60 </test> | |
| 61 <test> | |
| 62 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/> | |
| 63 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/> | |
| 64 <param name='r' value='false'/> | |
| 65 <param name='c' value='6.0'/> | |
| 66 <param name='output_format' value='classic'/> | |
| 67 <output name='output_file' file='targetfinder_test_03.txt' compare='contains'/> | |
| 68 </test> | |
| 69 <test> | |
| 70 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/> | |
| 71 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/> | |
| 72 <param name='r' value='false'/> | |
| 73 <param name='c' value='4.0'/> | |
| 74 <param name='output_format' value='classic'/> | |
| 75 <output name='output_file' file='targetfinder_test_04.txt' compare='contains'/> | |
| 76 </test> | |
| 77 <test> | |
| 78 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/> | |
| 79 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/> | |
| 80 <param name='r' value='false'/> | |
| 81 <param name='c' value='4.0'/> | |
| 82 <param name='output_format' value='gff'/> | |
| 83 <output name='output_file' file='targetfinder_test_05.gff' compare='contains'/> | |
| 84 </test> | |
| 85 <test> | |
| 86 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/> | |
| 87 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/> | |
| 88 <param name='r' value='false'/> | |
| 89 <param name='c' value='4.0'/> | |
| 90 <param name='output_format' value='table'/> | |
| 91 <output name='output_file' file='targetfinder_test_06.tab' compare='contains'/> | |
| 92 </test> | |
| 93 <test> | |
| 94 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/> | |
| 95 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/> | |
| 96 <param name='r' value='false'/> | |
| 97 <param name='c' value='4.0'/> | |
| 98 <param name='output_format' value='json'/> | |
| 99 <output name='output_file' file='targetfinder_test_07.json' compare='contains' lines_diff='1'/> | |
| 100 </test> | |
| 101 <test> | |
| 102 <param name='f' value='arabidopsis_thaliana_miRNA.fasta'/> | |
| 103 <param name='d' value='arabidopsis_thaliana_mRNA.fasta'/> | |
| 104 <param name='r' value='true'/> | |
| 105 <param name='c' value='6.5'/> | |
| 106 <param name='output_format' value='table'/> | |
| 107 <output name='output_file' file='targetfinder_test_08.tab' compare='contains'/> | |
| 34 </test> | 108 </test> |
| 35 </tests> | 109 </tests> |
| 36 <help><![CDATA[ | 110 <help><![CDATA[ |
| 111 .. class:: infomark | |
| 112 | |
| 37 **What it does** | 113 **What it does** |
| 38 | 114 |
| 39 TargetFinder will computationally predict small RNA binding sites on target transcripts from a sequence database. | 115 TargetFinder will computationally predict small RNA binding sites on target transcripts from a sequence database. |
| 40 | 116 |
| 41 This is done by aligning the input small RNA sequence against all transcripts, | 117 This is done by aligning the input small RNA sequence against all transcripts, followed by site scoring using a position-weighted scoring matrix. |
| 42 followed by site scoring using a position-weighted scoring matrix. | 118 |
| 119 ---- | |
| 120 | |
| 121 .. class:: infomark | |
| 43 | 122 |
| 44 **Input** | 123 **Input** |
| 45 | 124 |
| 46 -f Input small RNA sequences file (FASTA-format). | 125 This tool requires two fasta files: |
| 47 | 126 |
| 48 -d Target sequence database file (FASTA-format) | 127 :: |
| 49 | 128 |
| 50 **Output** | 129 -f Input small RNA sequences file (FASTA-format). |
| 51 | 130 -d Target sequence database file (FASTA-format) |
| 52 Each predicted target site is printed out separately. | 131 |
| 53 The output consists of two parts. | 132 ---- |
| 54 | 133 |
| 55 The first is a description line and the second is a base-pairing diagram of the target and small RNA (query) sequence. | 134 .. class:: infomark |
| 56 | 135 |
| 57 The description line contains the query name, the description line from the target sequence database, and the target prediction score. | 136 **Original TargetFinder Output** |
| 58 | 137 |
| 59 The base-pairing diagram has the target site sequence on top in 5'-3' orientation and the query sequence on the bottom in 3'-5' orientation. | 138 |
| 60 | 139 Each predicted target site is printed out separately. |
| 61 Between the target site sequece and the query sequence are base pair symbols. | 140 |
| 62 | 141 The output consists of two parts. The first is a description line and the second is a base-pairing diagram of the target and small RNA (query) sequence. The description line contains the query name, the description line from the target sequence database, and the target prediction score. |
| 63 A ":" (colon) symbol represents an ordinary Watson-Crick base pair, a "." (period) represents a G:U base pair, and a " " (space) represents a mismatch. | 142 |
| 143 :: | |
| 144 | |
| 145 query=miR399a, target=AT2G33770.1 | Symbol: None | ubiquitin-conjugating enzyme family protein, low similarity to u, score=1.5 | |
| 146 | |
| 147 | |
| 148 The base-pairing diagram has the target site sequence on top in 5'-3' orientation and the query sequence on the bottom in 3'-5' orientation. Between the target site sequece and the query sequence are base pair symbols. A ':' (colon) symbol represents an ordinary Watson-Crick base pair, a '.' (period) represents a G:U base pair, and a ' ' (space) represents a mismatch. | |
| 149 | |
| 150 :: | |
| 151 | |
| 152 target 5' UAGGGCAAAUCUUCUUUGGCA 3' | |
| 153 .:::::::::::.:::::::: | |
| 154 query 3' GUCCCGUUUAGAGGAAACCGU 5' | |
| 155 | |
| 64 | 156 |
| 65 If a small RNA is predicted to target a sequence more than once, each target site will be output as separate output. | 157 If a small RNA is predicted to target a sequence more than once, each target site will be output as separate output. |
| 158 | |
| 159 | |
| 160 ---- | |
| 161 | |
| 162 .. class:: infomark | |
| 163 | |
| 164 **Additional output formats** | |
| 165 | |
| 166 In addition to the output described above ('classic' output), three new output format options were added to TargetFinder. | |
| 167 | |
| 168 Generic Feature Format (GFF3): | |
| 169 | |
| 170 :: | |
| 171 | |
| 172 AT2G33770.1 | Symbols: UBC24 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN targetfinder rna_target 607 627 1.5 + . smallRNA=miR399a;target_seq=UAGGGCAAAUCUUCUUUGGCA;base_pairs=.:::::::::::.::::::::;miR_seq=GUCCCGUUUAGAGGAAACCGU | |
| 173 AT2G33770.1 | Symbols: UBC24 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN targetfinder rna_target 740 760 1.5 + . smallRNA=miR399a;target_seq=UAGGGCAUAUCUCCUUUGGCA;base_pairs=.:::::: :::::::::::::;miR_seq=GUCCCGUUUAGAGGAAACCGU | |
| 174 AT2G33770.1 | Symbols: UBC24 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN targetfinder rna_target 829 849 1.5 + . smallRNA=miR399a;target_seq=UUGGGCAAAUCUCCUUUGGCA;base_pairs=. :::::::::::::::::::;miR_seq=GUCCCGUUUAGAGGAAACCGU | |
| 175 | |
| 176 | |
| 177 Tab-deliminated Format: | |
| 178 | |
| 179 :: | |
| 180 | |
| 181 miR399a AT2G33770.1 | Symbols: UBC24 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN 607 627 + 1.5 UAGGGCAAAUCUUCUUUGGCA .:::::::::::.:::::::: GUCCCGUUUAGAGGAAACCGU | |
| 182 miR399a AT2G33770.1 | Symbols: UBC24 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN 740 760 + 1.5 UAGGGCAUAUCUCCUUUGGCA .:::::: ::::::::::::: GUCCCGUUUAGAGGAAACCGU | |
| 183 miR399a AT2G33770.1 | Symbols: UBC24 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN 829 849 + 1.5 UUGGGCAAAUCUCCUUUGGCA . ::::::::::::::::::: GUCCCGUUUAGAGGAAACCGU | |
| 184 | |
| 185 JavaScript Object Notation Format (JSON): | |
| 186 | |
| 187 :: | |
| 188 | |
| 189 { | |
| 190 'miR399a': { | |
| 191 'hits' : [ | |
| 192 { | |
| 193 'Target accession': 'AT2G33770.1 | Symbols: UBC24, ATUBC24, PHO2 | phosphate 2 | chr2:14277558-14283040 REVERSE LEN', | |
| 194 'Score': '1.5', | |
| 195 'Coordinates': '607-627', | |
| 196 'Strand': '+', | |
| 197 'Target sequence': 'UAGGGCAAAUCUUCUUUGGCA', | |
| 198 'Base pairing': '.:::::::::::.::::::::', | |
| 199 'amiRNA sequence': 'GUCCCGUUUAGAGGAAACCGU' | |
| 200 } | |
| 201 ] | |
| 202 } | |
| 203 } | |
| 204 | |
| 205 | |
| 206 ---- | |
| 207 | |
| 208 .. class:: infomark | |
| 209 | |
| 210 **Method** | |
| 211 | |
| 212 TargetFinder searches for potential miRNA target sites in a FASTA-formated sequence database using three main steps. | |
| 213 | |
| 214 | |
| 215 1. The small RNA query sequence is aligned to every sequence in the FASTA-formated sequence database using `Smith-Waterman (SW) alignments <https://en.wikipedia.org/wiki/Smith%E2%80%93Waterman_algorithm>`_ implemented in the FASTA package (ssearch35_t). | |
| 216 2. The SW alignments are converted into RNA duplexes. | |
| 217 3. Each duplex is scored using a position-dependent scoring matrix. | |
| 218 | |
| 219 SW alignments are used to identify the best complementary regions between the small RNA query sequence and every sequence in the FASTA-formated sequence database. | |
| 220 | |
| 66 ]]></help> | 221 ]]></help> |
| 67 <citations> | 222 <expand macro='citations' /> |
| 68 <citation type="doi">10.1016/j.cell.2005.04.004</citation> | |
| 69 <citation type="doi">10.1371/journal.pone.0000219</citation> | |
| 70 <citation type="doi">10.1007/978-1-60327-005-2_4</citation> | |
| 71 </citations> | |
| 72 </tool> | 223 </tool> |
| 73 | 224 |
