comparison mirdeep2.xml @ 1:ea20fb8d849e draft default tip

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/mirdeep2/mirdeep2 commit 04c75332ac618b43ce5c3f307f7866e97147e865
author rnateam
date Thu, 05 Apr 2018 08:38:04 -0400
parents 6d5125a67880
children
comparison
equal deleted inserted replaced
0:6d5125a67880 1:ea20fb8d849e
1 <tool id="rbc_mirdeep2" name="MiRDeep2" version="2.0.0"> 1 <tool id="rbc_mirdeep2" name="MiRDeep2" version="2.0.0.8.1">
2 <description> 2 <description>identification of novel and known miRNAs</description>
3 <![CDATA[
4 identification of novel and known miRNAs
5 ]]>
6 </description>
7 <requirements> 3 <requirements>
8 <requirement type="package" version="2.0">mirdeep2</requirement> 4 <requirement type="package" version="2.0.0.8">mirdeep2</requirement>
9 <requirement type="package" version="2.0">mirdeep2_quantifier</requirement>
10 <requirement type="package" version="0.12.7">bowtie</requirement>
11 <requirement type="package" version="5.18.1">perl</requirement>
12 <requirement type="package" version="1.8.5">vienna_rna</requirement>
13 <requirement type="package" version="2.023">pdf_api2</requirement>
14 <requirement type="package" version="2.0">randfold</requirement>
15 </requirements> 5 </requirements>
16 6 <command detect_errors="aggressive">
17 <command>
18 <![CDATA[ 7 <![CDATA[
19 miRDeep2.pl 8 miRDeep2.pl
20 9
21 $reads 10 $reads
22 $genome 11 $genome
23 $mappings 12 $mappings
24 13
25 #if $mature_this 14 #if $mature_this
26 $mature_this 15 $mature_this
27 #else 16 #else
28 none 17 none
29 #end if 18 #end if
30 19
31 #if $mature_other 20 #if $mature_other
32 $mature_other 21 $mature_other
33 #else 22 #else
34 none 23 none
35 #end if 24 #end if
36 25
37 #if $precursors 26 #if $precursors
38 $precursors 27 $precursors
39 #else 28 #else
40 none 29 none
41 #end if 30 #end if
42 31
43 #if $species.value != 'all' 32 #if $species.value != 'all'
44 -t $species 33 -t $species
45 #end if 34 #end if
46 35
47 #if $star_sequences 36 #if $star_sequences
48 -s $star_sequences 37 -s $star_sequences
49 #end if 38 #end if
50 39
51 #if $min_read_stack 40 #if $min_read_stack
52 -a $min_read_stack 41 -a $min_read_stack
53 #end if 42 #end if
54 43
55 #if $min_read_stack 44 #if $min_read_stack
56 -a $min_read_stack 45 -a $min_read_stack
57 #end if 46 #end if
58 47
59 -g $max_precursors_analyze 48 -g $max_precursors_analyze
60 -b $min_score_cutoff 49 -b $min_score_cutoff
61 $disable_randfold 50 $disable_randfold
62 51
63 ; cp result*.bed result.bed 2> /dev/null 52 &&
64 ; cp result*.csv result.csv 2> /dev/null 53
65 ; cp mirdeep_runs/run*/output.mrd . 2> /dev/null
66 ; cp mirdeep_runs/run*/survey.csv . 2> /dev/null
67
68 ## html output 54 ## html output
69 ; 55 mv result*.html $html 2> /dev/null
70 cp result*.html $html 2> /dev/null 56
71
72 ## move pdf directory to be accessible from the new index.html 57 ## move pdf directory to be accessible from the new index.html
73 ; 58 &&
74 mkdir -p $html.files_path 2> /dev/null 59 mkdir -p $html.files_path 2> /dev/null
75 ; 60 &&
76 cp -R pdfs* $html.files_path 2> /dev/null 61 mv pdfs* $html.files_path 2> /dev/null
77
78 ]]> 62 ]]>
79 </command> 63 </command>
80 <stdio> 64 <inputs>
81 <!-- Anything other than zero is an error -->
82 <exit_code range="1:" />
83 <exit_code range=":-1" />
84 <!-- In case the return code has not been set propery check stderr too -->
85 <regex match="Error:" />
86 <regex match="Exception:" />
87 </stdio>
88 <inputs>
89 <param name="reads" format="fasta" type="data" label="Collapsed deep sequencing reads"> 65 <param name="reads" format="fasta" type="data" label="Collapsed deep sequencing reads">
90 <help> 66 <help>
91 <![CDATA[ 67 <![CDATA[
92 Reads in fasta format. The identifier should contain a prefix, a running 68 Reads in fasta format. The identifier should contain a prefix, a running
93 number and a '_x' to indicate the number of reads that have this sequence. 69 number and a '_x' to indicate the number of reads that have this sequence.
95 ]]> 71 ]]>
96 </help> 72 </help>
97 </param> 73 </param>
98 <param name="genome" format="fasta" type="data" label="Genome" help="Genome contigs in fasta format. The identifiers should be unique."/> 74 <param name="genome" format="fasta" type="data" label="Genome" help="Genome contigs in fasta format. The identifiers should be unique."/>
99 <param name="mappings" format="tabular" type="data" label="Mappings" help="Reads mapped against genome. Mappings should be in ARF format."/> 75 <param name="mappings" format="tabular" type="data" label="Mappings" help="Reads mapped against genome. Mappings should be in ARF format."/>
100 <param name="mature_this" optional="true" format="fasta" type="data" label="Mature miRNA sequences for this species" 76 <param name="mature_this" optional="true" format="fasta" type="data" label="Mature miRNA sequences for this species"
101 help="miRBase miRNA sequences in fasta format. These should be the known mature sequences for the species being analyzed."/> 77 help="miRBase miRNA sequences in fasta format. These should be the known mature sequences for the species being analyzed."/>
102 <param name="mature_other" optional="true" format="fasta" type="data" label="Mature miRNA sequences for related species"> 78 <param name="mature_other" optional="true" format="fasta" type="data" label="Mature miRNA sequences for related species">
103 <help> 79 <help>
104 <![CDATA[ 80 <![CDATA[
105 miRBase miRNA sequences in fasta format. These should be the pooled known 81 miRBase miRNA sequences in fasta format. These should be the pooled known
106 mature sequences for 1-5 species closely related to the species being analyzed. 82 mature sequences for 1-5 species closely related to the species being analyzed.
107 ]]> 83 ]]>
108 </help> 84 </help>
109 </param> 85 </param>
110 <param name="precursors" optional="true" format="fasta" type="data" label="Precursor sequences" 86 <param name="precursors" optional="true" format="fasta" type="data" label="Precursor sequences"
111 help="miRBase miRNA precursor sequences in fasta format. These should be the known precursor sequences for the species being analyzed."/> 87 help="miRBase miRNA precursor sequences in fasta format. These should be the known precursor sequences for the species being analyzed."/>
112 88
113 <param name="species" type="select" label="Search in species" help="If not searching in a specific species all species in your files will be analyzed. (-t)"> 89 <param name="species" type="select" label="Search in species" help="If not searching in a specific species all species in your files will be analyzed. (-t)">
114 <option value="all">All species</option> 90 <option value="all">All species</option>
115 <option value="tni">tetraodon</option> 91 <option value="tni">tetraodon</option>
116 <option value="dps">d.pseudoobscura</option> 92 <option value="dps">d.pseudoobscura</option>
117 <option value="dya">d.yakuba</option> 93 <option value="dya">d.yakuba</option>
143 <option value="dan">d.ananassae</option> 119 <option value="dan">d.ananassae</option>
144 <option value="hsa">human</option> 120 <option value="hsa">human</option>
145 <option value="dsi">d.simulans</option> 121 <option value="dsi">d.simulans</option>
146 </param> 122 </param>
147 <param name="star_sequences" format="fasta" type="data" optional="true" label="Star sequences" help="From miRBase in fasta format (optional) (-s)"/> 123 <param name="star_sequences" format="fasta" type="data" optional="true" label="Star sequences" help="From miRBase in fasta format (optional) (-s)"/>
148 124
149 <param name="min_read_stack" optional="true" type="integer" minvalue="0" label="Minimum read stack height"> 125 <param name="min_read_stack" optional="true" type="integer" min="0" label="Minimum read stack height">
150 <help> 126 <help>
151 <![CDATA[ 127 <![CDATA[
152 minimum read stack height that triggers analysis. Using this option disables 128 minimum read stack height that triggers analysis. Using this option disables
153 automatic estimation of the optimal value and all detected precursors are analyzed. (-a) 129 automatic estimation of the optimal value and all detected precursors are analyzed. (-a)
154 ]]> 130 ]]>
155 </help> 131 </help>
156 </param> 132 </param>
157 <param name="max_precursors_analyze" type="integer" value="50000" label="Maximum precursors" 133 <param name="max_precursors_analyze" type="integer" value="50000" label="Maximum precursors"
158 help="Maximum number of precursors to analyze when automatic excision gearing is used. If set to -1 all precursors will be analyzed. (-g)."/> 134 help="Maximum number of precursors to analyze when automatic excision gearing is used. If set to -1 all precursors will be analyzed. (-g)."/>
159 <param name="min_score_cutoff" type="integer" value="0" label="Minimum miRNA score" 135 <param name="min_score_cutoff" type="integer" value="0" label="Minimum miRNA score"
160 help="Minimum score cut-off for predicted novel miRNAs to be displayed in the overview table. (-b)"/> 136 help="Minimum score cut-off for predicted novel miRNAs to be displayed in the overview table. (-b)"/>
161 <param name="disable_randfold" type="boolean" truevalue="-c" falsevalue="" label="Disable randfold analysis" help="(-c)"/> 137 <param name="disable_randfold" type="boolean" truevalue="-c" falsevalue="" label="Disable randfold analysis" help="(-c)"/>
138 <param name="detailed_fasta" type="boolean" checked="false" label="Detailed fasta output" help="Output fasta files of precursors, mature and star strand for both novel and known miRNAs"/>
162 </inputs> 139 </inputs>
163 <outputs> 140 <outputs>
164 <data name="tab_results" format="tabular" from_work_dir="result.csv" label="Tabular output of ${tool.name} on ${on_string}"/> 141 <data name="tab_results" format="tabular" from_work_dir="result*.csv" label="Tabular output of ${tool.name} on ${on_string}"/>
165 <data format="html" name="html" label="${tool.name} on ${on_string} (html report)"/> 142 <data format="html" name="html" label="${tool.name} on ${on_string} (html report)"/>
166 <data name="pred_acc" format="tabular" from_work_dir="survey.csv" label="Prediction accuracy output of ${tool.name} on ${on_string}"/> 143 <data name="pred_acc" format="tabular" from_work_dir="mirdeep_runs/run*/survey.csv" label="Prediction accuracy output of ${tool.name} on ${on_string}"/>
167 <data name="bed_out" format="bed" from_work_dir="result.bed" label="Bed output of ${tool.name} on ${on_string}"/> 144 <data name="bed_out" format="bed" from_work_dir="result*.bed" label="Bed output of ${tool.name} on ${on_string}"/>
168 <data name="mrd_out" format="txt" from_work_dir="output.mrd" label="Text output of ${tool.name} on ${on_string}"/> 145 <data name="mrd_out" format="txt" from_work_dir="mirdeep_runs/run*/output.mrd" label="Text output of ${tool.name} on ${on_string}"/>
146
147 <data name="known_mature" format="fasta" from_work_dir="mirna_results_*/known_mature_*.fa" label="${tool.name} on ${on_string}: known mature">
148 <filter>detailed_fasta</filter>
149 </data>
150 <data name="known_pres" format="fasta" from_work_dir="mirna_results_*/known_pres_*.fa" label="${tool.name} on ${on_string}: known precursors">
151 <filter>detailed_fasta</filter>
152 </data>
153 <data name="known_star" format="fasta" from_work_dir="mirna_results_*/known_star_*.fa" label="${tool.name} on ${on_string}: known star">
154 <filter>detailed_fasta</filter>
155 </data>
156 <data name="not_mature" format="fasta" from_work_dir="mirna_results_*/not_mature_*.fa" label="${tool.name} on ${on_string}: not detected mature">
157 <filter>detailed_fasta</filter>
158 </data>
159 <data name="not_pres" format="fasta" from_work_dir="mirna_results_*/not_pres_*.fa" label="${tool.name} on ${on_string}: not detected precursors">
160 <filter>detailed_fasta</filter>
161 </data>
162 <data name="not_star" format="fasta" from_work_dir="mirna_results_*/not_star_*.fa" label="${tool.name} on ${on_string}: not detected star">
163 <filter>detailed_fasta</filter>
164 </data>
165 <data name="novel_mature" format="fasta" from_work_dir="mirna_results_*/novel_mature_*.fa" label="${tool.name} on ${on_string}: novel mature">
166 <filter>detailed_fasta</filter>
167 </data>
168 <data name="novel_pres" format="fasta" from_work_dir="mirna_results_*/novel_pres_*.fa" label="${tool.name} on ${on_string}: novel precursors">
169 <filter>detailed_fasta</filter>
170 </data>
171 <data name="novel_star" format="fasta" from_work_dir="mirna_results_*/novel_star_*.fa" label="${tool.name} on ${on_string}: novel star">
172 <filter>detailed_fasta</filter>
173 </data>
169 </outputs> 174 </outputs>
170 <tests> 175 <tests>
171 <test> 176 <test>
172 <param name="reads" value="reads_collapsed.fa"/> 177 <param name="reads" value="reads_collapsed.fa"/>
173 <param name="genome" value="cel_cluster.fa"/> 178 <param name="genome" value="cel_cluster.fa"/>
174 <param name="mappings" value="reads_collapsed_vs_genome.arf"/> 179 <param name="mappings" value="reads_collapsed_vs_genome.arf"/>
175 <param name="mature_this" value="mature_ref_this_species.fa"/> 180 <param name="mature_this" value="mature_ref_this_species.fa"/>
176 <param name="mature_other" value="mature_ref_other_species.fa"/> 181 <param name="mature_other" value="mature_ref_other_species.fa"/>
177 <param name="precursors" value="precursors_ref_this_species.fa"/> 182 <param name="precursors" value="precursors_ref_this_species.fa"/>
178 183
179 <output name="tab_results" file="result.csv" compare="sim_size"/> 184 <output name="tab_results" file="result.csv" compare="sim_size"/>
180 <output name="prec_acc" file="survey.csv" compare="sim_size"/> 185 <output name="pred_acc" file="survey.csv" compare="sim_size"/>
181 <output name="bed_out" file="result.bed" compare="sim_size"/> 186 <output name="bed_out" file="result.bed" compare="sim_size"/>
182 <output name="mrd_out" file="output.mrd" compare="sim_size"/> 187 <output name="mrd_out" file="output.mrd" compare="sim_size"/>
183 </test> 188 </test>
189 <test>
190 <param name="reads" value="reads_collapsed.fa"/>
191 <param name="genome" value="cel_cluster.fa"/>
192 <param name="mappings" value="reads_collapsed_vs_genome.arf"/>
193 <param name="mature_this" value="mature_ref_this_species.fa"/>
194 <param name="mature_other" value="mature_ref_other_species.fa"/>
195 <param name="precursors" value="precursors_ref_this_species.fa"/>
196 <param name="detailed_fasta" value="true"/>
197
198 <output name="tab_results" file="result.csv" compare="sim_size"/>
199 <output name="pred_acc" file="survey.csv" compare="sim_size"/>
200 <output name="bed_out" file="result.bed" compare="sim_size"/>
201 <output name="mrd_out" file="output.mrd" compare="sim_size"/>
202
203 <output name="known_mature" file="detailed_fasta/known_mature.fa" compare="sim_size"/>
204 <output name="known_pres" file="detailed_fasta/known_pres.fa" compare="sim_size"/>
205 <output name="known_star" file="detailed_fasta/known_star.fa" compare="sim_size"/>
206 <output name="not_mature" file="detailed_fasta/not_mature.fa" compare="sim_size"/>
207 <output name="not_pres" file="detailed_fasta/not_pres.fa" compare="sim_size"/>
208 <output name="not_star" file="detailed_fasta/not_star.fa" compare="sim_size"/>
209 <output name="novel_mature" file="detailed_fasta/novel_mature.fa" compare="sim_size"/>
210 <output name="novel_pres" file="detailed_fasta/novel_pres.fa" compare="sim_size"/>
211 <output name="novel_star" file="detailed_fasta/novel_star.fa" compare="sim_size"/>
212 </test>
184 </tests> 213 </tests>
185 <help> 214 <help>
186 <![CDATA[ 215 <![CDATA[
187 **What MiRDeep2 does** 216
217 **What it does**
188 218
189 MiRDeep2 is a software package for identification of novel and known miRNAs in deep sequencing data. Furthermore, it can be used for miRNA expression profiling across samples. 219 MiRDeep2 is a software package for identification of novel and known miRNAs in deep sequencing data. Furthermore, it can be used for miRNA expression profiling across samples.
220
221 **Input**
222
223 A FASTA file with deep sequencing reads, a FASTA file of the corresponding genome, a file of mapped reads to the genome in miRDeep2 arf format, an optional fasta file with known miRNAs of the analysing species and an option fasta file of known miRNAs of related species.
224
225 Arf format:
226 Is a proprietary file format generated and processed by miRDeep2. It contains information of reads mapped to a reference genome. Each line in such a file contains 13 columns:
227
228 1. read identifier
229 2. length of read sequence
230 3. start position in read sequence that is mapped
231 4. end position in read sequence that is mapped
232 5. read sequence
233 6. identifier of the genome-part to which a read is mapped to. This is either a scaffold id or a chromosome name
234 7. length of the genome sequence a read is mapped to
235 8. start position in the genome where a read is mapped to
236 9. end position in the genome where a read is mapped to
237 10. genome sequence to which a read is mapped
238 11. genome strand information. Plus means the read is aligned to the sense-strand of the genome. Minus means it is aligned to the antisense-strand of the genome.
239 12. Number of mismatches in the read mapping
240 13. Edit string that indicates matches by lowercase 'm' and mismatches by uppercase 'M'
241
242
190 ]]> 243 ]]>
191 </help> 244 </help>
192 <citations> 245 <citations>
193 <citation type="doi">10.1093/nar/gkr688</citation> 246 <citation type="doi">10.1093/nar/gkr688</citation>
194 <citation type="doi">10.1002/0471250953.bi1210s36</citation> 247 <citation type="doi">10.1002/0471250953.bi1210s36</citation>