comparison dia_umpire_se.xml @ 4:e8822850243a draft default tip

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/dia_umpire commit 2379480213ba2e084a93bf82052fac858ffd074f
author galaxyp
date Mon, 04 Mar 2019 11:49:42 -0500
parents 6caa9011f245
children
comparison
equal deleted inserted replaced
3:6caa9011f245 4:e8822850243a
5 </macros> 5 </macros>
6 <expand macro="requirements" /> 6 <expand macro="requirements" />
7 <expand macro="stdio" /> 7 <expand macro="stdio" />
8 <command> 8 <command>
9 <![CDATA[ 9 <![CDATA[
10 #set $output_dir = 'gx_path'
10 #import re 11 #import re
11 ## want to save all outputs in a directory output.extra_files_path to be used by dia_umpire_quant
12 ## Is file naming going to be a problem? May need to have a name param
13 #if $se_extraction_data:
14 #set se_params = $se_ser
15 #set $ser_dir = $se_ser.extra_files_path
16 mkdir $ser_dir
17 && ln -s '$ser_dir' '$output_dir'
18 && cat $se_config > $se_ser
19 #else:
20 #set se_params = $params
21 mkdir '$output_dir' 12 mkdir '$output_dir'
22 && cat $se_config > $se_params 13 && cat $se_config > $se_params
23 #end if
24 ##
25 && echo " " >> $se_params 14 && echo " " >> $se_params
26 && echo "Thread = \$GALAXY_SLOTS" >> $se_params 15 && echo "Thread = \$GALAXY_SLOTS" >> $se_params
27 #if $input_prefix and len($input_prefix.strip()) > 0: 16 #if $input_prefix and len($input_prefix.strip()) > 0:
28 #set $input_path = str($output_dir) + '/' + $input_prefix.__str__ + '_rep' + str($i + 1) + '.mzXML' 17 #set $input_path = str($output_dir) + '/' + $input_prefix.__str__ + '_rep' + str($i + 1) + '.mzXML'
29 #else: 18 #else:
30 #set $input_path = str($output_dir) + '/' + $re.sub('\.[mM]\w+$','',$re.sub('[^-a-zA-Z0-9_.]','_',$input.name)) + '.mzXML' 19 #set $input_path = str($output_dir) + '/' + $re.sub('\.[mM]\w+$','',$re.sub('[^-a-zA-Z0-9_.]','_',$input.element_identifier)) + '.mzXML'
31 #end if 20 #end if
32 && ln -s '${input}' '$input_path' 21 && ln -s '${input}' '$input_path'
33 && dia_umpire_se '$input_path' '$se_params' 22 && dia_umpire_se '$input_path' '$se_params'
34 && cat $output_dir/*.log >> "$logfile" 23 && cat $output_dir/*.log >> "$logfile"
35 #if not $mgfs_as_collection: 24 #if not $mgfs_as_collection:
199 <inputs> 188 <inputs>
200 <param name="input" type="data" format="mzxml" label="Proteomics Spectrum files in mzXML format"/> 189 <param name="input" type="data" format="mzxml" label="Proteomics Spectrum files in mzXML format"/>
201 <param name="input_prefix" type="text" value="" optional="true" label="File name prefix" help="Names inputs: prefix_rep#.mzXML Leave blank to use History names of input"> 190 <param name="input_prefix" type="text" value="" optional="true" label="File name prefix" help="Names inputs: prefix_rep#.mzXML Leave blank to use History names of input">
202 <validator type="regex" message="">[a-zA-Z][a-zA-Z0-9_-]*</validator> 191 <validator type="regex" message="">[a-zA-Z][a-zA-Z0-9_-]*</validator>
203 </param> 192 </param>
204 <param name="output_dir" type="hidden" value="gx_path"/>
205
206 <conditional name="instrument"> 193 <conditional name="instrument">
207 <param name="model" type="select" label="instrument used" help="Sets default parameters"> 194 <param name="model" type="select" label="instrument used" help="Sets default parameters">
208 <option value="Thermo_Orbitrap">Thermo Orbitrap</option> 195 <option value="Thermo_Orbitrap">Thermo Orbitrap</option>
209 <option value="AB_SCIEX_Triple_TOF_5600">AB SCIEX Triple TOF 5600</option> 196 <option value="AB_SCIEX_Triple_TOF_5600">AB SCIEX Triple TOF 5600</option>
210 <option value="other">other</option> 197 <option value="other">other</option>
211 </param> 198 </param>
212 <when value="Thermo_Orbitrap"> 199 <when value="Thermo_Orbitrap">
213
214 <param name="SE_MS1PPM" type="float" value="5" min="1" max="20" optional="true" label="Maximum mass error for two MS1 peaks"> 200 <param name="SE_MS1PPM" type="float" value="5" min="1" max="20" optional="true" label="Maximum mass error for two MS1 peaks">
215 <help> 201 <help>
216 SE.MS1PPM: (Unit: ppm) Maximum mass error for two MS1 peaks in consecutive spectra to be considered signal of the same ion. Used in MS1 signal detection and precursor alignment between samples/runs. 202 SE.MS1PPM: (Unit: ppm) Maximum mass error for two MS1 peaks in consecutive spectra to be considered signal of the same ion. Used in MS1 signal detection and precursor alignment between samples/runs.
217 Recommended value: Depends on the instrument. Typical values are 5-10 ppm for Thermo Orbitrap. 203 Recommended value: Depends on the instrument. Typical values are 5-10 ppm for Thermo Orbitrap.
218 </help> 204 </help>
222 SE.MS2PPM: (Unit: ppm) Maximum mass error for two MS2 peaks in consecutive spectra to be considered signal of the same ion. 208 SE.MS2PPM: (Unit: ppm) Maximum mass error for two MS2 peaks in consecutive spectra to be considered signal of the same ion.
223 Recommended value: Depends on the instrument. If fragmentation spectra are measured with the same detector as MS1 spectra, set the same as Para.MS1PPM or a little higher, e.g. if you've set Para.MS1PPM=30 ppm for AB SCIEX Triple TOF 5600, consider setting to 40ppm. 209 Recommended value: Depends on the instrument. If fragmentation spectra are measured with the same detector as MS1 spectra, set the same as Para.MS1PPM or a little higher, e.g. if you've set Para.MS1PPM=30 ppm for AB SCIEX Triple TOF 5600, consider setting to 40ppm.
224 </help> 210 </help>
225 </param> 211 </param>
226 <expand macro="common_se_params" /> 212 <expand macro="common_se_params" />
227
228 </when> 213 </when>
229 <when value="AB_SCIEX_Triple_TOF_5600"> 214 <when value="AB_SCIEX_Triple_TOF_5600">
230 <param name="SE_MS1PPM" type="float" value="30" min="1" max="50" optional="true" label="Maximum mass error for two MS1 peaks"> 215 <param name="SE_MS1PPM" type="float" value="30" min="1" max="50" optional="true" label="Maximum mass error for two MS1 peaks">
231 <help> 216 <help>
232 SE.MS1PPM: (Unit: ppm) Maximum mass error for two MS1 peaks in consecutive spectra to be considered signal of the same ion. Used in MS1 signal detection and precursor alignment between samples/runs. 217 SE.MS1PPM: (Unit: ppm) Maximum mass error for two MS1 peaks in consecutive spectra to be considered signal of the same ion. Used in MS1 signal detection and precursor alignment between samples/runs.
285 <param name="RTOverlap" type="float" value=".3" min="0" optional="true" label="RTOverlap" > 270 <param name="RTOverlap" type="float" value=".3" min="0" optional="true" label="RTOverlap" >
286 <help> 271 <help>
287 RTOverlap: Retention time overlap. (Default: 0.3) 272 RTOverlap: Retention time overlap. (Default: 0.3)
288 </help> 273 </help>
289 </param> 274 </param>
290
291 <param name="DeltaApex" type="float" value=".6" min="0" optional="true" label="DeltaApex" > 275 <param name="DeltaApex" type="float" value=".6" min="0" optional="true" label="DeltaApex" >
292 <help> 276 <help>
293 DeltaApex: (Unit: minute) Maximum retention time difference of LC profile apexes between precursor and fragment (the lower, the more stringent). (Default: 0.6) 277 DeltaApex: (Unit: minute) Maximum retention time difference of LC profile apexes between precursor and fragment (the lower, the more stringent). (Default: 0.6)
294 </help> 278 </help>
295 </param> 279 </param>
311 <option value="no">no</option> 295 <option value="no">no</option>
312 <option value="yes">yes</option> 296 <option value="yes">yes</option>
313 </param> 297 </param>
314 <when value="no"/> 298 <when value="no"/>
315 <when value="yes"> 299 <when value="yes">
316
317 <param name="SE_MinMSIntensity" type="float" value="" optional="true" label="MinMSIntensity" > 300 <param name="SE_MinMSIntensity" type="float" value="" optional="true" label="MinMSIntensity" >
318 <help> 301 <help>
319 SE.MinMSIntensity: Minimum signal intensity for a peak in an MS1 spectrum to be considered as a valid signal. Any MS1 peak having intensity lower than this threshold will be ignored. It is the main parameter controlling how many peaks and isotopic envelopes will be detected. 302 SE.MinMSIntensity: Minimum signal intensity for a peak in an MS1 spectrum to be considered as a valid signal. Any MS1 peak having intensity lower than this threshold will be ignored. It is the main parameter controlling how many peaks and isotopic envelopes will be detected.
320 Recommended value: Depends on the data. Check raw data for average noise- levels. E.g. TOF data often have thousands of random small intensity peaks. 303 Recommended value: Depends on the data. Check raw data for average noise- levels. E.g. TOF data often have thousands of random small intensity peaks.
321 Warning: Setting this parameter too low (or zero) in such a case will significantly increase processing time and memory requirements. 304 Warning: Setting this parameter too low (or zero) in such a case will significantly increase processing time and memory requirements.
376 </help> 359 </help>
377 </param> 360 </param>
378 361
379 <param name="SE_MinRTRange" type="float" value="" optional="true" label="MinRTRange" > 362 <param name="SE_MinRTRange" type="float" value="" optional="true" label="MinRTRange" >
380 <help> 363 <help>
381
382 </help> 364 </help>
383 </param> 365 </param>
384 <param name="SE_MaxNoPeakCluster" type="integer" value="" optional="true" label="MaxNoPeakCluster" > 366 <param name="SE_MaxNoPeakCluster" type="integer" value="" optional="true" label="MaxNoPeakCluster" >
385 <help> 367 <help>
386 SE.MaxNoPeakCluster (new parameter in v1.4): Maximum number of isotope peaks for a precursor feature. 368 SE.MaxNoPeakCluster (new parameter in v1.4): Maximum number of isotope peaks for a precursor feature.
392 </help> 374 </help>
393 </param> 375 </param>
394 <param name="SE_MinMS2NoPeakCluster" type="integer" value="" optional="true" label="MinMS2NoPeakCluster" > 376 <param name="SE_MinMS2NoPeakCluster" type="integer" value="" optional="true" label="MinMS2NoPeakCluster" >
395 <help> 377 <help>
396 SE.MinMS2NoPeakCluster (new parameter in v1.4): Minimum number of isotope peaks for a MS2 feature. When it is set as 1, the algorithm will group fragments even for peaks without any isotope signal being found. For these cases, the assumed charged states will be from the parameter SE.StartCharge to SE.EndCharge. 378 SE.MinMS2NoPeakCluster (new parameter in v1.4): Minimum number of isotope peaks for a MS2 feature. When it is set as 1, the algorithm will group fragments even for peaks without any isotope signal being found. For these cases, the assumed charged states will be from the parameter SE.StartCharge to SE.EndCharge.
397
398 </help> 379 </help>
399 </param> 380 </param>
400 <param name="SE_RTtol" type="float" value="" optional="true" label="RTtol" > 381 <param name="SE_RTtol" type="float" value="" optional="true" label="RTtol" >
401 <help> 382 <help>
402 </help> 383 </help>
435 label="ExportPrecursorPeak" 416 label="ExportPrecursorPeak"
436 help="Output detailed information about detected MS1 precursor and MS2 unfragmented precursor signals"/> 417 help="Output detailed information about detected MS1 precursor and MS2 unfragmented precursor signals"/>
437 <param name="ExportFragmentPeak" type="boolean" truevalue="true" falsevalue="false" checked="false" 418 <param name="ExportFragmentPeak" type="boolean" truevalue="true" falsevalue="false" checked="false"
438 label="ExportFragmentPeak" 419 label="ExportFragmentPeak"
439 help="Output detailed information about detected MS2 signals"/> 420 help="Output detailed information about detected MS2 signals"/>
440 <param name="se_extraction_data" type="boolean" truevalue="Signal Extraction data" falsevalue="diaumpire_se.params" checked="false"
441 label="Output Signal Extraction data for DIA_Umpire_Quant" />
442 <param name="mgfs_as_collection" type="boolean" truevalue="true" falsevalue="false" checked="false" 421 <param name="mgfs_as_collection" type="boolean" truevalue="true" falsevalue="false" checked="false"
443 label="Output MGFs as a collection" /> 422 label="Output MGFs as a collection" />
444 423
445 </inputs> 424 </inputs>
446 425
447 <outputs> 426 <outputs>
448 <data format="txt" name="logfile" label="${tool.name} ${on_string} log"/> 427 <data format="txt" name="logfile" label="${tool.name} ${on_string} log"/>
449 <data format="dia_umpire.ser" name="se_ser" label="${tool.name} ${input.name} ${se_extraction_data}"> 428 <data format="txt" name="se_params" label="${tool.name} ${input.name} diaumpire_se.params"/>
450 <filter>se_extraction_data</filter>
451 </data>
452 <data format="txt" name="params" label="${tool.name} ${input.name} ${se_extraction_data}">
453 <filter>not se_extraction_data</filter>
454 </data>
455 <data format="csv" name="PrecursorPeak" label="${tool.name} ${input.name} PeakCluster.csv" from_work_dir="gx_path/swath_PeakCurve.csv"> 429 <data format="csv" name="PrecursorPeak" label="${tool.name} ${input.name} PeakCluster.csv" from_work_dir="gx_path/swath_PeakCurve.csv">
456 <filter>ExportPrecursorPeak</filter> 430 <filter>ExportPrecursorPeak</filter>
457 </data> 431 </data>
458 <!-- 432 <!--
459 <data format="csv" name="FragmentPeak" label="" from_work_dir="gx_path/swath_PeakCurve.csv"> 433 <data format="csv" name="FragmentPeak" label="" from_work_dir="gx_path/swath_PeakCurve.csv">
487 </conditional> 461 </conditional>
488 </conditional> 462 </conditional>
489 <output name="q2_mgf"> 463 <output name="q2_mgf">
490 <assert_contents> 464 <assert_contents>
491 <has_text text="BEGIN IONS" /> 465 <has_text text="BEGIN IONS" />
492 <has_text_matching expression="^PEPMASS=740.\d+$" /> 466 <has_text text="PEPMASS=740" />
493 </assert_contents> 467 </assert_contents>
494 </output> 468 </output>
495 </test> 469 </test>
496 </tests> 470 </tests>
497 <help> 471 <help>
559 2. <filename>_Q2.mgf 533 2. <filename>_Q2.mgf
560 3. <filename>_Q3.mgf 534 3. <filename>_Q3.mgf
561 535
562 Note: Each file corresponds to a different "quality level" of precursor ions (Q1= More than two isotopic peaks detected in MS1, Q2 = only two isotopic peak detected, Q3 = detected unfragmented precursor in MS2). These spectra are written to separate files, because they must be searched separately against a protein database as a consequence of differences in FDR estimates for these varying quality data. 536 Note: Each file corresponds to a different "quality level" of precursor ions (Q1= More than two isotopic peaks detected in MS1, Q2 = only two isotopic peak detected, Q3 = detected unfragmented precursor in MS2). These spectra are written to separate files, because they must be searched separately against a protein database as a consequence of differences in FDR estimates for these varying quality data.
563 537
564 2. *DIA_Umpire_SE Signal Extraction data* - includes the binary files (.ser) containing contain all necessary information for quantitation procedures (parameter settings, all detected precursor and fragment peaks, precursor-fragment grouping information). 538 2. If ExportPrecursorPeak and/or ExportFragmentPeak options were set to true, text files with detailed information about detected MS1 and/or MS2 features will be generated.
565
566 3. If ExportPrecursorPeak and/or ExportFragmentPeak options were set to true, text files with detailed information about detected MS1 and/or MS2 features will be generated.
567 539
568 540
569 ]]> 541 ]]>
570 </help> 542 </help>
571 <expand macro="citations" /> 543 <expand macro="citations" />