dia_umpire: dia_umpire_se.xml comparison

comparison dia_umpire_se.xml @ 3:6caa9011f245 draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/dia_umpire commit 2379480213ba2e084a93bf82052fac858ffd074f

author	galaxyp
date	Mon, 04 Mar 2019 11:49:18 -0500
parents	b4f82d15cac0
children	e8822850243a

comparison

equal deleted inserted replaced

-:b4f82d15cac0
+:6caa9011f245
 <tool id="dia_umpire_se" name="DIA_Umpire_SE" version="@VERSION@.0">
 <description>DIA signal extraction</description>
 <macros>
-<import>macros.xml</import>
+<import>dia_umpire_macros.xml</import>
 </macros>
 <expand macro="requirements" />
 <expand macro="stdio" />
 <command>
 <![CDATA[
 #import re
-## want to save all outputs in a directory output.extra_files_path to be used by
+## want to save all outputs in a directory output.extra_files_path to be used by dia_umpire_quant
 ## Is file naming going to be a problem? May need to have a name param
-#set $ser_dir = $se_params.extra_files_path
+#if $se_extraction_data:
+#set se_params = $se_ser
+#set $ser_dir = $se_ser.extra_files_path
 mkdir $ser_dir
-&& ln -s $ser_dir $output_dir
+&& ln -s '$ser_dir' '$output_dir'
+&& cat $se_config > $se_ser
+#else:
+#set se_params = $params
+mkdir '$output_dir'
 && cat $se_config > $se_params
+#end if
 ##
 && echo " " >> $se_params
 && echo "Thread = \$GALAXY_SLOTS" >> $se_params
-#for $i, $input_file in enumerate( $inputs ):
 #if $input_prefix and len($input_prefix.strip()) > 0:
-#set $input_path = $ser_dir + "/" + $input_prefix.__str__ + "_rep" + str($i + 1) + ".mzXML"
+#set $input_path = str($output_dir) + '/' + $input_prefix.__str__ + '_rep' + str($i + 1) + '.mzXML'
 #else:
-#set $input_path = $ser_dir + "/" + $re.sub('\.[mM]\w+$','',$re.sub('[^-a-zA-Z0-9_.]','_',$input_file.name)) + ".mzXML"
+#set $input_path = str($output_dir) + '/' + $re.sub('\.[mM]\w+$','',$re.sub('[^-a-zA-Z0-9_.]','_',$input.name)) + '.mzXML'
 #end if
-&& ln -s "${input_file}" "$input_path"
+&& ln -s '${input}' '$input_path'
-&& java -jar \$DIA_UMPIRE_SE_JAR $input_path $se_params
+&&  dia_umpire_se '$input_path' '$se_params'
 && cat $output_dir/*.log >> "$logfile"
-#end for
+#if not $mgfs_as_collection:
+&& cp "$output_dir/"*_Q1.mgf '$q1_mgf'
+&& cp "$output_dir/"*_Q2.mgf '$q2_mgf'
+&& cp "$output_dir/"*_Q3.mgf '$q3_mgf'
+#end if
+#if $ExportPrecursorPeak:
+&& cp "$output_dir/"*PeakCluster.csv '$PrecursorPeak'
+#end if
 ]]>
 </command>
 <configfiles>
 <configfile name="se_config"><![CDATA[#slurp
 #DIA-Umpire (version @VERSION@)
 #Data Independent Acquisition data processing and analysis package (Signal extraction module)
 #import re
-#for $i, $input_file in enumerate( $inputs ):
 #if $input_prefix:
 #set $input_path = $input_prefix.__str__ + "_rep" + str($i + 1) + ".mzXML"
 #else:
-#set $input_path = $re.sub('\.[mM]\w+$','',$re.sub('[^-a-zA-Z0-9_.]','_',$input_file.name)) + ".mzXML"
+#set $input_path = $re.sub('\.[mM]\w+$','',$re.sub('[^-a-zA-Z0-9_.]','_',$input.name)) + ".mzXML"
 #end if
-# $input_file.name $input_path $input_file
+# $input.name $input_path $input
-#end for
 #No of threads
 Thread = 6
 #Report peak
 SE.EstimateBG = true
 SE.MinNoPeakCluster = 2
 SE.MaxNoPeakCluster = 3#slurp
 #end if
+## SE.RemoveGroupedPeaksRTOverlap
+## SE.RemoveGroupedPeaksCorr
+## SE.IsoCorrThreshold
 #if $instrument.model != 'Thermo_Orbitrap':
 WindowType = $instrument.window.WindowType
 #if $instrument.window.WindowType == 'SWATH':
 WindowSize = #if $instrument.window.WindowSize then $instrument.window.WindowSize else 25#
 #else if $instrument.window.WindowType == 'V_SWATH':
 #slurp]]>
 </configfile>
 </configfiles>
 <inputs>
-<param name="inputs" type="data" format="mzxml" multiple="true" label="Proteomics Spectrum  files in mzXML format"/>
+<param name="input" type="data" format="mzxml" label="Proteomics Spectrum  files in mzXML format"/>
-<param name="input_prefix" type="text" value="" optional="true" label="File name prefix" help="Names inputs: prefix_rep#.mzXML Leave blank to use History names of inputs">
+<param name="input_prefix" type="text" value="" optional="true" label="File name prefix" help="Names inputs: prefix_rep#.mzXML Leave blank to use History names of input">
 <validator type="regex" message="">[a-zA-Z][a-zA-Z0-9_-]*</validator>
 </param>
 <param name="output_dir" type="hidden" value="gx_path"/>
 <conditional name="instrument">
 </help>
 </param>
 </when>
 </conditional>
-<param name="ExportPrecursorPeak" type="boolean" truevalue="true" falsevalue="false" checked="false" label="ExportPrecursorPeak"
+<param name="ExportPrecursorPeak" type="boolean" truevalue="true" falsevalue="false" checked="false"
+label="ExportPrecursorPeak"
 help="Output detailed information about detected MS1 precursor and MS2 unfragmented precursor signals"/>
-<param name="ExportFragmentPeak" type="boolean" truevalue="true" falsevalue="false" checked="false" label="ExportFragmentPeak"
+<param name="ExportFragmentPeak" type="boolean" truevalue="true" falsevalue="false" checked="false"
+label="ExportFragmentPeak"
 help="Output detailed information about detected MS2 signals"/>
+<param name="se_extraction_data" type="boolean" truevalue="Signal Extraction data" falsevalue="diaumpire_se.params" checked="false"
+label="Output Signal Extraction data for DIA_Umpire_Quant" />
+<param name="mgfs_as_collection" type="boolean" truevalue="true" falsevalue="false" checked="false"
+label="Output MGFs as a collection" />
 </inputs>
 <outputs>
-<data format="txt" name="logfile" label="${tool.name} log"/>
+<data format="txt" name="logfile" label="${tool.name} ${on_string} log"/>
-<data format="dia_umpire.ser" name="se_params" label="${tool.name} Signal Extraction data">
+<data format="dia_umpire.ser" name="se_ser" label="${tool.name} ${input.name} ${se_extraction_data}">
-</data>
+<filter>se_extraction_data</filter>
-<data format="csv" name="PrecursorPeak" label="" from_work_dir="gx_path/swath_PeakCurve.csv">
+</data>
+<data format="txt" name="params" label="${tool.name} ${input.name} ${se_extraction_data}">
+<filter>not se_extraction_data</filter>
+</data>
+<data format="csv" name="PrecursorPeak" label="${tool.name} ${input.name} PeakCluster.csv" from_work_dir="gx_path/swath_PeakCurve.csv">
 <filter>ExportPrecursorPeak</filter>
 </data>
+<!--
 <data format="csv" name="FragmentPeak" label="" from_work_dir="gx_path/swath_PeakCurve.csv">
 <filter>ExportFragmentPeak</filter>
 </data>
+-->
 <collection name="dia_umpire_se_mgfs" type="list" label="${tool.name} MGFs">
+<filter>mgfs_as_collection</filter>
 <discover_datasets pattern="(?P&lt;name&gt;.*Q[1-3]\.mgf)" ext="mgf" visible="false" directory="gx_path" />
 </collection>
+<data format="mgf" name="q1_mgf" label="${tool.name} ${($input.name[:-6] if $input.name.endswith('.mxXML') or $input.name.endswith('.mxxml') else $input.name).rsplit('.',1)[0]}_Q1.mgf" >
+<filter>not mgfs_as_collection</filter>
+</data>
+<data format="mgf" name="q2_mgf" label="${tool.name} ${($input.name[:-6] if $input.name.endswith('.mxXML') or $input.name.endswith('.mxxml') else $input.name).rsplit('.',1)[0]}_Q2.mgf" >
+<filter>not mgfs_as_collection</filter>
+</data>
+<data format="mgf" name="q3_mgf" label="${tool.name} ${($input.name[:-6] if $input.name.endswith('.mxXML') or $input.name.endswith('.mxxml') else $input.name).rsplit('.',1)[0]}_Q3.mgf" >
+<filter>not mgfs_as_collection</filter>
+</data>
 </outputs>
 <tests>
 <test>
+<param name="input" value="LongSwath_UPS1_1ug_rep1_xs.mzXML" ftype="mzxml"/>
+<conditional name="instrument">
+<param name="model" value="AB_SCIEX_Triple_TOF_5600"/>
+<param name="SE_MS1PPM" value="30"/>
+<param name="SE_MS2PPM" value="40"/>
+<conditional name="window">
+<param name="WindowType" value="SWATH"/>
+<param name="WindowSize" value="25"/>
+</conditional>
+</conditional>
+<output name="q2_mgf">
+<assert_contents>
+<has_text text="BEGIN IONS" />
+<has_text_matching expression="^PEPMASS=740.\d+$" />
+</assert_contents>
+</output>
 </test>
 </tests>
 <help>
 <![CDATA[
 ================================
 **Input** (DIA-Umpire signal extraction module):
 ================================================
 1. Spectral data in mzXML format
-**Important**: for AB SCIEX data, use AB SCIEX MS Data Converter (http://goo.gl/wf7KRV):
+**Important**: for AB SCIEX data, use AB SCIEX MS Data Converter (https://sciex.com/x32750):
-Use it for .wiff -> .mzML conversion, then use MSConvert for .mzML -> .mzXML. Read "Raw spectral data files conversion to mzXML" section in the manual for more details.
+Galaxy tool:  https://toolshed.g2.bx.psu.edu/view/galaxyp/ms_data_converter/a36e9f847308
+Use it for .wiff -> .mzML conversion, then use MSConvert for .mzML -> .mzXML. Read "Raw spectral data files conversion to mzXML" section in the manual for more details.
 **Signal extraction parameters**:
 =================================
 *SE.MS1PPM*: (Unit: ppm) Maximum mass error for two MS1 peaks in consecutive spectra to be considered signal of the same ion. Used in MS1 signal detection and precursor alignment between samples/runs.  Recommended value: Depends on the instrument. Typical values are 5-10 ppm for Thermo Orbitrap, 20-40 ppm for AB SCIEX Triple TOF 5600.
 **Output files of DIA-Umpire signal extraction module**:
 ========================================================
-1. *DIA_Umpire_SE MGFs* - A Dataset Collection containing three .mgf files per input .mzXML file - pseudo MS/MS spectra sets for different quality categories of detected precursor signals (see the Online Methods of the publication for details). Example:
+1. *DIA_Umpire_SE MGFs* - Three .mgf files per input .mzXML file - pseudo MS/MS spectra sets for different quality categories of detected precursor signals (see the Online Methods of the publication for details). These can be either individual history items or a dataset collection.  Example:
 1. <filename>_Q1.mgf
 2. <filename>_Q2.mgf
 3. <filename>_Q3.mgf

Mercurial > repos > galaxyp > dia_umpire

comparison dia_umpire_se.xml @ 3:6caa9011f245 draft