comparison msnbase_readmsdata.xml @ 0:24f7d4e5c186 draft

planemo upload for repository https://github.com/workflow4metabolomics/xcms commit f01148783819c37e474790dbd56619862960448a-dirty
author lecorguille
date Tue, 03 Apr 2018 11:50:50 -0400
parents
children fa17ee3bc9ce
comparison
equal deleted inserted replaced
-1:000000000000 0:24f7d4e5c186
1 <tool id="msnbase_readmsdata" name="MSnbase readMSData" version="@WRAPPER_VERSION@.0">
2 <description>Imports mass-spectrometry raw data files</description>
3
4 <macros>
5 <import>macros.xml</import>
6 <import>macros_msnbase.xml</import>
7 </macros>
8
9 <expand macro="requirements"/>
10 <expand macro="stdio"/>
11
12 <command><![CDATA[
13 @COMMAND_RSCRIPT@/msnbase_readmsdata.r
14
15 #if $input.is_of_type("mzxml") or $input.is_of_type("mzml") or $input.is_of_type("mzdata") or $input.is_of_type("netcdf"):
16 singlefile_galaxyPath '$input' singlefile_sampleName '$input.name'
17 #else
18 zipfile '$input'
19 #end if
20
21 @COMMAND_LOG_EXIT@
22 ]]></command>
23
24 <inputs>
25
26 <param name="input" type="data" format="mzxml,mzml,mzdata,netcdf,no_unzip.zip,zip" label="File(s) from your history containing your chromatograms" help="Single file mode for the format: mzxml, mzml, mzdata and netcdf. Zip file mode for the format: no_unzip.zip, zip. See the help section below." />
27
28 </inputs>
29
30 <outputs>
31 <data name="xsetRData" format="rdata.msnbase.raw" label="${input.name.rsplit('.',1)[0]}.raw.RData" from_work_dir="readmsdata.RData" />
32 <data name="sampleMetadata" format="tabular" label="${input.name.rsplit('.',1)[0]}.sampleMetadata.tsv" from_work_dir="sampleMetadata.tsv" >
33 <filter>input.extension not in ["mzxml","mzml","mzdata","netcdf"]</filter>
34 </data>
35 </outputs>
36
37 <tests>
38
39 <test>
40 <param name="input" value="faahKO_reduce.zip" ftype="zip" />
41 <assert_stdout>
42 <has_text text="rowNames: faahKO_reduce/KO/ko15.CDF faahKO_reduce/KO/ko16.CDF" />
43 <has_text text="faahKO_reduce/WT/wt15.CDF faahKO_reduce/WT/wt16.CDF" />
44 <has_text text="featureNames: F1.S0001 F1.S0002 ... F4.S1278 (5112 total)" />
45 <has_text text="fvarLabels: fileIdx spIdx ... spectrum (27 total)" />
46 <has_text text="faahKO_reduce/KO/ko15.CDF ko15 KO" />
47 <has_text text="faahKO_reduce/KO/ko16.CDF ko16 KO" />
48 <has_text text="faahKO_reduce/WT/wt15.CDF wt15 WT" />
49 <has_text text="faahKO_reduce/WT/wt16.CDF wt16 WT" />
50 </assert_stdout>
51 <output name="sampleMetadata" value="sampleMetadata.tsv" />
52 </test>
53 <test>
54 <param name="input" value="ko15.CDF" ftype="netcdf" />
55 <assert_stdout>
56 <has_text text="rowNames: ./ko15.CDF" />
57 <has_text text="ko15.CDF" />
58 <has_text text="featureNames: F1.S0001 F1.S0002 ... F1.S1278 (1278 total)" />
59 <has_text text="fvarLabels: fileIdx spIdx ... spectrum (27 total)" />
60 <has_text text="./ko15.CDF ko15 ." />
61 </assert_stdout>
62 </test>
63 <!-- DISABLE FOR TRAVIS
64 Useful to generate test-data for the further steps
65 <test>
66 <param name="input" value="ko16.CDF" ftype="netcdf" />
67 <assert_stdout>
68 <has_text text="rowNames: ./ko16.CDF" />
69 <has_text text="ko16.CDF" />
70 <has_text text="./ko16.CDF ko16 ." />
71 </assert_stdout>
72 </test>
73 <test>
74 <param name="input" value="wt15.CDF" ftype="netcdf" />
75 <assert_stdout>
76 <has_text text="rowNames: ./wt15.CDF" />
77 <has_text text="wt15.CDF" />
78 <has_text text="./wt15.CDF wt15 ." />
79 </assert_stdout>
80 </test>
81 <test>
82 <param name="input" value="wt16.CDF" ftype="netcdf" />
83 <assert_stdout>
84 <has_text text="rowNames: ./wt16.CDF" />
85 <has_text text="wt16.CDF" />
86 <has_text text="./wt16.CDF wt16 ." />
87 </assert_stdout>
88 </test>
89 -->
90 </tests>
91
92 <help><![CDATA[
93
94 @HELP_AUTHORS@
95
96 ==================
97 MSnbase readMSData
98 ==================
99
100 -----------
101 Description
102 -----------
103
104 Reads as set of XML-based mass-spectrometry data files and
105 generates an MSnExp object. This function uses the functionality
106 provided by the ‘mzR’ package to access data and meta data in
107 ‘mzData’, ‘mzXML’ and ‘mzML’.
108
109 .. _xcms: https://bioconductor.org/packages/release/bioc/html/xcms.html
110 .. _here: http://web11.sb-roscoff.fr/download/w4m/howto/w4m_HowToPerformXcmsPreprocessing_v02.pdf
111
112
113 -----------------
114 Workflow position
115 -----------------
116
117 **Upstream tools**
118
119 ========================= ================= ======= =========
120 Name output file format parameter
121 ========================= ================= ======= =========
122 NA NA zip NA
123 ========================= ================= ======= =========
124
125
126 **Downstream tools**
127
128 =========================== ==================== ====================
129 Name Output file Format
130 =========================== ==================== ====================
131 xcms.findChromPeaks xset.RData rdata.msnbase.raw
132 --------------------------- -------------------- --------------------
133 PCA ellipsoid by factors sampleMetadata.tsv Tabular
134 --------------------------- -------------------- --------------------
135 Anova sampleMetadata.tsv Tabular
136 =========================== ==================== ====================
137
138
139
140 **Example of a metabolomic workflow**
141
142 .. image:: mnsbase_readmsdata_workflow.png
143
144 ---------------------------------------------------
145
146
147
148 -----------
149 Input files
150 -----------
151
152 =========================== ==================================
153 Parameter : num + label Format
154 =========================== ==================================
155 OR : Zip file zip
156 --------------------------- ----------------------------------
157 OR : Single file mzXML, mzML, mzData, netCDF
158 =========================== ==================================
159
160 **Choose your inputs**
161
162 You have two methods for your inputs:
163
164 | Single file (recommended): You can put a single file as input. That way, you will be able to launch several xcmsSet in parallel and use "xcms.xcmsSet Merger" before "xcms.group"
165 | Zip file: You can put a zip file containing your inputs: myinputs.zip (containing all your conditions as sub-directories).
166
167 Zip file: Steps for creating the zip file
168 -----------------------------------------
169
170 **Step1: Creating your directory and hierarchize the subdirectories**
171
172
173 VERY IMPORTANT: If you zip your files under Windows, you must use the 7Zip_ software, otherwise your zip will not be well unzipped on the platform W4M (zip corrupted bug).
174
175 .. _7Zip: http://www.7-zip.org/
176
177 Your zip should contain all your conditions as sub-directories. For example, two conditions (mutant and wild):
178 arabidopsis/wild/01.raw
179 arabidopsis/mutant/01.raw
180
181 **Step2: Creating a zip file**
182
183 Create your zip file (e.g.: arabidopsis.zip).
184
185 **Step 3 : Uploading it to our Galaxy server**
186
187 If your zip file is less than 2Gb, you get use the Get Data tool to upload it.
188
189 Otherwise if your zip file is larger than 2Gb, please refer to the HOWTO_ on workflow4metabolomics.org.
190
191 .. _HOWTO: http://application.sb-roscoff.fr/download/w4m/howto/galaxy_upload_up_2Go.pdf
192
193 For more informations, don't hesitate to send us an email at supportATworkflow4metabolomics.org).
194
195 Advices for converting your files for the XCMS input
196 ----------------------------------------------------
197
198 We recommend you to convert your raw files to **mzXML** in centroid mode (smaller files) and the files will be compatible with the xmcs centWave method.
199
200 **We recommend you the following parameters:**
201
202 Use Filtering: **True**
203
204 Use Peak Picking: **True**
205
206 Peak Peaking -Apply to MS Levels: **All Levels (1-)** : Centroid Mode
207
208 Use zlib: **64**
209
210 Binary Encoding: **64**
211
212 m/z Encoding: **64**
213
214 Intensity Encoding: **64**
215
216
217 ------------
218 Output files
219 ------------
220
221 sampleMetadata.tsv
222
223 | Tabular file that contains for each sample, it's associated class and polarity (positive,negative and mixed).
224 | This file is necessary in the Anova and PCA step of the workflow.
225
226 xset.RData: rdata.msnbase.raw format
227
228 | Rdata file that is necessary in the second step of the workflow "xcms.findChromPeaks".
229
230 ---------------------------------------------------
231
232 Changelog/News
233 --------------
234
235
236 **Version 2.4.0.0 - 29/03/2018**
237
238 - NEW: a new dedicated tool to read the raw data. This function was previously included in xcms.findChromPeaks. This way, you will now be able to display TICs and BPCs before xcms.findChromPeaks.
239
240 ]]></help>
241
242 <expand macro="citation" />
243 </tool>