Mercurial > repos > ethevenot > heatmap
comparison heatmap_config.xml @ 0:81ffd91ba495 draft default tip
planemo upload for repository https://github.com/workflow4metabolomics/heatmap.git commit bbfc13f2e4fa9e7e5b562c96d0e570318d3482d9
| author | ethevenot |
|---|---|
| date | Tue, 24 Oct 2017 09:32:23 -0400 |
| parents | |
| children |
comparison
equal
deleted
inserted
replaced
| -1:000000000000 | 0:81ffd91ba495 |
|---|---|
| 1 <tool id="Heatmap" name="Heatmap" version="2.2.2"> | |
| 2 <description>Heatmap of the dataMatrix</description> | |
| 3 | |
| 4 <requirements> | |
| 5 <requirement type="package">r-batch</requirement> | |
| 6 </requirements> | |
| 7 | |
| 8 <stdio> | |
| 9 <exit_code range="1:" level="fatal" /> | |
| 10 </stdio> | |
| 11 | |
| 12 <command><![CDATA[ | |
| 13 Rscript $__tool_directory__/heatmap_wrapper.R | |
| 14 | |
| 15 dataMatrix_in "$dataMatrix_in" | |
| 16 sampleMetadata_in "$sampleMetadata_in" | |
| 17 variableMetadata_in "$variableMetadata_in" | |
| 18 | |
| 19 disC "$disC" | |
| 20 cutSamN "$cutSamN" | |
| 21 cutVarN "$cutVarN" | |
| 22 | |
| 23 #if $advPar.oppC == "full" | |
| 24 corMetC "$advPar.corMetC" | |
| 25 aggMetC "$advPar.aggMetC" | |
| 26 colC "$advPar.colC" | |
| 27 scaL "$advPar.scaL" | |
| 28 cexN "$advPar.cexN" | |
| 29 #end if | |
| 30 | |
| 31 dataMatrix_out "$dataMatrix_out" | |
| 32 sampleMetadata_out "$sampleMetadata_out" | |
| 33 variableMetadata_out "$variableMetadata_out" | |
| 34 figure "$figure" | |
| 35 information "$information" | |
| 36 ]]></command> | |
| 37 | |
| 38 <inputs> | |
| 39 <param name="dataMatrix_in" type="data" label="Data matrix file" help="" format="tabular" /> | |
| 40 <param name="sampleMetadata_in" type="data" label="Sample metadata file" help="" format="tabular" /> | |
| 41 <param name="variableMetadata_in" type="data" label="Variable metadata file" help="" format="tabular" /> | |
| 42 | |
| 43 <param name="disC" label="Dissimilarity to be used for clustering" type="select" help="If correlation is selected, the pearson method will be used by default unless a specific method is selected in the advanced parameters below"> | |
| 44 <option value="euclidean">euclidean</option> | |
| 45 <option value="maximum">maximum</option> | |
| 46 <option value="manhattan">manhattan</option> | |
| 47 <option value="canberra">canberra</option> | |
| 48 <option value="binary">binary</option> | |
| 49 <option value="minkowski">minkowski</option> | |
| 50 <option value="1-cor" selected="true">1-correlation</option> | |
| 51 <option value="1-abs(cor)">1-abs(correlation)</option> | |
| 52 </param> | |
| 53 | |
| 54 <param name="cutSamN" label="Number of sample clusters to identify" type="select" help=""> | |
| 55 <option value="1" selected="true">1</option> | |
| 56 <option value="2">2</option> | |
| 57 <option value="3">3</option> | |
| 58 <option value="4">4</option> | |
| 59 <option value="5">5</option> | |
| 60 <option value="6">6</option> | |
| 61 <option value="7">7</option> | |
| 62 <option value="8">8</option> | |
| 63 <option value="9">9</option> | |
| 64 <option value="10">10</option> | |
| 65 <option value="11">11</option> | |
| 66 <option value="12">12</option> | |
| 67 <option value="13">13</option> | |
| 68 <option value="14">14</option> | |
| 69 <option value="15">15</option> | |
| 70 </param> | |
| 71 | |
| 72 <param name="cutVarN" label="Number of variable clusters to identify" type="select" help=""> | |
| 73 <option value="1" selected="true">1</option> | |
| 74 <option value="2">2</option> | |
| 75 <option value="3">3</option> | |
| 76 <option value="4">4</option> | |
| 77 <option value="5">5</option> | |
| 78 <option value="6">6</option> | |
| 79 <option value="7">7</option> | |
| 80 <option value="8">8</option> | |
| 81 <option value="9">9</option> | |
| 82 <option value="10">10</option> | |
| 83 <option value="11">11</option> | |
| 84 <option value="12">12</option> | |
| 85 <option value="13">13</option> | |
| 86 <option value="14">14</option> | |
| 87 <option value="15">15</option> | |
| 88 </param> | |
| 89 | |
| 90 <conditional name="advPar"> | |
| 91 <param name="oppC" type="select" label="Advanced parameters" > | |
| 92 <option value="default" selected="true">Use default</option> | |
| 93 <option value="full">Full list</option> | |
| 94 </param> | |
| 95 <when value="default"> | |
| 96 <param name="corMetC" type="hidden" value="pearson"/> | |
| 97 <param name="aggMetC" type="hidden" value="ward"/> | |
| 98 <param name="colC" type="hidden" value="blueOrangeRed"/> | |
| 99 <param name="scaL" type="hidden" value="TRUE"/> | |
| 100 <param name="cexN" type="hidden" value="0.8"/> | |
| 101 </when> | |
| 102 <when value="full"> | |
| 103 <param name="corMetC" label="Method of correlation to be used" type="select" help=""> | |
| 104 <option value="pearson" selected="true">pearson</option> | |
| 105 <option value="spearman">spearman</option> | |
| 106 <option value="kendall">kendall</option> | |
| 107 </param> | |
| 108 <param name="aggMetC" label="Method of agglomeration to be used" type="select" help=""> | |
| 109 <option value="ward" selected="true">ward</option> | |
| 110 <option value="single">single</option> | |
| 111 <option value="complete">complete</option> | |
| 112 <option value="average">average</option> | |
| 113 <option value="mcquitty">mcquitty</option> | |
| 114 <option value="median">median</option> | |
| 115 <option value="centroid">centroid</option> | |
| 116 </param> | |
| 117 <param name="colC" label="Color scale" type="select" help=""> | |
| 118 <option value="blueOrangeRed" selected="true">blue-orange-red</option> | |
| 119 <option value="redBlackGreen">red-black-green</option> | |
| 120 </param> | |
| 121 <param name="scaL" label="Variable standardization (for plotting only)" type="select" help="Standardization is performed after the clustering for display only (may enhance contrast) and does not modify cluster computation nor intensities in the output files"> | |
| 122 <option value="TRUE" selected="true">yes</option> | |
| 123 <option value="FALSE">no</option> | |
| 124 </param> | |
| 125 <param name="cexN" label="Size of labels" type="select" help=""> | |
| 126 <option value="0.5">0.5</option> | |
| 127 <option value="0.6">0.6</option> | |
| 128 <option value="0.7">0.7</option> | |
| 129 <option value="0.8" selected="true">0.8</option> | |
| 130 <option value="0.9">0.9</option> | |
| 131 <option value="1">1</option> | |
| 132 </param> | |
| 133 </when> | |
| 134 </conditional> | |
| 135 | |
| 136 </inputs> | |
| 137 | |
| 138 <outputs> | |
| 139 <data name="dataMatrix_out" label="${tool.name}_${dataMatrix_in.name}" format="tabular" ></data> | |
| 140 <data name="sampleMetadata_out" label="${tool.name}_${sampleMetadata_in.name}" format="tabular" ></data> | |
| 141 <data name="variableMetadata_out" label="${tool.name}_${variableMetadata_in.name}" format="tabular" ></data> | |
| 142 <data name="figure" label="${tool.name}_figure.pdf" format="pdf"/> | |
| 143 <data name="information" label="${tool.name}_information.txt" format="txt"/> | |
| 144 </outputs> | |
| 145 | |
| 146 <tests> | |
| 147 <test> | |
| 148 <param name="dataMatrix_in" value="input-dataMatrix.tsv"/> | |
| 149 <param name="sampleMetadata_in" value="input-sampleMetadata.tsv"/> | |
| 150 <param name="variableMetadata_in" value="input-variableMetadata.tsv"/> | |
| 151 <param name="disC" value="1-cor"/> | |
| 152 <param name="cutSamN" value="4"/> | |
| 153 <param name="cutVarN" value="3"/> | |
| 154 <param name="oppC" value="full"/> | |
| 155 <param name="corMetC" value="spearman"/> | |
| 156 <param name="aggMetC" value="ward"/> | |
| 157 <param name="colC" value="blueOrangeRed"/> | |
| 158 <param name="scaL" value="TRUE"/> | |
| 159 <param name="cexN" value="0.8"/> | |
| 160 <output name="variableMetadata_out" file="output-variableMetadata.tsv"/> | |
| 161 </test> | |
| 162 </tests> | |
| 163 | |
| 164 <help> | |
| 165 | |
| 166 .. class:: infomark | |
| 167 | |
| 168 | **Tool update: See the 'NEWS' section at the bottom of the page** | |
| 169 | |
| 170 --------------------------------------------------- | |
| 171 | |
| 172 .. class:: infomark | |
| 173 | |
| 174 **Author** Etienne Thevenot (W4M Core Development Team, MetaboHUB Paris, CEA) | |
| 175 | |
| 176 --------------------------------------------------- | |
| 177 | |
| 178 .. class:: infomark | |
| 179 | |
| 180 **References** | |
| 181 | |
| 182 | Etienne A. Thevenot, Aurelie Roux, Ying Xu, Eric Ezan, and Christophe Junot (2015). Analysis of the human adult urinary metabolome variations with age, body mass index and gender by implementing a comprehensive workflow for univariate and OPLS statistical analyses. *Journal of Proteome Research*, **14**:3322-3335 (http://dx.doi.org/10.1021/acs.jproteome.5b00354). | |
| 183 | R Core Team (2013). R: A language and environment for statistical computing. R Foundation for Statistical Computing, Vienna, Austria (http://www.r-project.org) | |
| 184 | | |
| 185 | |
| 186 --------------------------------------------------- | |
| 187 | |
| 188 .. class:: infomark | |
| 189 | |
| 190 **Tool updates** | |
| 191 | |
| 192 See the **NEWS** section at the bottom of this page | |
| 193 | |
| 194 --------------------------------------------------- | |
| 195 | |
| 196 | |
| 197 ======================== | |
| 198 Heatmap | |
| 199 ======================== | |
| 200 | |
| 201 ----------- | |
| 202 Description | |
| 203 ----------- | |
| 204 | |
| 205 | Performs hierarchical clustering on both the samples (rows) and variables (columns) of the dataMatrix | |
| 206 | Displays the dataMatrix with sorted rows and samples and the dendrograms (heatmap) | |
| 207 | In the output dataMatrix, sampleMetadata and variableMetadata files sample and variables are sorted according to the dendrograms | |
| 208 | Optionally, indicates the groups of samples and/or variables obtained by cutting the dendrograms into a specific number of partitions | |
| 209 | | |
| 210 | Note: 1) Computations rely on the 'hclust' function. The dissimilarity is 1 - cor (where cor is the Spearman correlation) and the 'ward.D' aggregating method is used. | |
| 211 | 2) A "blue-orange-red" palette is generated with the function 'colorRampPalette'; **By default, variables are standardized (mean-centered and unit-scaled) to enhance contrast on the figure**; standardization can be turned off by using the full list of parameters; in any case, standardizing is performed after the computation of clusters, for display only | |
| 212 | 3) When a specific number of sample and/or variable groups (i.e. > 1) are selected, the group numbers are indicated on the plot and in an additional 'heat_clust" column in the sampleMetadata and/or variableMetadata | |
| 213 | 4) Example of computation times: for 126 variables: a few seconds; for 4324 variables: 30 min | |
| 214 | | |
| 215 | |
| 216 | |
| 217 ----------------- | |
| 218 Workflow position | |
| 219 ----------------- | |
| 220 | |
| 221 | In the workflow example below, the structure of the dataset (dataMatrix) is visualized by using first the "Quality Metrics" (for checking potential signal drift, sample outliers, etc.), then the "Heatmap" (for correlations between samples or variables), and finally the "Multivariate" (for PCA or PLS) modules. | |
| 222 | | |
| 223 | |
| 224 .. image:: heatmap_workflowPositionImage.png | |
| 225 :width: 600 | |
| 226 | |
| 227 | |
| 228 | |
| 229 ----------- | |
| 230 Input files | |
| 231 ----------- | |
| 232 | |
| 233 +--------------------------+-------------+ | |
| 234 | File type | Format | | |
| 235 +==========================+=============+ | |
| 236 | 1 : Data matrix | tabular | | |
| 237 +--------------------------+-------------+ | |
| 238 | 2 : Sample metadata | tabular | | |
| 239 +--------------------------+-------------+ | |
| 240 | 3 : Variable metadata | tabular | | |
| 241 +--------------------------+-------------+ | |
| 242 | |
| 243 | | |
| 244 | Required formats for the dataMatrix, sampleMetadata and variableMetadata files are described in the HowTo entitled 'Format Data For Postprocessing' available on the main page of Workflow4Metabolomics.org; formats of the three files can be further checked with the 'Check Data' module (in the 'Quality Control' section) | |
| 245 | | |
| 246 | |
| 247 ---------- | |
| 248 Parameters | |
| 249 ---------- | |
| 250 | |
| 251 Number of sample clusters | |
| 252 | By default (cluster = 1), only dendrograms are displayed; when a specific number of sample clusters is selected, the sample dendrogram is cut at the corresponding level: the sample groups are displayed on the dendrogram and a "heat_clust" column is added in the sampleMetadata file with the group of each sample | |
| 253 | | |
| 254 | |
| 255 Number of variable clusters | |
| 256 | Same as above for variables | |
| 257 | | |
| 258 | |
| 259 Standardization (Full list) | |
| 260 | By default, variables are standardized for display to enhance contrast of the heatmap (note that standardization is performed after the clustering for display only and does not modify cluster computation nor intensities in the output files) | |
| 261 | | |
| 262 | |
| 263 Size of labels (Full list) | |
| 264 | The size of sample and variable names on the heatmap is 0.8 (note that names with more than 14 characters are truncated); this number may be lowered (or uppered) in case of many (few) names to display | |
| 265 | |
| 266 | |
| 267 ------------ | |
| 268 Output files | |
| 269 ------------ | |
| 270 | |
| 271 dataMatrix_out.tabular | |
| 272 | dataMatrix file with rows and columns sorted according to the dendrogram | |
| 273 | | |
| 274 | |
| 275 sampleMetadata_out.tabular | |
| 276 | sampleMetadata file with rows sorted according to the sample dendrogram; in case a number of sample groups is specified, and additional "heat_clust" column is added with the cluster group of each sample | |
| 277 | | |
| 278 | |
| 279 variableMetadata_out.tabular | |
| 280 | variableMetadata file with rows sorted according to the variable dendrogram; in case a number of variable groups is specified, and additional "heat_clust" column is added with the cluster group of each variable | |
| 281 | | |
| 282 | |
| 283 figure.pdf | |
| 284 | Heatmap | |
| 285 | | |
| 286 | |
| 287 information.txt | |
| 288 | File with all messages and warnings generated during the computation | |
| 289 | | |
| 290 | |
| 291 --------------------------------------------------- | |
| 292 | |
| 293 --------------- | |
| 294 Working example | |
| 295 --------------- | |
| 296 | |
| 297 .. class:: infomark | |
| 298 | |
| 299 See the **W4M00001a_sacurine-subset-statistics** shared history in the **Shared Data/Published Histories** menu (https://galaxy.workflow4metabolomics.org/history/list_published) | |
| 300 | |
| 301 --------------------------------------------------- | |
| 302 | |
| 303 ---- | |
| 304 NEWS | |
| 305 ---- | |
| 306 | |
| 307 CHANGES IN VERSION 2.2.2 | |
| 308 ======================== | |
| 309 | |
| 310 INTERNAL MODIFICATIONS | |
| 311 | |
| 312 Minor internal modifications | |
| 313 | |
| 314 CHANGES IN VERSION 2.2.0 | |
| 315 ======================== | |
| 316 | |
| 317 NEW FEATURES | |
| 318 | |
| 319 Default method for the correlation coefficient is now 'pearson', instead of 'spearman' previously (the latter can still be selected in the advanced parameters) | |
| 320 | |
| 321 The 1-abs(correlation) dissimilarity is now available (in addition to the default '1-correlation') in case the sign of correlations between samples and between variables does not matter, as well as the euclidean, maximum, manhattan, canberra, binary, and minkowski dissimilarities | |
| 322 | |
| 323 A new red-green color scale is available | |
| 324 | |
| 325 | |
| 326 CHANGES IN VERSION 2.1.2 | |
| 327 ======================== | |
| 328 | |
| 329 INTERNAL MODIFICATIONS | |
| 330 | |
| 331 Creating additional files for planemo and travis running and installation validation | |
| 332 | |
| 333 CHANGES IN VERSION 2.1.1 | |
| 334 ======================== | |
| 335 | |
| 336 INTERNAL MODIFICATIONS | |
| 337 | |
| 338 Internal replacement of the as.hclust function which happened to produce error messages | |
| 339 | |
| 340 </help> | |
| 341 | |
| 342 <citations> | |
| 343 <citation type="bibtex">@Manual{, | |
| 344 title = {R: A Language and Environment for Statistical Computing}, | |
| 345 author = {{R Core Team}}, | |
| 346 organization = {R Foundation for Statistical Computing}, | |
| 347 address = {Vienna, Austria}, | |
| 348 year = {2016}, | |
| 349 url = {https://www.R-project.org/}, | |
| 350 }</citation> | |
| 351 <citation type="bibtex">@Article{Thevenot2015, | |
| 352 Title = {Analysis of the human adult urinary metabolome variations with age, body mass index and gender by implementing a comprehensive workflow for univariate and OPLS statistical analyses}, | |
| 353 Author = {Thevenot, Etienne A. and Roux, Aurelie and Xu, Ying and Ezan, Eric and Junot, Christophe}, | |
| 354 Journal = {Journal of Proteome Research}, | |
| 355 Year = {2015}, | |
| 356 Note = {PMID: 26088811}, | |
| 357 Number = {8}, | |
| 358 Pages = {3322-3335}, | |
| 359 Volume = {14}, | |
| 360 | |
| 361 Doi = {10.1021/acs.jproteome.5b00354}, | |
| 362 Url = {http://pubs.acs.org/doi/full/10.1021/acs.jproteome.5b00354} | |
| 363 }</citation> | |
| 364 <citation type="doi">10.1093/bioinformatics/btu813</citation> | |
| 365 </citations> | |
| 366 | |
| 367 </tool> |
