Mercurial > repos > artbio > pathifier
comparison pathifier.xml @ 0:dd01ae279778 draft default tip
"planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/pathifier commit b94cfc7bf8df30aa8e9249b75ea31332ee2bada1"
| author | artbio |
|---|---|
| date | Mon, 12 Apr 2021 09:54:52 +0000 |
| parents | |
| children |
comparison
equal
deleted
inserted
replaced
| -1:000000000000 | 0:dd01ae279778 |
|---|---|
| 1 <tool id="pathifier" name="Pathifier" version="1.0.1"> | |
| 2 <description>: Quantify deregulation of pathways in cancer</description> | |
| 3 <requirements> | |
| 4 <requirement type="package" version="1.6.2=r35h6115d3f_0">r-optparse</requirement> | |
| 5 <requirement type="package" version="1.22.0=r351_0">bioconductor-pathifier</requirement> | |
| 6 <requirement type="package" version="1.0.12=r351h6115d3f_0">r-pheatmap</requirement> | |
| 7 <requirement type="package" version="0.3_41=r351h6115d3f_0">r-scatterplot3d</requirement> | |
| 8 <requirement type="package" version="0.4.7=r35h6115d3f_0">r-circlize</requirement> | |
| 9 </requirements> | |
| 10 <stdio> | |
| 11 <exit_code range="1:" level="fatal" description="Tool exception" /> | |
| 12 </stdio> | |
| 13 <command detect_errors="exit_code"><![CDATA[ | |
| 14 Rscript $__tool_directory__/pathifier.R | |
| 15 --exp '$input' | |
| 16 --sep '$input_sep' | |
| 17 --genes '$genes' | |
| 18 | |
| 19 #if $reference.is_normal == "Yes": | |
| 20 --is_normal 'TRUE' | |
| 21 --normals '$reference.normals' | |
| 22 #end if | |
| 23 | |
| 24 --max_stability '$max_stability' | |
| 25 --attempts '$attempts' | |
| 26 --min_std '$min_std' | |
| 27 --min_exp '$min_exp' | |
| 28 | |
| 29 --heatmap_cluster_cells '$heatmap_cluster_cells' | |
| 30 --heatmap_cluster_pathways '$heatmap_cluster_pathways' | |
| 31 --heatmap_show_cell_labels '$heatmap_show_cell_labels' | |
| 32 --heatmap_show_pathway_labels '$heatmap_show_pathway_labels' | |
| 33 | |
| 34 --pds '$pds' | |
| 35 --logfile '$logfile' | |
| 36 --plot '$plot' | |
| 37 --rdata '$rdatafile' | |
| 38 | |
| 39 ]]></command> | |
| 40 <inputs> | |
| 41 <param name="input" type="data" format="txt,tabular" label="expression data"/> | |
| 42 <param name="input_sep" type="select" label="Input column separator"> | |
| 43 <option value="tab" selected="true">Tabs</option> | |
| 44 <option value=",">Comma</option> | |
| 45 </param> | |
| 46 <param name="genes" type="data" format="txt" label="Gene sets Pathways" | |
| 47 help="Must be in gmt format (one pathway per line : Name, description, genes (one by column), tab separated)" /> | |
| 48 <conditional name="reference"> | |
| 49 <param name="is_normal" label="Do you have non cancer transcriptomes in your data set ?" type="boolean" truevalue="Yes" falsevalue="" checked="false" | |
| 50 help="If set the starting curve depends on the matrix of points with in a certain row order (first 'normal' then 'cancer' samples), otherwise the first principal component is used. See help for more informations"/> | |
| 51 <when value="Yes"> | |
| 52 <param name="normals" type="data" format="tabular" label="Sample status" | |
| 53 help="A two-column data frame, first column contains data labels, second column the levels of sample status : 1 = Healthy, 0 = Tumor (no header)" /> | |
| 54 </when> | |
| 55 <when value=""> | |
| 56 </when> | |
| 57 </conditional> | |
| 58 <param name="max_stability" label="Throw away components leading to low stability of sampling noise" type="boolean" truevalue="TRUE" | |
| 59 falsevalue="FALSE" checked="true" /> | |
| 60 <param name="attempts" type="integer" label="Number of runs to determine stability" value="100"/> | |
| 61 <param name="min_std" type="text" value="0.4" label="Minimum of standard deviation to filter out low variable genes" | |
| 62 help="Use 'data' to use the minimum standard deviation of your data" /> | |
| 63 <param name="min_exp" type="text" value="4" label="Minimum of gene expression to filter out low variable genes" | |
| 64 help="Use 'data' to use the minimum expression of your data" /> | |
| 65 <param name="heatmap_cluster_cells" label="Cluster samples on heatmap" type="boolean" truevalue="TRUE" falsevalue="FALSE" checked="true" /> | |
| 66 <param name="heatmap_cluster_pathways" label="Cluster pathways on heatmap" type="boolean" truevalue="TRUE" falsevalue="FALSE" checked="true" /> | |
| 67 <param name="heatmap_show_cell_labels" label="Show sample labels on heatmap" type="boolean" truevalue="TRUE" falsevalue="FALSE" checked="false" /> | |
| 68 <param name="heatmap_show_pathway_labels" label="Cluster pathway labels on heatmap" type="boolean" truevalue="TRUE" falsevalue="FALSE" checked="true" /> | |
| 69 <param label="Return log file of pathifier" name="log" type="select" > | |
| 70 <option value="no" selected="True">No</option> | |
| 71 <option value="yes">Yes</option> | |
| 72 </param> | |
| 73 <param label="Return Pathifier S4 object" name="rdata" type="select" > | |
| 74 <option value="no" selected="True">No</option> | |
| 75 <option value="yes">Yes</option> | |
| 76 </param> | |
| 77 | |
| 78 </inputs> | |
| 79 <outputs> | |
| 80 <data name="pds" format="tabular" label="Pathifier Deregulation Score (PDS) of ${on_string}" /> | |
| 81 <data name="logfile" format="txt" label="Pathifier log file of ${on_string}" > | |
| 82 <filter>log == 'yes'</filter> | |
| 83 </data> | |
| 84 <data name="plot" format="pdf" label="Pathifier vizualization of ${on_string}" /> | |
| 85 <data name="rdatafile" format="rdata" label="Pathifier S4 object of ${on_string}" > | |
| 86 <filter>rds == 'yes'</filter> | |
| 87 </data> | |
| 88 </outputs> | |
| 89 <tests> | |
| 90 <test> | |
| 91 <param name="input" value="sheffer.tsv" ftype="tabular"/> | |
| 92 <param name="genes" value="kegg_pathways.gmt" ftype="txt" /> | |
| 93 <param name="is_normal" value="True" /> | |
| 94 <param name="normals" value="normals.tsv" ftype="tabular" /> | |
| 95 <param name="log" value="yes" /> | |
| 96 <param name="attempts" value="100" /> | |
| 97 <output name="logfile" file="sheffer.kegg.log" ftype="txt" compare="sim_size" /> | |
| 98 <output name="pds" file="sheffer.kegg.tsv" ftype="tabular"/> | |
| 99 <output name="plot" file="plot.pdf" ftype="pdf" compare="sim_size" /> | |
| 100 </test> | |
| 101 <test> | |
| 102 <param name="input" value="sheffer_noref.tsv" ftype="tabular"/> | |
| 103 <param name="genes" value="kegg_pathways.gmt" ftype="txt" /> | |
| 104 <param name="is_normal" value="" /> | |
| 105 <param name="log" value="no" /> | |
| 106 <param name="rdata" value="yes" /> | |
| 107 <param name="attempts" value="50" /> | |
| 108 <param name="min_exp" value="data" /> | |
| 109 <param name="min_std" value="data" /> | |
| 110 <output name="pds" file="sheffer.kegg_noref.tsv" ftype="tabular"/> | |
| 111 <output name="rdatafile" file="sheffer.kegg_noref.rdata" ftype="rdata" compare="sim_size" /> | |
| 112 <output name="plot" file="plot_noref.pdf" ftype="pdf" compare="sim_size" /> | |
| 113 </test> | |
| 114 </tests> | |
| 115 <help> | |
| 116 | |
| 117 **What it does** | |
| 118 | |
| 119 Pathifier is an algorithm that infers pathway deregulation scores for each (tumor) sample on the basis | |
| 120 of expression data. This score is determined, in a context-specific manner, for every particular dataset | |
| 121 and type of cancer that is being investigated. The algorithm transforms gene-level information into | |
| 122 pathway-level information, generating a compact and biologically relevant representation of each sample. | |
| 123 | |
| 124 For each pathway analysed, the transcriptome datasets are plotted in the gene pathway space using a | |
| 125 Principal Component analysis (PCA) and a principal curve is regressed from these points. All transcriptomes | |
| 126 are projected on the nearest point of this curve. Pathifier finally computes a score which corresponds to | |
| 127 the distance (normalized to 1) of each point (transcriptome) to the curve origin. | |
| 128 | |
| 129 **Inputs** | |
| 130 | |
| 131 * a matrix of n columns of observations (generally RNAseq experiments) and k rows of variables (generally k genes). | |
| 132 * a Gene Matrix Transposed file (GMT format) where each row represents a gene set : | |
| 133 * first column : gene set name (pathway name) | |
| 134 * second : description of gene set | |
| 135 * third and + : list of genes that composed the gene set tab-separated | |
| 136 * (Optional) a two column table with no header, to described transcriptome status (Tumor or not) : | |
| 137 * first column : sample labels | |
| 138 * second : levels of sample status : 1 = Healthy, 0 = Tumor | |
| 139 | |
| 140 **Outputs** | |
| 141 | |
| 142 * Table of Pathway Deregulation Scores : one by pathway (column) and by transcriptome (row) | |
| 143 * Visualization of PDS (pdf) : | |
| 144 * Principal curve of different PDS | |
| 145 * Heatmap of PDS that allows (through clustering) to see pattern in pathway deregulation | |
| 146 * (Optional) Log file of Pathifier algorithm | |
| 147 * (Optional) Pathifier S4 object which contains all informations and results generated by Pathifier, for each pathway : | |
| 148 * `scores` : PDS scores | |
| 149 * `genesinpathway` : Gene identifiers in each pathway | |
| 150 * `newmeanstd` | |
| 151 * `origmeanstd` | |
| 152 * `pathwaysize` : Number of genes retained in pathway | |
| 153 * `curves` : Coordinates of transcriptomes projected on the principal curve | |
| 154 * `curves_order` : Order of transcriptomes along the principal curve | |
| 155 * `z` : z-scores matrix | |
| 156 * `compin` | |
| 157 * `xm` | |
| 158 * `xs` | |
| 159 * `center` | |
| 160 * `rot` | |
| 161 * `pctaken` : Number of principal component retained for pathifier analysis | |
| 162 * `samplings` | |
| 163 * `sucess` : List of pathway index that passed Pathfiier filters (more info in log file) | |
| 164 * `logfile` : Name of logfile | |
| 165 | |
| 166 </help> | |
| 167 <citations> | |
| 168 <citation type="bibtex">@Manual{, | |
| 169 title = {{pathifier}: Quantify deregulation of pathways in cancer}, | |
| 170 author = {Yotam Drier}, | |
| 171 year = {2013-06-27}, | |
| 172 note = {R package version 1.22.0}, | |
| 173 url = {https://git.bioconductor.org/packages/pathifier}, | |
| 174 } | |
| 175 </citation> | |
| 176 <citation type="bibtex">@article {Drier6388, | |
| 177 author = {Drier, Yotam and Sheffer, Michal and Domany, Eytan}, | |
| 178 title = {Pathway-based personalized analysis of cancer}, | |
| 179 volume = {110}, | |
| 180 number = {16}, | |
| 181 pages = {6388--6393}, | |
| 182 year = {2013}, | |
| 183 doi = {10.1073/pnas.1219651110}, | |
| 184 publisher = {National Academy of Sciences}, | |
| 185 issn = {0027-8424}, | |
| 186 URL = {https://www.pnas.org/content/110/16/6388}, | |
| 187 eprint = {https://www.pnas.org/content/110/16/6388.full.pdf}, | |
| 188 journal = {Proceedings of the National Academy of Sciences} | |
| 189 } | |
| 190 </citation> | |
| 191 </citations> | |
| 192 </tool> |
