annotate mergeMutationDatasets.xml @ 55:1093078e7976

merge mutation data conform to new mutationVector data standard
author jingchunzhu
date Fri, 18 Sep 2015 10:24:39 -0700
parents bb8963939d6f
children 2a240b005731
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
41
jingchunzhu
parents: 21
diff changeset
1 <tool id="mergeMutationDatasets" description="Merge two Xena positional mutation datasets into a new dataset" name="Merge Xena Mutation by Position Data" version="0.0.1">
19
371579dd9bc6 Uploaded
melissacline
parents:
diff changeset
2 <command interpreter="python">
371579dd9bc6 Uploaded
melissacline
parents:
diff changeset
3 mergeXenaMutation.py $outputC $outputSourceMatrix $errorLog $inputA $inputB
371579dd9bc6 Uploaded
melissacline
parents:
diff changeset
4 #if $labelForDatasetA
371579dd9bc6 Uploaded
melissacline
parents:
diff changeset
5 --aLabel "${labelForDatasetA}"
41
jingchunzhu
parents: 21
diff changeset
6 #else
jingchunzhu
parents: 21
diff changeset
7 --aLabel "${inputA.name}"
19
371579dd9bc6 Uploaded
melissacline
parents:
diff changeset
8 #end if
371579dd9bc6 Uploaded
melissacline
parents:
diff changeset
9 #if $labelForDatasetB
371579dd9bc6 Uploaded
melissacline
parents:
diff changeset
10 --bLabel "${labelForDatasetB}"
41
jingchunzhu
parents: 21
diff changeset
11 #else
jingchunzhu
parents: 21
diff changeset
12 --bLabel "${inputB.name}"
19
371579dd9bc6 Uploaded
melissacline
parents:
diff changeset
13 #end if
371579dd9bc6 Uploaded
melissacline
parents:
diff changeset
14 </command>
371579dd9bc6 Uploaded
melissacline
parents:
diff changeset
15 <inputs>
41
jingchunzhu
parents: 21
diff changeset
16 <param name="inputA" format="tabular" type="data" label="Xena Mutation by Position Dataset A"/>
43
eb5acf81e609 improve messages
jingchunzhu
parents: 42
diff changeset
17 <param type="text" name="labelForDatasetA" label="Dataset A Label (eg. LGG)" value="A"/>
41
jingchunzhu
parents: 21
diff changeset
18 <param name="inputB" format="tabular" type="data" label="Xena Mutation by Position Dataset B"/>
43
eb5acf81e609 improve messages
jingchunzhu
parents: 42
diff changeset
19 <param type="text" name="labelForDatasetB" label="Dataset B Label (eg. GBM)" value="B"/>
19
371579dd9bc6 Uploaded
melissacline
parents:
diff changeset
20 </inputs>
371579dd9bc6 Uploaded
melissacline
parents:
diff changeset
21 <outputs>
44
jingchunzhu
parents: 43
diff changeset
22 <data name="errorLog" format="data" label="Execution Log" hidden="True" />
42
jingchunzhu
parents: 41
diff changeset
23 <data name="outputSourceMatrix" format="tabular" label="Data Source ${labelForDatasetA}+${labelForDatasetB}"/>
jingchunzhu
parents: 41
diff changeset
24 <data name="outputC" format="tabular" label="Mutation by Position ${labelForDatasetA}+${labelForDatasetB}"/>
19
371579dd9bc6 Uploaded
melissacline
parents:
diff changeset
25 </outputs>
371579dd9bc6 Uploaded
melissacline
parents:
diff changeset
26 <help>
21
3a259686f0fc Merged with head, tweaked labels on merge mutation data tool
melissacline
parents: 20
diff changeset
27 **Merge Xena Positional Mutation Datasets**
19
371579dd9bc6 Uploaded
melissacline
parents:
diff changeset
28
43
eb5acf81e609 improve messages
jingchunzhu
parents: 42
diff changeset
29 The output Mutation by Position data file is ready to be imported into a Xena Hub.
eb5acf81e609 improve messages
jingchunzhu
parents: 42
diff changeset
30
eb5acf81e609 improve messages
jingchunzhu
parents: 42
diff changeset
31 The output Data Source file is formatted as rows (samples) by columns (identifiers) and is ready to be imported into a Xena Hub.
eb5acf81e609 improve messages
jingchunzhu
parents: 42
diff changeset
32
19
371579dd9bc6 Uploaded
melissacline
parents:
diff changeset
33 Given two datasets of mutation data as formatted for the UCSC Xena Browser, merge them to produce a third dataset that is the union of the first two. The new dataset will contain all mutations from either dataset.
371579dd9bc6 Uploaded
melissacline
parents:
diff changeset
34
371579dd9bc6 Uploaded
melissacline
parents:
diff changeset
35 To maintain provenance, this script also outputs a second matrix, with one row for each sample ID that appears in the output dataset, and two columns per row indicating which input dataset(s) contained some mutation data for that sample. The label entered for each dataset (the form defaults are "A" and "B") is used to indicate which input file each column came from; if a label is left blank, the input dataset name is used instead. </help>
371579dd9bc6 Uploaded
melissacline
parents:
diff changeset
36 </tool>