annotate subtract_query.xml @ 0:980bf1f6f37b draft default tip

Uploaded
author slegras
date Mon, 27 Jul 2015 08:14:06 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
1 <tool id="subtract_query1" name="Subtract Whole Dataset" version="0.1">
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
2 <description>from another dataset</description>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
3 <command interpreter="python">
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
4 subtract_query.py $input1 $input2 $begin_col $end_col $output
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
5 #if str($ignore_empty_end_cols) == 'true':
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
6 --ignore-empty-end-cols
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
7 #end if
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
8
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
9 </command>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
10 <inputs>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
11 <param format="txt" name="input2" type="data" label="Subtract" help="Second dataset" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
12 <param format="txt" name="input1" type="data" label="from" help="First dataset" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
13 <param name="begin_col" type="data_column" data_ref="input1" force_select="False" label="Restrict subtraction between 'begin column'" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
14 <param name="end_col" type="data_column" data_ref="input1" force_select="False" label="and 'end column'" help="Specifying columns for restricting subtraction is available only for tabular formatted datasets" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
15 <param name="ignore_empty_end_cols" type="boolean" label="Ignore empty columns and whitespace at end of line when subtracting"/>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
16 </inputs>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
17 <outputs>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
18 <data format="input" name="output" metadata_source="input1" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
19 </outputs>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
20 <tests>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
21 <!-- Subtract 2 non-tabular files with no column restrictions. -->
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
22 <!-- Cannot figure out why this test won't pass, it works in real time...
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
23 <test>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
24 <param name="input1" value="1.txt" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
25 <param name="input2" value="2.txt" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
26 <param name="begin_col" value="None" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
27 <param name="end_col" value="None" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
28 <output name="output" file="subtract-query-1.dat" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
29 </test>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
30 -->
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
31 <!-- Subtract 2 tabular files with no column restrictions. -->
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
32 <test>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
33 <param name="input1" value="eq-showbeginning.dat" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
34 <param name="input2" value="eq-showtail.dat" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
35 <param name="begin_col" value="None" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
36 <param name="end_col" value="None" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
37 <output name="output" file="subtract-query-2.dat" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
38 </test>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
39 <!-- Subtract 2 tabular files with column restrictions. -->
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
40 <test>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
41 <param name="input1" value="eq-showbeginning.dat" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
42 <param name="input2" value="eq-removebeginning.dat" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
43 <param name="begin_col" value="c1" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
44 <param name="end_col" value="c3" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
45 <output name="output" file="subtract-query-3.dat" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
46 </test>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
47 <!-- Subtract a non-tabular file from a tabular file with no column restrictions. -->
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
48 <test>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
49 <param name="input1" value="eq-showbeginning.dat" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
50 <param name="input2" value="2.txt" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
51 <param name="begin_col" value="None" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
52 <param name="end_col" value="None" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
53 <output name="output" file="subtract-query-4.dat" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
54 </test>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
55 <!-- Subtract 2 tabular files with no column restrictions, ignoring empty end columns. -->
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
56 <test>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
57 <param name="input1" value="eq-showbeginning_e.dat" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
58 <param name="input2" value="eq-showtail.dat" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
59 <param name="begin_col" value="None" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
60 <param name="end_col" value="None" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
61 <param name="ignore_empty_end_cols" value="true" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
62 <output name="output" file="subtract-query-2.dat" />
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
63 </test>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
64 </tests>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
65 <help>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
66
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
67 .. class:: infomark
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
68
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
69 **TIP:** This tool complements the tool in the **Operate on Genomic Intervals** tool set which subtracts the intervals of two datasets.
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
70
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
71
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
72 -----
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
73
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
74 **Syntax**
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
75
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
76 This tool subtracts an entire dataset from another dataset.
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
77
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
78 - Any text format is valid.
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
79 - If both dataset formats are tabular, you may restrict the subtraction to specific columns **contained in both datasets** and the resulting dataset will include only the columns specified.
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
80 - The begin column must be less than or equal to the end column. If it is not, begin column is switched with end column.
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
81 - If begin column is specified but end column is not, end column will default to begin column (and vice versa).
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
82 - All blank and comment lines are skipped and not included in the resulting dataset (comment lines are lines beginning with a # character).
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
83 - Duplicate lines are eliminated from both datasets prior to subtraction. If any duplicate lines were eliminated from the first dataset, the number is displayed in the resulting history item.
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
84
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
85 -----
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
86
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
87 **Example**
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
88
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
89 If this is the **First dataset**::
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
90
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
91 chr1 4225 19670
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
92 chr10 6 8
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
93 chr1 24417 24420
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
94 chr6_hla_hap2 0 150
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
95 chr2 1 5
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
96 chr10 2 10
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
97 chr1 30 55
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
98 chrY 1 20
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
99 chr1 1225979 42287290
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
100 chr10 7 8
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
101
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
102 and this is the **Second dataset**::
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
103
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
104 chr1 4225 19670
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
105 chr10 6 8
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
106 chr1 24417 24420
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
107 chr6_hla_hap2 0 150
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
108 chr2 1 5
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
109 chr1 30 55
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
110 chrY 1 20
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
111 chr1 1225979 42287290
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
112
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
113 Subtracting the **Second dataset** from the **First dataset** (including all columns) will yield::
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
114
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
115 chr10 7 8
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
116 chr10 2 10
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
117
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
118 Conversely, subtracting the **First dataset** from the **Second dataset** (including all columns) will result in an empty dataset.
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
119
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
120 Subtracting the **Second dataset** from the **First dataset** (restricting to columns c1 and c2) will yield::
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
121
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
122 chr10 7
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
123 chr10 2
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
124
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
125 </help>
980bf1f6f37b Uploaded
slegras
parents:
diff changeset
126 </tool>