annotate blat_wrapper.xml @ 2:df0c23b49a81 draft default tip

Readme updated
author Joachim Jacob <joachim.jacob@gmail.com>
date Wed, 24 Jul 2013 16:35:36 +0200
parents da4426cac227
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
1 <tool id="blat" name="Align sequences with BLAT" version="1.0.1">
0
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
2 <!-- Additional info: wrapper compatible with versions ..... -->
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
3 <description>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
4 to a reference genome
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
5 </description>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
6
1
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
7 <version_command>
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
8 </version_command>
0
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
9
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
10 <requirements>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
11 <requirement type="package" version="1.0.0">blat</requirement>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
12 </requirements>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
13
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
14 <command interpreter="perl">
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
15 blat_wrapper.pl $configfile
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
16 </command>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
17
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
18 <inputs>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
19 <param format="fasta" name="input" type="data" label="Query fasta sequences" />
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
20 <param name="q" type="select" label="Process the query as">
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
21 <option value="dna" selected="True">DNA</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
22 <option value="rna">RNA</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
23 <option value="prot">Protein</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
24 <option value="dnax">DNA sequence translated in six frames to protein</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
25 <option value="rnax">RNA sequence translated in six frames to protein</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
26 </param>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
27 <conditional name="refGenomeSource">
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
28 <param name="genomeSource" type="select" label="Will you select a sequence database from your history or use a built-in index?" help="Built-ins were indexed using default options">
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
29 <option value="indexed">Use a built-in index</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
30 <option value="history" selected="True">Use one from the history</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
31 </param>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
32 <when value="indexed">
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
33 <param name="index" type="select" label="Select a reference genome" help="If your genome of interest is not listed, contact the Galaxy team">
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
34 <options from_data_table="twobit.loc">
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
35 <filter type="sort_by" column="1"/>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
36 <validator type="no_options" message="No indexes are available for the selected input dataset"/>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
37 </options>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
38 </param> <!-- index: closed here so that "range" is a sibling parameter, reachable as $refGenomeSource.range -->
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
39 <param name="range" type="text" size="25" value="" label="Restrict the search space to this genomic range in the sequence database" help="Format = 'chr1:250000-260000' (i.e. name:startposition-endposition)" />
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
40
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
41 </when>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
42 <when value="history">
1
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
43 <param name="ownFile" type="data" format="fasta" metadata_nameloc="dbkey" label="Select the sequence database" />
0
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
44 </when> <!-- history -->
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
45 </conditional> <!-- refGenomeSource -->
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
46
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
47 <param name="t" type="select" label="Process the sequence database as">
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
48 <option value="dna" selected="True">DNA</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
49 <option value="prot">Protein</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
50 <option value="dnax">DNA sequence translated in six frames to protein</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
51 </param>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
52
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
53 <conditional name="advanced_params">
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
54 <param name="use" type="select" label="Show advanced parameters">
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
55 <option value="no" selected="True">No</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
56 <option value="yes">Yes</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
57 </param>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
58 <when value="no" />
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
59 <when value="yes" >
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
60 <param name="tileSize" type="text" size="3" value="11" label="size of match that triggers an alignment" help="Usually between 8 and 12. Default is 11 for DNA and 5 for protein." />
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
61 <param name="stepSize" type="text" size="3" value="11" label="spacing between tiles" />
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
62 <param name="oneOff" type="boolean" truevalue="1" falsevalue="0" checked="False" label="Allowing one mismatch in tile?" />
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
63 <param name="minMatch" type="select" label="number of tile matches" >
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
64 <option value="1">1 (for proteins)</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
65 <option value="2" selected="True">2</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
66 <option value="3">3</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
67 <option value="4">4</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
68 </param>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
69 <param name="minScore" type="text" size="3" value="30" label="minimum score" help="This is the matches minus the mismatches minus some sort of gap penalty. Default is 30" />
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
70 <param name="maxGap" type="select" label="size of maximum gap between tiles in a clump" help="Usually set from 0 to 3. Default is 2. Only relevant for minMatch &gt; 1">
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
71 <option value="0">0</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
72 <option value="1">1</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
73 <option value="2" selected="True">2</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
74 <option value="3">3</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
75 </param>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
76 <param name="mask" type="select" label="Mask out repeats in reference sequence" help="Alignments won't be started in masked region but may extend through it in nucleotide searches. Masked areas are ignored entirely in protein or translated searches.">
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
77 <option value="lower">mask out lower cased sequence</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
78 <option value="upper">mask out upper cased sequence</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
79 </param>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
80 <param name="qMask" type="select" label="Mask out repeats in query sequence" help="Alignments won't be started in masked region but may extend through it in nucleotide searches. Masked areas are ignored entirely in protein or translated searches.">
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
81 <option value="lower">mask out lower cased sequence</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
82 <option value="upper">mask out upper cased sequence</option>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
83 </param>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
84 <param name="repeats" type="boolean" truevalue="yes" falsevalue="no" checked="False" label="Report matches in repeats separately?" />
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
85 <param name="trimT" type="boolean" truevalue="yes" falsevalue="no" checked="False" label="Trim leading poly-T" />
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
86 <param name="noTrimA" type="boolean" truevalue="no" falsevalue="yes" checked="True" label="Trim trailing poly-A" />
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
87 <param name="fine" type="boolean" truevalue="yes" falsevalue="no" checked="False" label="For high quality mRNAs look harder for small initial and terminal exons. Not recommended for ESTs" />
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
88 <param name="maxIntron" type="text" size="10" value="750000" label="Maximum intron size" />
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
89 <param name="extendThroughN" type="boolean" truevalue="yes" falsevalue="no" checked="False" label="Extend alignment through large blocks of N's? Not recommended for ESTs" />
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
90 </when>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
91 </conditional>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
92 </inputs>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
93
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
94 <outputs>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
95 <data format="tabular" name="output" label="${tool.name} on ${on_string}: alignments"/>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
96 </outputs>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
97
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
98 <configfiles>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
99 <!-- this config file collects all parameter settings -->
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
100 <configfile name="configfile">
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
101 ## first we pass some galaxy environment variables
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
102 galtemp==${__new_file_path__}
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
103
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
104 #if $refGenomeSource.genomeSource == "indexed"
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
105 referencepath==${refGenomeSource.index.fields.path}
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
106 range==$refGenomeSource.range
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
107 #else
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
108 referencepath==${refGenomeSource.ownFile}
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
109 #end if
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
110
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
111 input==$input
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
112 output==$output
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
113 q==$q
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
114 t==$t
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
115
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
116 advanced_params.use==$advanced_params.use
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
117 #if $advanced_params.use=="yes"
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
118 tileSize==$advanced_params.tileSize
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
119 stepSize==$advanced_params.stepSize
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
120 oneOff==$advanced_params.oneOff
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
121 minMatch==$advanced_params.minMatch
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
122 minScore==$advanced_params.minScore
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
123 maxGap==$advanced_params.maxGap
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
124 mask==$advanced_params.mask
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
125 qMask==$advanced_params.qMask
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
126 repeats==$advanced_params.repeats
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
127 trimT==$advanced_params.trimT
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
128 noTrimA==$advanced_params.noTrimA
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
129 fine==$advanced_params.fine
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
130 maxIntron==$advanced_params.maxIntron
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
131 extendThroughN==$advanced_params.extendThroughN
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
132 #end if
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
133
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
134 </configfile>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
135 </configfiles>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
136
1
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
137 <tests>
0
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
138 <test>
1
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
139 <param name="input" value="input83.fas" ftype="fasta" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
140 <param name="q" value="dna" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
141 <param name="genomeSource" value="history" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
142 <param name="ownFile" value="blatdatabase1.fas" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
143 <param name="t" value="dna" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
144 <param name="use" value="yes" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
145 <param name="tileSize" value="11" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
146 <param name="stepSize" value="11" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
147 <param name="oneOff" value="0" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
148 <param name="tileSize" value="11" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
149 <param name="minMatch" value="2" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
150 <param name="minScore" value="30" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
151 <param name="maxGap" value="2" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
152 <param name="mask" value="lower" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
153 <param name="qMask" value="lower" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
154 <param name="repeats" value="no" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
155 <param name="trimT" value="yes" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
156 <param name="noTrimA" value="no" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
157 <param name="fine" value="no" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
158 <param name="maxIntron" value="750000" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
159 <param name="extendThroughN" value="no" />
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
160 <output name="output" file="blatoutput1.txt" ftype="tabular" lines_diff="2"/>
da4426cac227 Fixed tests
Joachim Jacob <joachim.jacob@gmail.com>
parents: 0
diff changeset
161 </test>
0
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
162 </tests>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
163
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
164 <help>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
165 **BLAT Overview**
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
166
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
167 BLAT_ is an alignment tool like BLAST, but it is structured differently.
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
168 On DNA, Blat works by keeping an index of an entire genome in memory.
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
169 Thus, the target database of BLAT is not a set of GenBank sequences, but
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
170 instead an index derived from the assembly of the entire genome. By
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
171 default, the index consists of all non-overlapping 11-mers except for
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
172 those heavily involved in repeats.
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
173
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
174 .. _BLAT: http://genome.ucsc.edu/FAQ/FAQblat.html
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
175
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
176 </help>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
177 </tool>
3cec538aab33 Uploaded
joachim-jacob
parents:
diff changeset
178