|
1
|
1 <tool id="blat" name="Align sequences with BLAT" version="1.0.1">
|
|
0
|
2 <!-- Additional info: wrapper compatible with versions ..... -->
|
|
|
<!-- Short description of what the tool aligns against. -->
<description>to a reference genome</description>

<!-- Intentionally left empty in this wrapper: no version-reporting command is defined. -->
<version_command>
</version_command>

<!-- Declares the blat package (version 1.0.0) as the tool's dependency. -->
<requirements>
    <requirement type="package" version="1.0.0">blat</requirement>
</requirements>

<!-- The Perl wrapper is called with a single argument: the generated config file. -->
<command interpreter="perl">
    blat_wrapper.pl $configfile
</command>
|
|
|
17
|
|
|
18 <inputs>
|
|
|
<!-- Query sequences (FASTA dataset) that will be aligned. -->
<param name="input"
       type="data"
       format="fasta"
       label="Query fasta sequences"/>

<!-- How the query sequences are interpreted; written to the config file as "q". -->
<param name="q"
       type="select"
       label="Process the query as">
    <option value="dna" selected="True">DNA</option>
    <option value="rna">RNA</option>
    <option value="prot">Protein</option>
    <option value="dnax">DNA sequence translated in six frames to protein</option>
    <option value="rnax">RNA sequence translated in six frames to protein</option>
</param>
|
|
|
<!-- Selects the sequence database: either a built-in index taken from a data
     table, or a FASTA dataset from the user's history. -->
<conditional name="refGenomeSource">
    <param name="genomeSource" type="select" label="Will you select a sequence database from your history or use a built-in index?" help="Built-ins were indexed using default options">
        <option value="indexed">Use a built-in index</option>
        <option value="history" selected="True">Use one from the history</option>
    </param>
    <when value="indexed">
        <param name="index" type="select" label="Select a reference genome" help="If your genome of interest is not listed, contact the Galaxy team">
            <options from_data_table="twobit.loc">
                <filter type="sort_by" column="1"/>
                <validator type="no_options" message="No indexes are available for the selected input dataset"/>
            </options>
        </param>
        <!-- "range" must be a sibling of "index", not a child of it: a <param>
             nested inside another <param> is not a parameter of this branch,
             and the config file reads it as $refGenomeSource.range. -->
        <param name="range" type="text" size="25" value="" label="Restrict the search space to this genomic range in the sequence database" help="Format = 'chr1:250000-260000' (i.e. name:startposition-endposition)" />
    </when>
    <when value="history">
        <param name="ownFile" type="data" format="fasta" metadata_nameloc="dbkey" label="Select the sequence database" />
    </when> <!-- history -->
</conditional> <!-- refGenomeSource -->
|
|
|
46
|
|
|
<!-- How the sequence database is interpreted; written to the config file as "t". -->
<param name="t"
       type="select"
       label="Process the sequence database as">
    <option value="dna" selected="True">DNA</option>
    <option value="prot">Protein</option>
    <option value="dnax">DNA sequence translated in six frames to protein</option>
</param>
|
|
|
52
|
|
|
<!-- Optional tuning parameters. They are only shown, and only written to the
     config file, when "use" is set to "yes". -->
<conditional name="advanced_params">
    <param name="use" type="select" label="Show advanced parameters">
        <option value="no" selected="True">No</option>
        <option value="yes">Yes</option>
    </param>
    <when value="no" />
    <when value="yes" >
        <!-- Tile (seed) settings -->
        <param name="tileSize" type="text" size="3" value="11" label="size of match that triggers an alignment" help="Usually between 8 and 12. Default is 11 for DNA and 5 for protein." />
        <param name="stepSize" type="text" size="3" value="11" label="spacing between tiles" />
        <param name="oneOff" type="boolean" truevalue="1" falsevalue="0" checked="False" label="Allowing one mismatch in tile?" />
        <param name="minMatch" type="select" label="number of tile matches" >
            <option value="1">1 (for proteins)</option>
            <option value="2" selected="True">2</option>
            <option value="3">3</option>
            <option value="4">4</option>
        </param>
        <param name="minScore" type="text" size="3" value="30" label="minimum score" help="This is the matches minus the mismatches minus some sort of gap penalty. Default is 30" />
        <param name="maxGap" type="select" label="size of maximum gap between tiles in a clump" help=" Usually set from 0 to 3. Default is 2. Only relevant for minMatch > 1">
            <option value="0">0</option>
            <option value="1">1</option>
            <option value="2" selected="True">2</option>
            <option value="3">3</option>
        </param>

        <!-- Repeat masking. Neither select offers a "no masking" choice, so
             enabling the advanced section always passes a mask value. -->
        <param name="mask" type="select" label="Mask out repeats in reference sequence" help="Alignments won't be started in masked region but may extend through it in nucleotide searches. Masked areas are ignored entirely in protein or translated searches.">
            <option value="lower">mask out lower cased sequence</option>
            <option value="upper">mask out upper cased sequence</option>
        </param>
        <param name="qMask" type="select" label="Mask out repeats in query sequence" help="Alignments won't be started in masked region but may extend through it in nucleotide searches. Masked areas are ignored entirely in protein or translated searches.">
            <option value="lower">mask out lower cased sequence</option>
            <option value="upper">mask out upper cased sequence</option>
        </param>
        <param name="repeats" type="boolean" truevalue="yes" falsevalue="no" checked="False" label="Report matches in repeats separately?" />

        <!-- Trimming and mRNA/EST handling. noTrimA is inverted on purpose:
             a checked "Trim trailing poly-A" box yields noTrimA == "no". -->
        <param name="trimT" type="boolean" truevalue="yes" falsevalue="no" checked="False" label="Trim leading poly-T" />
        <param name="noTrimA" type="boolean" truevalue="no" falsevalue="yes" checked="True" label="Trim trailing poly-A" />
        <param name="fine" type="boolean" truevalue="yes" falsevalue="no" checked="False" label="For high quality mRNAs look harder for small initial and terminal exons. Not recommended for ESTs" />
        <param name="maxIntron" type="text" size="10" value="750000" label="Maximum intron size" />
        <param name="extendThroughN" type="boolean" truevalue="yes" falsevalue="no" checked="False" label="Extend alignment through large blocks of N's? Not recommended for ESTs" />
    </when>
</conditional>
|
|
|
92 </inputs>
|
|
|
93
|
|
|
<!-- One tabular dataset; its path is handed to the wrapper as "output" in the config file. -->
<outputs>
    <data name="output"
          format="tabular"
          label="${tool.name} on ${on_string}: alignments"/>
</outputs>
|
|
|
97
|
|
|
<configfiles>
    <!-- This config file collects all parameter settings, one "key==value"
         pair per line, and is passed to blat_wrapper.pl as $configfile.
         Every entry, including "range", uses the same "==" separator.
         The template lines and the closing tag are kept flush-left so that no
         leading whitespace ends up in the generated file, and no XML comments
         are placed inside <configfile> because its text content is the
         template. -->
    <configfile name="configfile">
## first we pass some galaxy environment variables
galtemp==${__new_file_path__}

#if $refGenomeSource.genomeSource == "indexed"
referencepath==${refGenomeSource.index.fields.path}
range==$refGenomeSource.range
#else
referencepath==${refGenomeSource.ownFile}
#end if

input==$input
output==$output
q==$q
t==$t

advanced_params.use==$advanced_params.use
#if $advanced_params.use=="yes"
tileSize==$advanced_params.tileSize
stepSize==$advanced_params.stepSize
oneOff==$advanced_params.oneOff
minMatch==$advanced_params.minMatch
minScore==$advanced_params.minScore
maxGap==$advanced_params.maxGap
mask==$advanced_params.mask
qMask==$advanced_params.qMask
repeats==$advanced_params.repeats
trimT==$advanced_params.trimT
noTrimA==$advanced_params.noTrimA
fine==$advanced_params.fine
maxIntron==$advanced_params.maxIntron
extendThroughN==$advanced_params.extendThroughN
#end if

</configfile>
</configfiles>
|
|
|
136
|
|
1
|
<!-- Functional test: aligns a FASTA query against a FASTA database from the
     history with the advanced section enabled and every advanced parameter
     given explicitly. Each parameter is supplied exactly once. -->
<tests>
    <test>
        <!-- Query and database -->
        <param name="input" value="input83.fas" ftype="fasta" />
        <param name="q" value="dna" />
        <param name="genomeSource" value="history" />
        <param name="ownFile" value="blatdatabase1.fas" />
        <param name="t" value="dna" />

        <!-- Advanced parameters -->
        <param name="use" value="yes" />
        <param name="tileSize" value="11" />
        <param name="stepSize" value="11" />
        <param name="oneOff" value="0" />
        <param name="minMatch" value="2" />
        <param name="minScore" value="30" />
        <param name="maxGap" value="2" />
        <param name="mask" value="lower" />
        <param name="qMask" value="lower" />
        <param name="repeats" value="no" />
        <param name="trimT" value="yes" />
        <param name="noTrimA" value="no" />
        <param name="fine" value="no" />
        <param name="maxIntron" value="750000" />
        <param name="extendThroughN" value="no" />

        <!-- Up to two differing lines are tolerated in the comparison. -->
        <output name="output" file="blatoutput1.txt" ftype="tabular" lines_diff="2"/>
    </test>
</tests>
|
|
|
163
|
|
|
164 <help>
|
|
|
165 **BLAT Overview**
|
|
|
166
|
|
|
167 BLAT_ is an alignment tool like BLAST, but it is structured differently.
|
|
|
168 On DNA, Blat works by keeping an index of an entire genome in memory.
|
|
|
169 Thus, the target database of BLAT is not a set of GenBank sequences, but
|
|
|
170 instead an index derived from the assembly of the entire genome. By
|
|
|
171 default, the index consists of all non-overlapping 11-mers except for
|
|
|
172 those heavily involved in repeats.
|
|
|
173
|
|
|
174 .. _BLAT: http://genome.ucsc.edu/FAQ/FAQblat.html
|
|
|
175
|
|
|
176 </help>
|
|
|
177 </tool>
|
|
|
178
|