annotate cmsearch.xml @ 11:5c6344f67ad0 draft

Uploaded
author bgruening
date Sun, 08 Sep 2013 06:48:18 -0400
parents 0bffd4183326
children c17ed5a530d2
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
4
351013907f11 Uploaded
bgruening
parents: 3
diff changeset
1 <tool id="infernal_cmsearch" name="Search covariance model(s)" version="1.1.0.1">
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
2 <description>against a sequence database (cmsearch)</description>
5
2b3adbe83979 Uploaded
bgruening
parents: 4
diff changeset
3 <parallelism method="multi" split_inputs="seqdb" split_mode="to_size" split_size="100" shared_inputs="" merge_outputs="outfile,multiple_alignment_output"></parallelism>
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
4 <requirements>
9
1aa4c036e41c Uploaded
bgruening
parents: 8
diff changeset
5 <requirement type="package">infernal</requirement>
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
6 <requirement type="package" version="1.1rc4">infernal</requirement>
7
46128c3865b8 Uploaded
bgruening
parents: 6
diff changeset
7 <requirement type="package" version="8.21">gnu_coreutils</requirement>
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
8 </requirements>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
9 <command>
9
1aa4c036e41c Uploaded
bgruening
parents: 8
diff changeset
10 ## a temp file is needed, because the standard tabular output from infernal is not useful in Galaxy
1aa4c036e41c Uploaded
bgruening
parents: 8
diff changeset
11 ## it will be converted to a tab delimited file and piped to Galaxy
8
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
12 temp_tabular_output=\$(mktemp);
5
2b3adbe83979 Uploaded
bgruening
parents: 4
diff changeset
13
2b3adbe83979 Uploaded
bgruening
parents: 4
diff changeset
14 cmsearch
9
1aa4c036e41c Uploaded
bgruening
parents: 8
diff changeset
15 ## Infernal Options
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
16 --cpu "\${GALAXY_SLOTS:-12}" ## use the cores Galaxy allocated to this job, fall back to 12 if unset
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
17 -o /dev/null
5
2b3adbe83979 Uploaded
bgruening
parents: 4
diff changeset
18 --tformat $seqdb.ext ##target format: fasta, embl, genbank, ddbj, stockholm, pfam, a2m, afa, clustal, and phylip
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
19 $bottomonly
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
20 $toponly
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
21 $cyk
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
22 $notrunc
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
23 $max
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
24 $nohmm
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
25 $mid
8
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
26 ##$bitscore_thresholds
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
27 --tblout \$temp_tabular_output
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
28 $g
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
29 #if $A:
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
30 $A $multiple_alignment_output
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
31 #end if
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
32
11
5c6344f67ad0 Uploaded
bgruening
parents: 10
diff changeset
33 #if str($inclusion_thresholds_opts.inclusion_thresholds_selector) == "--incE":
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
34 --incE $inclusion_thresholds_opts.incE
11
5c6344f67ad0 Uploaded
bgruening
parents: 10
diff changeset
35 #elif str($inclusion_thresholds_opts.inclusion_thresholds_selector) == "--incT":
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
36 --incT $inclusion_thresholds_opts.incT
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
37 #end if
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
38
11
5c6344f67ad0 Uploaded
bgruening
parents: 10
diff changeset
39 #if str($reporting_thresholds_opts.reporting_thresholds_selector) == "-E":
3
a5ef9159caa9 Uploaded
bgruening
parents: 2
diff changeset
40 -E $reporting_thresholds_opts.E
11
5c6344f67ad0 Uploaded
bgruening
parents: 10
diff changeset
41 #elif str($reporting_thresholds_opts.reporting_thresholds_selector) == "-T":
3
a5ef9159caa9 Uploaded
bgruening
parents: 2
diff changeset
42 -T $reporting_thresholds_opts.T
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
43 #end if
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
44
9
1aa4c036e41c Uploaded
bgruening
parents: 8
diff changeset
45 ## CM file from the history or stored as database on disc
1aa4c036e41c Uploaded
bgruening
parents: 8
diff changeset
46
11
5c6344f67ad0 Uploaded
bgruening
parents: 10
diff changeset
47 #if str($cm_opts.cm_opts_selector) == "db":
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
48 $cm_opts.database.fields.path
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
49 #else:
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
50 $cm_opts.cmfile
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
51 #end if
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
52
9
1aa4c036e41c Uploaded
bgruening
parents: 8
diff changeset
53 ## sequence file
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
54 $seqdb
6
c650ee099c51 Uploaded
bgruening
parents: 5
diff changeset
55 2>&#38;1
c650ee099c51 Uploaded
bgruening
parents: 5
diff changeset
56 ;
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
57
8
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
58 ## 1. strip everything from a '#' to the end of the line (comment lines) and delete the resulting empty lines
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
59 ## 2. collapse every run of spaces into one tab, then turn the 18th and all later tabs back into spaces: the 18th field is a free text field (can contain spaces)
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
60 sed -e 's/#.*$//' -e '/^$/d' -e 's/ \+/\t/g' -e 's/\t/ /18g' \$temp_tabular_output > $outfile; rm -f \$temp_tabular_output ## finally remove the temp file
6
c650ee099c51 Uploaded
bgruening
parents: 5
diff changeset
61
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
62 </command>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
63 <inputs>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
64
3
a5ef9159caa9 Uploaded
bgruening
parents: 2
diff changeset
65 <param name="seqdb" type="data" format="fasta" label="Sequence database"/>
10
0bffd4183326 Uploaded
bgruening
parents: 9
diff changeset
66
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
67 <conditional name="cm_opts">
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
68 <param name="cm_opts_selector" type="select" label="Subject covariance models">
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
69 <option value="db" selected="True">Locally installed covariance models</option>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
70 <option value="histdb">Covariance model from your history</option>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
71 </param>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
72 <when value="db">
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
73 <param name="database" type="select" label="Covariance models">
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
74 <options from_file="infernal.loc">
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
75 <column name="value" index="0"/>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
76 <column name="name" index="1"/>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
77 <column name="path" index="2"/>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
78 </options>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
79 </param>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
80 </when>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
81 <when value="histdb">
9
1aa4c036e41c Uploaded
bgruening
parents: 8
diff changeset
82 <param name="cmfile" type="data" format="cm" label="Covariance models file from the history."/>
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
83 </when>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
84 </conditional>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
85
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
86 <param name="g" truevalue="-g" falsevalue="" checked="False" type="boolean"
3
a5ef9159caa9 Uploaded
bgruening
parents: 2
diff changeset
87 label="Turn on the glocal alignment algorithm" help="... global with respect to the query model and local with respect to the target database."/>
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
88
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
89 <param name="bottomonly" truevalue="--bottomonly" falsevalue="" checked="False" type="boolean"
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
90 label="Only search the bottom (Crick) strand of target sequences" help="in the sequence database"/>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
91 <param name="toponly" truevalue="--toponly" falsevalue="" checked="False" type="boolean"
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
92 label="Only search the top (Watson) strand of target sequences" help="in the sequence database"/>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
93
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
94 <param name="cyk" truevalue="--cyk" falsevalue="" checked="False" type="boolean"
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
95 label="Use the CYK algorithm, not Inside, to determine the final score of all hits" help=""/>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
96 <param name="acyk" truevalue="--acyk" falsevalue="" checked="False" type="boolean"
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
97 label="Use the CYK algorithm to align hits" help="By default, the Durbin/Holmes optimal accuracy algorithm is used, which finds the alignment that maximizes the expected accuracy of all aligned residues."/> <!-- NOTE(review): this parameter is not referenced in the command section yet; it has no effect until it is added next to the cyk option there -->
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
98
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
99 <param name="notrunc" truevalue="--notrunc" falsevalue="" checked="False" type="boolean"
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
100 label="Turn off truncated hit detection" help=""/>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
101
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
102 <!-- acceleration pipeline -->
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
103
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
104 <param name="max" truevalue="--max" falsevalue="" checked="False" type="boolean"
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
105 label="Turn off all filters, and run non-banded Inside on every full-length target sequence" help="This
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
106 increases sensitivity somewhat, at an extremely large cost in speed."/>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
107
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
108 <param name="nohmm" truevalue="--nohmm" falsevalue="" checked="False" type="boolean"
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
109 label="Turn off all HMM filter stages " help=""/>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
110
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
111 <param name="mid" truevalue="--mid" falsevalue="" checked="False" type="boolean"
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
112 label="Turn off the HMM SSV and Viterbi filter stages" help=""/>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
113
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
114
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
115 <!-- Options for model-specific score thresholding -->
8
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
116 <!--
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
117 <param name="bitscore_thresholds" type="select" label="Bit score thresholds" help="Curated CM databases may define specific bit score thresholds for each CM, superseding any thresholding based on statistical significance alone.">
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
118 <option value="" selected="true">None</option>
8
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
119 <option value=" - -cut_ga">GA (gathering) bit scores</option>
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
120 <option value=" - -cut_nc">NC (noise cutoff) bit score</option>
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
121 <option value=" - -cut_tc">TC (trusted cutoff) bit score</option>
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
122 </param>
8
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
123 -->
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
124 <!-- Options for inclusion thresholds -->
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
125
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
126
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
127 <conditional name="inclusion_thresholds_opts">
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
128 <param name="inclusion_thresholds_selector" type="select" label="Inclusion thresholds"
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
129 help="Inclusion thresholds are stricter than reporting thresholds. Inclusion thresholds control which hits are considered to be reliable enough to be included in an output alignment or in a possible subsequent search round, or marked as significant (”!”) as opposed to questionable (”?”) in hit output.">
6
c650ee099c51 Uploaded
bgruening
parents: 5
diff changeset
130 <option value="" selected="true">default</option>
c650ee099c51 Uploaded
bgruening
parents: 5
diff changeset
131 <option value="--incE">Use E-value</option>
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
132 <option value="--incT">Use bit score</option>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
133 </param>
6
c650ee099c51 Uploaded
bgruening
parents: 5
diff changeset
134 <when value=""/> <!-- matches the "default" option (value=""): no extra parameters -->
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
135 <when value="--incE">
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
136 <param name="incE" type="float" value="0.01" size="5" label="Use E-value" help="of &lt;= X as the hit inclusion threshold.">
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
137 <sanitizer>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
138 <valid initial="string.printable">
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
139 <remove value="&apos;"/>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
140 </valid>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
141 </sanitizer>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
142 </param>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
143 </when>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
144 <when value="--incT">
2
468be760eba3 Uploaded
bgruening
parents: 1
diff changeset
145 <param name="incT" type="integer" size="5" value="0" label="Use bit score" help="of >= X as the hit inclusion threshold.">
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
146 <sanitizer>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
147 <valid initial="string.printable">
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
148 <remove value="&apos;"/>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
149 </valid>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
150 </sanitizer>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
151 </param>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
152 </when>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
153 </conditional>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
154
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
155 <!-- Options controlling reporting thresholds -->
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
156
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
157 <conditional name="reporting_thresholds_opts">
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
158 <param name="reporting_thresholds_selector" type="select" label="reporting thresholds"
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
159 help="Reporting thresholds control which hits are reported in output files">
6
c650ee099c51 Uploaded
bgruening
parents: 5
diff changeset
160 <option value="" selected="true">default</option>
c650ee099c51 Uploaded
bgruening
parents: 5
diff changeset
161 <option value="-E">Use E-value</option>
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
162 <option value="-T">Use bit score</option>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
163 </param>
6
c650ee099c51 Uploaded
bgruening
parents: 5
diff changeset
164 <when value=""/> <!-- matches the "default" option (value=""): no extra parameters -->
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
165 <when value="-E">
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
166 <param name="E" type="float" value="10.0" size="5" label="Use E-value" help="of &lt;= X as the hit reporting threshold. The default is 10.0, meaning that on average, about 10 false positives will be reported per query, so you can see the top of the noise and decide for yourself if it’s really noise.">
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
167 <sanitizer>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
168 <valid initial="string.printable">
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
169 <remove value="&apos;"/>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
170 </valid>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
171 </sanitizer>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
172 </param>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
173 </when>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
174 <when value="-T">
2
468be760eba3 Uploaded
bgruening
parents: 1
diff changeset
175 <param name="T" type="integer" size="5" value="0" label="Use bit score" help="of >= X as the hit reporting threshold.">
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
176 <sanitizer>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
177 <valid initial="string.printable">
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
178 <remove value="&apos;"/>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
179 </valid>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
180 </sanitizer>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
181 </param>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
182 </when>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
183 </conditional>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
184
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
185 <param name="A" truevalue="-A" falsevalue="" checked="False" type="boolean"
5
2b3adbe83979 Uploaded
bgruening
parents: 4
diff changeset
186 label="Save a multiple alignment of all significant hits" help="... those satisfying inclusion thresholds"/>
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
187
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
188 </inputs>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
189 <outputs>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
190
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
191 <data format="tabular" name="outfile" label="cmsearch on ${on_string}"/>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
192 <data format="tabular" name="multiple_alignment_output" label="cmsearch on ${on_string} (multi alignment)">
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
193 <filter>A is True</filter>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
194 </data>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
195
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
196 </outputs>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
197 <help>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
198
7
46128c3865b8 Uploaded
bgruening
parents: 6
diff changeset
199
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
200 **What it does**
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
201
8
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
202 Infernal is used to search sequence databases for homologs of structural RNA sequences, and to make
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
203 sequence- and structure-based RNA sequence alignments. Infernal needs a profile from a structurally
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
204 annotated multiple sequence alignment of an RNA family with a position-specific scoring system for substitutions,
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
205 insertions, and deletions. Positions in the profile that are basepaired in the consensus secondary
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
206 structure of the alignment are modeled as dependent on one another, allowing Infernal’s scoring system to
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
207 consider the secondary structure, in addition to the primary sequence, of the family being modeled. Infernal
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
208 profiles are probabilistic models called “covariance models”, a specialized type of stochastic context-free
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
209 grammar (SCFG) (Lari and Young, 1990).
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
210
8
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
211 Compared to other alignment and database search tools based only on sequence comparison, Infernal
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
212 aims to be significantly more accurate and more able to detect remote homologs because it models sequence
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
213 and structure.
7
46128c3865b8 Uploaded
bgruening
parents: 6
diff changeset
214
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
215
7
46128c3865b8 Uploaded
bgruening
parents: 6
diff changeset
216 Output format
46128c3865b8 Uploaded
bgruening
parents: 6
diff changeset
217 -------------
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
218
5
2b3adbe83979 Uploaded
bgruening
parents: 4
diff changeset
219 (1) target name: The name of the target sequence or profile.
2b3adbe83979 Uploaded
bgruening
parents: 4
diff changeset
220 (2) accession: The accession of the target sequence or profile, or ’-’ if none.
2b3adbe83979 Uploaded
bgruening
parents: 4
diff changeset
221 (3) query name: The name of the query sequence or profile.
2b3adbe83979 Uploaded
bgruening
parents: 4
diff changeset
222 (4) accession: The accession of the query sequence or profile, or ’-’ if none.
7
46128c3865b8 Uploaded
bgruening
parents: 6
diff changeset
223 (5) mdl (model): Which type of model was used to compute the final score. Either ’cm’ or ’hmm’. A CM is used to compute the final hit scores unless the model has zero basepairs or the --hmmonly option is used, in which case a HMM will be used.
46128c3865b8 Uploaded
bgruening
parents: 6
diff changeset
224 (6) mdl from (model coord): The start of the alignment of this hit with respect to the profile (CM or HMM), numbered 1..N for a profile of N consensus positions.
46128c3865b8 Uploaded
bgruening
parents: 6
diff changeset
225 (7) mdl to (model coord): The end of the alignment of this hit with respect to the profile (CM or HMM), numbered 1..N for a profile of N consensus positions.
46128c3865b8 Uploaded
bgruening
parents: 6
diff changeset
226 (8) seq from (ali coord): The start of the alignment of this hit with respect to the sequence, numbered 1..L for a sequence of L residues.
46128c3865b8 Uploaded
bgruening
parents: 6
diff changeset
227 (9) seq to (ali coord): The end of the alignment of this hit with respect to the sequence, numbered 1..L for a sequence of L residues.
46128c3865b8 Uploaded
bgruening
parents: 6
diff changeset
228 (10) strand: The strand on which the hit occurs on the sequence. ’+’ if the hit is on the top (Watson) strand, ’-’ if the hit is on the bottom (Crick) strand. If on the top strand, the “seq from” value will be less than or equal to the “seq to” value, else it will be greater than or equal to it.
46128c3865b8 Uploaded
bgruening
parents: 6
diff changeset
229 (11) trunc: Indicates if this is predicted to be a truncated CM hit or not. This will be “no” if it is a CM hit that is not predicted to be truncated by the end of the sequence, “5’” or “3’” if the hit is predicted to have one or more 5’ or 3’ residues missing due to an artificial truncation of the sequence, or “5’&amp;3’” if the hit is predicted to have one or more 5’ residues missing and one or more 3’ residues missing. If the hit is an HMM hit, this will always be ’-’.
46128c3865b8 Uploaded
bgruening
parents: 6
diff changeset
230 (12) pass: Indicates what “pass” of the pipeline the hit was detected on. This is probably only useful for testing and debugging. Non-truncated hits are found on the first pass, truncated hits are found on successive passes.
5
2b3adbe83979 Uploaded
bgruening
parents: 4
diff changeset
231 (13) gc: Fraction of G and C nucleotides in the hit.
7
46128c3865b8 Uploaded
bgruening
parents: 6
diff changeset
232 (14) bias: The biased-composition correction: the bit score difference contributed by the null3 model for CM hits, or the null2 model for HMM hits. High bias scores may be a red flag for a false positive. It is difficult to correct for all possible ways in which nonrandom but nonhomologous biological sequences can appear to be similar, such as short-period tandem repeats, so there are cases where the bias correction is not strong enough (creating false positives).
46128c3865b8 Uploaded
bgruening
parents: 6
diff changeset
233 (15) score: The score (in bits) for this target/query comparison. It includes the biased-composition correction (the “null3” model for CM hits, or the “null2” model for HMM hits).
46128c3865b8 Uploaded
bgruening
parents: 6
diff changeset
234 (16) E-value: The expectation value (statistical significance) of the target. This is a per query E-value; i.e. calculated as the expected number of false positives achieving this comparison’s score for a single query against the search space Z. For cmsearch Z is defined as the total number of nucleotides in the target dataset multiplied by 2 because both strands are searched. For cmscan Z is the total number of nucleotides in the query sequence multiplied by 2 because both strands are searched and multiplied by the number of models in the target database. If you search with multiple queries and if you want to control the overall false positive rate of that search rather than the false positive rate per query, you will want to multiply this per-query E-value by how many queries you’re doing.
46128c3865b8 Uploaded
bgruening
parents: 6
diff changeset
235 (17) inc: Indicates whether or not this hit achieves the inclusion threshold: ’!’ if it does, ’?’ if it does not (and rather only achieves the reporting threshold). By default, the inclusion threshold is an E-value of 0.01 and the reporting threshold is an E-value of 10.0, but these can be changed with command line options as described in the manual pages.
5
2b3adbe83979 Uploaded
bgruening
parents: 4
diff changeset
236 (18) description of target: The remainder of the line is the target’s description line, as free text.
2b3adbe83979 Uploaded
bgruening
parents: 4
diff changeset
237
2b3adbe83979 Uploaded
bgruening
parents: 4
diff changeset
238
8
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
239 For further questions please refer to the Infernal Userguide_.
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
240
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
241 .. _Userguide: http://selab.janelia.org/software/infernal/Userguide.pdf
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
242
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
243
8
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
244 How do I cite Infernal?
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
245 -----------------------
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
246
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
247 The Infernal 1.0 paper (Nawrocki et al., 2009) is the best paper to reference.
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
248 If you’re writing for an enlightened (url-friendly) journal, you may want to cite the webpage
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
249 http://infernal.janelia.org/ because it is kept up-to-date. We hope to publish a paper related to
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
250 Infernal version 1.1 soon.
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
251
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
252 **Galaxy Wrapper Author**::
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
253
b0f9aca4a34f Uploaded
bgruening
parents: 7
diff changeset
254 * Bjoern Gruening, University of Freiburg
7
46128c3865b8 Uploaded
bgruening
parents: 6
diff changeset
255
1
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
256 </help>
26ef7e66c39b Uploaded
bgruening
parents:
diff changeset
257 </tool>