annotate tools/protein_analysis/tmhmm2.xml @ 25:41a42022f815 draft

Uploaded v0.2.6, embedded citations
author peterjc
date Fri, 21 Nov 2014 08:17:36 -0500
parents 90e3d02f8013
children 20139cb4c844
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
25
41a42022f815 Uploaded v0.2.6, embedded citations
peterjc
parents: 22
diff changeset
1 <tool id="tmhmm2" name="TMHMM 2.0" version="0.0.13">
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
2 <description>Find transmembrane domains in protein sequences</description>
7
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
3 <!-- If job splitting is enabled, break up the query file into parts -->
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
4 <!-- Chunks of 2000 sequences are ideal: 4 threads then process 500 each -->
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
5 <parallelism method="basic" split_inputs="fasta_file" split_mode="to_size" split_size="2000" merge_outputs="tabular_file"></parallelism>
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
6 <command interpreter="python">
25
41a42022f815 Uploaded v0.2.6, embedded citations
peterjc
parents: 22
diff changeset
7 tmhmm2.py "\$GALAXY_SLOTS" $fasta_file $tabular_file
19
4cd848c5590b Uploaded v0.2.5 preview 3, use $NSLOTS in the PSORT wrappers.
peterjc
parents: 17
diff changeset
8 ##If the environment variable isn't set, get "", and the python wrapper
4cd848c5590b Uploaded v0.2.5 preview 3, use $NSLOTS in the PSORT wrappers.
peterjc
parents: 17
diff changeset
9 ##defaults to four threads.
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
10 </command>
7
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
11 <stdio>
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
12 <!-- Anything other than zero is an error -->
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
13 <exit_code range="1:" />
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
14 <exit_code range=":-1" />
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
15 </stdio>
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
16 <inputs>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
17 <param name="fasta_file" type="data" format="fasta" label="FASTA file of protein sequences"/>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
18 <!--
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
19 <param name="version" type="select" display="radio" label="Model version">
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
20 <option value="">Version 1 (old)</option>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
21 <option value="" selected="True">Version 2 (default)</option>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
22 </param>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
23 -->
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
24 </inputs>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
25 <outputs>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
26 <data name="tabular_file" format="tabular" label="TMHMM results" />
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
27 </outputs>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
28 <requirements>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
29 <requirement type="binary">tmhmm</requirement>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
30 </requirements>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
31 <tests>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
32 <test>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
33 <param name="fasta_file" value="four_human_proteins.fasta" ftype="fasta"/>
1
9a8a7f680dd6 Migrated tool version 0.0.3 from old tool shed archive to new tool shed repository
peterjc
parents: 0
diff changeset
34 <output name="tabular_file" file="four_human_proteins.tmhmm2.tabular" ftype="tabular"/>
9a8a7f680dd6 Migrated tool version 0.0.3 from old tool shed archive to new tool shed repository
peterjc
parents: 0
diff changeset
35 </test>
9a8a7f680dd6 Migrated tool version 0.0.3 from old tool shed archive to new tool shed repository
peterjc
parents: 0
diff changeset
36 <test>
9a8a7f680dd6 Migrated tool version 0.0.3 from old tool shed archive to new tool shed repository
peterjc
parents: 0
diff changeset
37 <param name="fasta_file" value="empty.fasta" ftype="fasta"/>
9a8a7f680dd6 Migrated tool version 0.0.3 from old tool shed archive to new tool shed repository
peterjc
parents: 0
diff changeset
38 <output name="tabular_file" file="empty_tmhmm2.tabular" ftype="tabular"/>
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
39 </test>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
40 </tests>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
41 <help>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
42
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
43 **What it does**
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
44
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
45 This calls the TMHMM v2.0 tool for prediction of transmembrane (TM) helices in proteins using a hidden Markov model (HMM).
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
46
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
47 The input is a FASTA file of protein sequences, and the output is tabular with six columns (one row per protein):
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
48
8
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
49 ====== =====================================================================================
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
50 Column Description
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
51 ------ -------------------------------------------------------------------------------------
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
52 1 Sequence identifier
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
53 2 Sequence length
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
54 3 Expected number of amino acids in TM helices (ExpAA). If this number is larger than
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
55 18 it is very likely to be a transmembrane protein (OR have a signal peptide).
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
56 4 Expected number of amino acids in TM helices in the first 60 amino acids of the
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
57 protein (Exp60). If this number is more than a few, be aware that a predicted
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
58 transmembrane helix in the N-term could be a signal peptide.
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
59 5 Number of transmembrane helices predicted by N-best.
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
60 6 Topology predicted by N-best (encoded as a string using o for outside, i for inside)
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
61 ====== =====================================================================================
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
62
1
9a8a7f680dd6 Migrated tool version 0.0.3 from old tool shed archive to new tool shed repository
peterjc
parents: 0
diff changeset
63 Predicted TM segments in the N-terminal region sometimes turn out to be signal peptides.
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
64
1
9a8a7f680dd6 Migrated tool version 0.0.3 from old tool shed archive to new tool shed repository
peterjc
parents: 0
diff changeset
65 One of the most common mistakes by the program is to reverse the direction of proteins with one TM segment (i.e. mixing up which end of the protein is outside and inside the membrane).
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
66
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
67 Do not use the program to predict whether a non-membrane protein is cytoplasmic or not.
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
68
8
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
69
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
70 **Notes**
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
71
2
747cec3192d3 Migrated tool version 0.0.5 from old tool shed archive to new tool shed repository
peterjc
parents: 1
diff changeset
72 The short format output from TMHMM v2.0 looks like this (six columns tab separated, shown here as a table):
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
73
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
74 =================================== ======= =========== ============= ========= =============================
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
75 gi|2781234|pdb|1JLY|B len=304 ExpAA=0.01 First60=0.00 PredHel=0 Topology=o
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
76 gi|4959044|gb|AAD34209.1|AF069992_1 len=600 ExpAA=0.00 First60=0.00 PredHel=0 Topology=o
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
77 gi|671626|emb|CAA85685.1| len=473 ExpAA=0.19 First60=0.00 PredHel=0 Topology=o
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
78 gi|3298468|dbj|BAA31520.1| len=107 ExpAA=59.37 First60=31.17 PredHel=3 Topology=o23-45i52-74o89-106i
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
79 =================================== ======= =========== ============= ========= =============================
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
80
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
81 In order to make it easier to use in Galaxy, the wrapper script simplifies this to remove the redundant tags, and instead adds a comment line at the top with the column names:
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
82
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
83 =================================== === ===== ======= ======= ====================
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
84 #ID len ExpAA First60 PredHel Topology
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
85 gi|2781234|pdb|1JLY|B 304 0.01 0.00 0 o
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
86 gi|4959044|gb|AAD34209.1|AF069992_1 600 0.00 0.00 0 o
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
87 gi|671626|emb|CAA85685.1| 473 0.19 0.00 0 o
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
88 gi|3298468|dbj|BAA31520.1| 107 59.37 31.17 3 o23-45i52-74o89-106i
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
89 =================================== === ===== ======= ======= ====================
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
90
8
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
91
13
c6e5a737d3a0 Uploaded v0.2.2, was missing some test files
peterjc
parents: 8
diff changeset
92 -----
c6e5a737d3a0 Uploaded v0.2.2, was missing some test files
peterjc
parents: 8
diff changeset
93
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
94 **References**
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
95
20
a538e182fab3 Uploaded v0.2.5 preview 4, adding Cock et al. 2003 citation information.
peterjc
parents: 19
diff changeset
96 If you use this Galaxy tool in work leading to a scientific publication please
a538e182fab3 Uploaded v0.2.5 preview 4, adding Cock et al. 2003 citation information.
peterjc
parents: 19
diff changeset
97 cite the following papers:
a538e182fab3 Uploaded v0.2.5 preview 4, adding Cock et al. 2003 citation information.
peterjc
parents: 19
diff changeset
98
22
90e3d02f8013 Uploaded v0.2.5 preview 6, can use accents in <help> RST
peterjc
parents: 20
diff changeset
99 Peter J.A. Cock, Björn A. Grüning, Konrad Paszkiewicz and Leighton Pritchard (2013).
20
a538e182fab3 Uploaded v0.2.5 preview 4, adding Cock et al. 2003 citation information.
peterjc
parents: 19
diff changeset
100 Galaxy tools and workflows for sequence analysis with applications
a538e182fab3 Uploaded v0.2.5 preview 4, adding Cock et al. 2003 citation information.
peterjc
parents: 19
diff changeset
101 in molecular plant pathology. PeerJ 1:e167
a538e182fab3 Uploaded v0.2.5 preview 4, adding Cock et al. 2003 citation information.
peterjc
parents: 19
diff changeset
102 http://dx.doi.org/10.7717/peerj.167
a538e182fab3 Uploaded v0.2.5 preview 4, adding Cock et al. 2003 citation information.
peterjc
parents: 19
diff changeset
103
a538e182fab3 Uploaded v0.2.5 preview 4, adding Cock et al. 2003 citation information.
peterjc
parents: 19
diff changeset
104 Krogh, Larsson, von Heijne, and Sonnhammer (2001).
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
105 Predicting Transmembrane Protein Topology with a Hidden Markov Model: Application to Complete Genomes.
20
a538e182fab3 Uploaded v0.2.5 preview 4, adding Cock et al. 2003 citation information.
peterjc
parents: 19
diff changeset
106 J. Mol. Biol. 305:567-580.
6
39a6e46cdda3 Migrated tool version 0.0.9 from old tool shed archive to new tool shed repository
peterjc
parents: 3
diff changeset
107 http://dx.doi.org/10.1006/jmbi.2000.4315
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
108
20
a538e182fab3 Uploaded v0.2.5 preview 4, adding Cock et al. 2003 citation information.
peterjc
parents: 19
diff changeset
109 Sonnhammer, von Heijne, and Krogh (1998).
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
110 A hidden Markov model for predicting transmembrane helices in protein sequences.
20
a538e182fab3 Uploaded v0.2.5 preview 4, adding Cock et al. 2003 citation information.
peterjc
parents: 19
diff changeset
111 In J. Glasgow et al., eds.: Proc. Sixth Int. Conf. on Intelligent Systems for Molecular Biology, pages 175-182. AAAI Press.
6
39a6e46cdda3 Migrated tool version 0.0.9 from old tool shed archive to new tool shed repository
peterjc
parents: 3
diff changeset
112 http://www.ncbi.nlm.nih.gov/pubmed/9783223
39a6e46cdda3 Migrated tool version 0.0.9 from old tool shed archive to new tool shed repository
peterjc
parents: 3
diff changeset
113
20
a538e182fab3 Uploaded v0.2.5 preview 4, adding Cock et al. 2003 citation information.
peterjc
parents: 19
diff changeset
114 See also http://www.cbs.dtu.dk/services/TMHMM/
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
115
17
af3174637834 Uploaded v0.2.5 preview 1, adding links to Tool Shed entry
peterjc
parents: 13
diff changeset
116 This wrapper is available to install into other Galaxy Instances via the Galaxy
af3174637834 Uploaded v0.2.5 preview 1, adding links to Tool Shed entry
peterjc
parents: 13
diff changeset
117 Tool Shed at http://toolshed.g2.bx.psu.edu/view/peterjc/tmhmm_and_signalp
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
118 </help>
25
41a42022f815 Uploaded v0.2.6, embedded citations
peterjc
parents: 22
diff changeset
119 <citations>
41a42022f815 Uploaded v0.2.6, embedded citations
peterjc
parents: 22
diff changeset
120 <citation type="doi">10.7717/peerj.167</citation>
41a42022f815 Uploaded v0.2.6, embedded citations
peterjc
parents: 22
diff changeset
121 <citation type="doi">10.1006/jmbi.2000.4315</citation>
41a42022f815 Uploaded v0.2.6, embedded citations
peterjc
parents: 22
diff changeset
122 <!-- TODO - add entry for PMID: 9783223 -->
41a42022f815 Uploaded v0.2.6, embedded citations
peterjc
parents: 22
diff changeset
123 </citations>
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
124 </tool>