annotate tools/protein_analysis/tmhmm2.xml @ 12:7ef4b36b026a draft

Uploaded v0.2.1 (removes stray test files)
author peterjc
date Wed, 03 Apr 2013 11:11:43 -0400
parents 391a142c1e60
children c6e5a737d3a0
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
8
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
1 <tool id="tmhmm2" name="TMHMM 2.0" version="0.0.10">
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
2 <description>Find transmembrane domains in protein sequences</description>
7
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
3 <!-- If job splitting is enabled, break up the query file into parts -->
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
4 <!-- Using chunks of 2000 sequences means 4 threads doing 500 each is ideal -->
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
5 <parallelism method="basic" split_inputs="fasta_file" split_mode="to_size" split_size="2000" merge_outputs="tabular_file"></parallelism>
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
6 <command interpreter="python">
7
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
7 tmhmm2.py "\$NSLOTS" $fasta_file $tabular_file
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
8 ##Set the number of threads in the runner entry in universe_wsgi.ini
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
9 ##which (on SGE at least) will set the $NSLOTS environment variable.
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
10 ##If the environment variable isn't set, the script gets "" and defaults to one thread.
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
11 </command>
7
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
12 <stdio>
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
13 <!-- Anything other than zero is an error -->
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
14 <exit_code range="1:" />
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
15 <exit_code range=":-1" />
5e62aefb2918 Uploaded v0.1.2 to Test Tool Shed
peterjc
parents: 6
diff changeset
16 </stdio>
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
17 <inputs>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
18 <param name="fasta_file" type="data" format="fasta" label="FASTA file of protein sequences"/>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
19 <!--
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
20 <param name="version" type="select" display="radio" label="Model version">
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
21 <option value="">Version 1 (old)</option>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
22 <option value="" selected="True">Version 2 (default)</option>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
23 </param>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
24 -->
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
25 </inputs>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
26 <outputs>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
27 <data name="tabular_file" format="tabular" label="TMHMM results" />
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
28 </outputs>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
29 <requirements>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
30 <requirement type="binary">tmhmm</requirement>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
31 </requirements>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
32 <tests>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
33 <test>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
34 <param name="fasta_file" value="four_human_proteins.fasta" ftype="fasta"/>
1
9a8a7f680dd6 Migrated tool version 0.0.3 from old tool shed archive to new tool shed repository
peterjc
parents: 0
diff changeset
35 <output name="tabular_file" file="four_human_proteins.tmhmm2.tabular" ftype="tabular"/>
9a8a7f680dd6 Migrated tool version 0.0.3 from old tool shed archive to new tool shed repository
peterjc
parents: 0
diff changeset
36 </test>
9a8a7f680dd6 Migrated tool version 0.0.3 from old tool shed archive to new tool shed repository
peterjc
parents: 0
diff changeset
37 <test>
9a8a7f680dd6 Migrated tool version 0.0.3 from old tool shed archive to new tool shed repository
peterjc
parents: 0
diff changeset
38 <param name="fasta_file" value="empty.fasta" ftype="fasta"/>
9a8a7f680dd6 Migrated tool version 0.0.3 from old tool shed archive to new tool shed repository
peterjc
parents: 0
diff changeset
39 <output name="tabular_file" file="empty_tmhmm2.tabular" ftype="tabular"/>
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
40 </test>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
41 </tests>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
42 <help>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
43
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
44 **What it does**
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
45
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
46 This calls the TMHMM v2.0 tool for prediction of transmembrane (TM) helices in proteins using a hidden Markov model (HMM).
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
47
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
48 The input is a FASTA file of protein sequences, and the output is tabular with six columns (one row per protein):
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
49
8
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
50 ====== =====================================================================================
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
51 Column Description
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
52 ------ -------------------------------------------------------------------------------------
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
53 1 Sequence identifier
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
54 2 Sequence length
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
55 3 Expected number of amino acids in TM helices (ExpAA). If this number is larger than
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
56 18 it is very likely to be a transmembrane protein (OR have a signal peptide).
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
57 4 Expected number of amino acids in TM helices in the first 60 amino acids of the
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
58 protein (Exp60). If this number is more than a few, be aware that a predicted
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
59 transmembrane helix in the N-term could be a signal peptide.
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
60 5 Number of transmembrane helices predicted by N-best.
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
61 6 Topology predicted by N-best (encoded as a string using o for outside, i for inside)
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
62 ====== =====================================================================================
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
63
1
9a8a7f680dd6 Migrated tool version 0.0.3 from old tool shed archive to new tool shed repository
peterjc
parents: 0
diff changeset
64 Predicted TM segments in the N-terminal region sometimes turn out to be signal peptides.
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
65
1
9a8a7f680dd6 Migrated tool version 0.0.3 from old tool shed archive to new tool shed repository
peterjc
parents: 0
diff changeset
66 One of the most common mistakes by the program is to reverse the direction of proteins with one TM segment (i.e. mixing up which end of the protein is outside and inside the membrane).
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
67
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
68 Do not use the program to predict whether a non-membrane protein is cytoplasmic or not.
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
69
8
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
70
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
71 **Notes**
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
72
2
747cec3192d3 Migrated tool version 0.0.5 from old tool shed archive to new tool shed repository
peterjc
parents: 1
diff changeset
73 The short format output from TMHMM v2.0 looks like this (six columns tab separated, shown here as a table):
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
74
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
75 =================================== ======= =========== ============= ========= =============================
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
76 gi|2781234|pdb|1JLY|B len=304 ExpAA=0.01 First60=0.00 PredHel=0 Topology=o
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
77 gi|4959044|gb|AAD34209.1|AF069992_1 len=600 ExpAA=0.00 First60=0.00 PredHel=0 Topology=o
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
78 gi|671626|emb|CAA85685.1| len=473 ExpAA=0.19 First60=0.00 PredHel=0 Topology=o
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
79 gi|3298468|dbj|BAA31520.1| len=107 ExpAA=59.37 First60=31.17 PredHel=3 Topology=o23-45i52-74o89-106i
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
80 =================================== ======= =========== ============= ========= =============================
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
81
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
82 In order to make it easier to use in Galaxy, the wrapper script simplifies this to remove the redundant tags, and instead adds a comment line at the top with the column names:
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
83
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
84 =================================== === ===== ======= ======= ====================
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
85 #ID len ExpAA First60 PredHel Topology
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
86 gi|2781234|pdb|1JLY|B 304 0.01 0.00 0 o
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
87 gi|4959044|gb|AAD34209.1|AF069992_1 600 0.00 0.00 0 o
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
88 gi|671626|emb|CAA85685.1| 473 0.19 0.00 0 o
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
89 gi|3298468|dbj|BAA31520.1| 107 59.37 31.17 3 o23-45i52-74o89-106i
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
90 =================================== === ===== ======= ======= ====================
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
91
8
391a142c1e60 Uploaded
peterjc
parents: 7
diff changeset
92
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
93 **References**
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
94
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
95 Krogh, Larsson, von Heijne, and Sonnhammer.
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
96 Predicting Transmembrane Protein Topology with a Hidden Markov Model: Application to Complete Genomes.
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
97 J. Mol. Biol. 305:567-580, 2001.
6
39a6e46cdda3 Migrated tool version 0.0.9 from old tool shed archive to new tool shed repository
peterjc
parents: 3
diff changeset
98 http://dx.doi.org/10.1006/jmbi.2000.4315
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
99
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
100 Sonnhammer, von Heijne, and Krogh.
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
101 A hidden Markov model for predicting transmembrane helices in protein sequences.
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
102 In J. Glasgow et al., eds.: Proc. Sixth Int. Conf. on Intelligent Systems for Molecular Biology, pages 175-182. AAAI Press, 1998.
6
39a6e46cdda3 Migrated tool version 0.0.9 from old tool shed archive to new tool shed repository
peterjc
parents: 3
diff changeset
103 http://www.ncbi.nlm.nih.gov/pubmed/9783223
39a6e46cdda3 Migrated tool version 0.0.9 from old tool shed archive to new tool shed repository
peterjc
parents: 3
diff changeset
104
39a6e46cdda3 Migrated tool version 0.0.9 from old tool shed archive to new tool shed repository
peterjc
parents: 3
diff changeset
105 http://www.cbs.dtu.dk/services/TMHMM/
0
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
106
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
107 </help>
a2eeeaa6f75e Migrated tool version 0.0.1 from old tool shed archive to new tool shed repository
peterjc
parents:
diff changeset
108 </tool>