annotate tools/protein_analysis/psortb.xml @ 11:3d74c1176d67 draft

Uploaded minor fix
author peterjc
date Wed, 03 Apr 2013 10:47:50 -0400
parents 391a142c1e60
children af3174637834
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
8
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
1 <tool id="Psortb" name="psortb" version="0.0.1">
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
2 <description>Determines sub-cellular localisation of bacterial/archaeal protein sequences</description>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
3 <!-- If job splitting is enabled, break up the query file into parts -->
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
4 <!-- Using chunks of 2000 sequences, meaning 4 threads doing 500 each is ideal -->
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
5 <parallelism method="basic" split_inputs="sequence" split_mode="to_size" split_size="2000" merge_outputs="outfile"></parallelism>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
6 <version_command interpreter="python">psortb.py --version</version_command>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
7 <command interpreter="python">psortb.py "\$NSLOTS" "$type" "$long" "$cutoff" "$divergent" "$sequence" "$outfile"</command>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
8 <stdio>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
9 <!-- Anything other than zero is an error -->
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
10 <exit_code range="1:" />
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
11 <exit_code range=":-1" />
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
12 </stdio>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
13 <inputs>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
14 <param format="fasta" name="sequence" type="data"
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
15 label="Input sequences for which to predict localisation (protein FASTA format)" />
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
16 <param name="type" type="select"
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
17 label="Organism type (N.B. all sequences in the above file must be of the same type)" >
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
18 <option value="-p">Gram positive bacteria</option>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
19 <option value="-n">Gram negative bacteria</option>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
20 <option value="-a">Archaea</option>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
21 </param>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
22 <param name="long" type="select" label="Output type">
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
23 <option value="terse">Short (terse, tabular with 3 columns)</option>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
24 <!-- The normal output is text, not tabular - worth offering?
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
25 <option value="normal">Normal</option>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
26 -->
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
27 <option value="long">Long (verbose, tabular with about 30 columns, depending on organism type)</option>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
28 </param>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
29 <param name="cutoff" size="10" type="float" optional="true" value=""
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
30 label="Sets a cutoff value for reported results (e.g. 7.5)"
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
31 help="Leave blank or use zero for no cutoff." />
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
32 <param name="divergent" size="10" type="float" optional="true" value=""
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
33 label="Sets a cutoff value for the multiple localization flag (e.g. 4.5)"
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
34 help="Leave blank or use zero for no cutoff." />
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
35 </inputs>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
36 <outputs>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
37 <data format="tabular" name="outfile" />
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
38 </outputs>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
39 <requirements>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
40 <requirement type="binary">psort</requirement>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
41 </requirements>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
42 <tests>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
43 <test>
11
3d74c1176d67 Uploaded minor fix
peterjc
parents: 8
diff changeset
44 <param name="sequence" value="empty.fasta" ftype="fasta"/>
3d74c1176d67 Uploaded minor fix
peterjc
parents: 8
diff changeset
45 <param name="long" value="terse"/>
3d74c1176d67 Uploaded minor fix
peterjc
parents: 8
diff changeset
46 <output name="outfile" file="empty_psortb_terse.tabular" ftype="tabular"/>
3d74c1176d67 Uploaded minor fix
peterjc
parents: 8
diff changeset
47 </test>
3d74c1176d67 Uploaded minor fix
peterjc
parents: 8
diff changeset
48 <test>
8
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
49 <param name="sequence" value="k12_ten_proteins.fasta" ftype="fasta"/>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
50 <param name="long" value="terse"/>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
51 <output name="outfile" file="k12_ten_proteins_psortb_p_terse.tabular" ftype="tabular"/>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
52 </test>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
53 </tests>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
54 <help>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
55
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
56 **What it does**
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
57
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
58 This calls the command line tool PSORTb v3.0 for prediction of prokaryotic
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
59 localization sites. The input dataset needs to be protein FASTA sequences.
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
60 The default output is a simple tabular file with three columns, one row
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
61 per query sequence:
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
62
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
63 ====== ==============================
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
64 Column Description
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
65 ------ ------------------------------
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
66 1 Sequence identifier
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
67 2 Localisation, e.g. Cytoplasmic
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
68 3 Score
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
69 ====== ==============================
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
70
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
71 The long output is also tabular with one row per query sequence, but has
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
72 lots more columns (a different set for each supported organism type). In
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
73 both cases, a simple header line is included (starting with a hash, #,
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
74 so that Galaxy treats it as a comment) giving the column names.
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
75
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
76
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
77 **References**
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
78
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
79 N.Y. Yu, J.R. Wagner, M.R. Laird, G. Melli, S. Rey, R. Lo, P. Dao,
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
80 S.C. Sahinalp, M. Ester, L.J. Foster, F.S.L. Brinkman (2010)
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
81 PSORTb 3.0: Improved protein subcellular localization prediction with
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
82 refined localization subcategories and predictive capabilities for all
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
83 prokaryotes, Bioinformatics 26(13):1608-1615
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
84 http://dx.doi.org/10.1093/bioinformatics/btq249
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
85
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
86 http://www.psort.org/documentation/index.html
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
87
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
88 </help>
391a142c1e60 Uploaded
peterjc
parents:
diff changeset
89 </tool>