Mercurial > repos > peterjc > tmhmm_and_signalp
diff tools/protein_analysis/psortb.xml @ 8:391a142c1e60 draft
Uploaded
author | peterjc |
---|---|
date | Tue, 26 Mar 2013 14:27:44 -0400 |
parents | |
children | 3d74c1176d67 |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/tools/protein_analysis/psortb.xml Tue Mar 26 14:27:44 2013 -0400 @@ -0,0 +1,84 @@ +<tool id="Psortb" name="psortb" version="0.0.1"> + <description>Determines sub-cellular localisation of bacterial/archaeal protein sequences</description> + <!-- If job splitting is enabled, break up the query file into parts --> + <!-- Using 2000 chunks meaning 4 threads doing 500 each is ideal --> + <parallelism method="basic" split_inputs="fasta_file" split_mode="to_size" split_size="2000" merge_outputs="tabular_file"></parallelism> + <version_command interpreter="python">psortb.py --version</version_command> + <command interpreter="python">psortb.py "\$NSLOTS" "$type" "$long" "$cutoff" "$divergent" "$sequence" "$outfile"</command> + <stdio> + <!-- Anything other than zero is an error --> + <exit_code range="1:" /> + <exit_code range=":-1" /> + </stdio> + <inputs> + <param format="fasta" name="sequence" type="data" + label="Input sequences for which to predict localisation (protein FASTA format)" /> + <param name="type" type="select" + label="Organism type (N.B. all sequences in the above file must be of the same type)" > + <option value="-p">Gram positive bacteria</option> + <option value="-n">Gram negative bacteria</option> + <option value="-a">Archaea</option> + </param> + <param name="long" type="select" label="Output type"> + <option value="terse">Short (terse, tabular with 3 columns)</option> + <!-- The normal output is text, not tabular - worth offering? + <option value="normal">Normal</option> + --> + <option value="long">Long (verbose, tabular with about 30 columns, depending on organism type)</option> + </param> + <param name="cutoff" size="10" type="float" optional="true" value="" + label="Sets a cutoff value for reported results (e.g. 7.5)" + help="Leave blank or use zero for no cutoff." /> + <param name="divergent" size="10" type="float" optional="true" value="" + label="Sets a cutoff value for the multiple localization flag (e.g. 4.5)" + help="Leave blank or use zero for no cutoff." /> + </inputs> + <outputs> + <data format="tabular" name="outfile" /> + </outputs> + <requirements> + <requirement type="binary">psort</requirement> + </requirements> + <tests> + <test> + <param name="sequence" value="k12_ten_proteins.fasta" ftype="fasta"/> + <param name="long" value="terse"/> + <output name="outfile" file="k12_ten_proteins_psortb_p_terse.tabular" ftype="tabular"/> + </test> + </tests> + <help> + +**What it does** + +This calls the command line tool PSORTb v3.0 for prediction of prokaryotic +localization sites. The input dataset needs to be protein FASTA sequences. +The default output is a simple tabular file with three columns, one row +per query sequence: + +====== ============================== +Column Description +------ ------------------------------ + 1 Sequence identifier + 2 Localisation, e.g. Cytoplasmic + 3 Score +====== ============================== + +The long output is also tabular with one row per query sequence, but has +lots more columns (a different set for each supported organism type). In +both cases, a simple header line is included (starting with a hash, #, +so that Galaxy treats it as a comment) giving the column names. + + +**References** + +N.Y. Yu, J.R. Wagner, M.R. Laird, G. Melli, S. Rey, R. Lo, P. Dao, +S.C. Sahinalp, M. Ester, L.J. Foster, F.S.L. Brinkman (2010) +PSORTb 3.0: Improved protein subcellular localization prediction with +refined localization subcategories and predictive capabilities for all +prokaryotes, Bioinformatics 26(13):1608-1615 +http://dx.doi.org/10.1093/bioinformatics/btq249 + +http://www.psort.org/documentation/index.html + + </help> +</tool>