Mercurial > repos > iracooke > xtandem
changeset 12:be958beb41d9 draft
Uploaded
author | iracooke |
---|---|
date | Sun, 08 Jun 2014 00:18:26 -0400 |
parents | b2f23c78d994 |
children | 2826f4b12b0b |
files | README README.md repository_dependencies.xml tandem.xml tool-data/pepxml_databases.loc.sample tool-data/tandem_mods.loc.sample |
diffstat | 6 files changed, 207 insertions(+), 0 deletions(-) [+] |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/README Sun Jun 08 00:18:26 2014 -0400 @@ -0,0 +1,5 @@ +This package installs a wrapper script for the X!Tandem search engine + +Requirements: +This package depends on the protk and the trans proteomic pipeline packages +Please see instructions for those packages before installing
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/README.md Sun Jun 08 00:18:26 2014 -0400 @@ -0,0 +1,6 @@ +## What is it? +Galaxy tool definition file and wrapper scripts for the [X!Tandem search engine](http://www.thegpm.org/tandem/index.html). + +## This tool requires that the protk rubygem and X!Tandem itself are installed. + +
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/repository_dependencies.xml Sun Jun 08 00:18:26 2014 -0400 @@ -0,0 +1,4 @@ +<?xml version="1.0"?> +<repositories description="Proteomics datatypes"> + <repository changeset_revision="a1b29f86bdbf" name="proteomics_datatypes" owner="iracooke" toolshed="https://testtoolshed.g2.bx.psu.edu" /> + </repositories>
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/tandem.xml Sun Jun 08 00:18:26 2014 -0400 @@ -0,0 +1,173 @@ +<tool id="proteomics_search_tandem_1" name="X!Tandem MSMS Search" version="1.0.2"> + +<!-- <requirements> + <requirement type="package" version="1.2.6">protk</requirement> + <requirement type="package" version="4.6.3">trans_proteomic_pipeline</requirement> + </requirements> + --> + <description>Run an X!Tandem Search</description> + + <command> + #if $database.source_select=="built_in": + tandem_search.rb -d $database.dbkey + #else + tandem_search.rb -d $database.fasta_file + #end if + + --var-mods=' + $variable_mods + #for $custom_variable_mod in $custom_variable_mods: + ,${custom_variable_mod.custom_mod} + #end for + ' + + --fix-mods=' + $fixed_mods + #for $custom_fix_mod in $custom_fix_mods: + ,${custom_fix_mod.custom_mod} + #end for + ' + + $input_file -o $output -r + + --enzyme=$enzyme + + --precursor-ion-tol-units=$precursor_tolu + + -v $missed_cleavages + + -f $fragment_ion_tol + + -p $precursor_ion_tol + + $allow_multi_isotope_search + + --keep-params-files + + $cleavage_semi + + </command> + + <inputs> + <conditional name="database"> + <param name="source_select" type="select" label="Database source"> + <option value="built_in">Built-In</option> + <option value="input_ref" selected="true">Your Upload File</option> + </param> + <when value="built_in"> + <param name="dbkey" type="select" format="text" > + <label>Database</label> + <options from_file="pepxml_databases.loc"> + <column name="name" index="0" /> + <column name="value" index="2" /> + </options> + </param> + </when> + <when value="input_ref"> + <param name="fasta_file" type="data" format="fasta" label="Uploaded FASTA file" /> + </when> + </conditional> + + <param name="input_file" type="data" format="mzml" multiple="false" label="MSMS File" help="An mzML file with MS/MS data"/> + + + <param name="variable_mods" format="text" type="select" multiple="true" label="Variable Modifications" help="Hold the appropriate key while + clicking to select multiple items"> + <options from_file="tandem_mods.loc"> + <column name="name" index="0" /> + <column name="value" index="2" /> + </options> + </param> + + <repeat name="custom_variable_mods" title="Custom Variable Modifications" help="You can specify a modification when present in a motif. For instance, 0.998@N!{P}[ST] is a deamidation modification on N only if it is present in an N[any but P][S or T] motif (N-glycosite)."> + <param name="custom_mod" type="text"> + </param> + </repeat> + + + <param name="fixed_mods" format="text" type="select" multiple="true" label="Fixed Modifications" help="Hold the appropriate key while + clicking to select multiple items"> + <options from_file="tandem_mods.loc"> + <column name="name" index="0" /> + <column name="value" index="2" /> + </options> + </param> + + <repeat name="custom_fix_mods" title="Custom Fixed Modifications" help="You can specify a modification when present in a motif. For instance, 0.998@N!{P}[ST] is a deamidation modification on N only if it is present in an N[any but P][S or T] motif (N-glycosite)."> + <param name="custom_mod" type="text"> + </param> + </repeat> + + + + <param name="missed_cleavages" type="select" format="text" help="Allow peptides to contain up to this many missed enzyme cleavage sites"> + <label>Missed Cleavages Allowed</label> + <option value="0">0</option> + <option value="1">1</option> + <option value="2">2</option> + </param> + + <param name="cleavage_semi" type="boolean" label="Allow semi-cleaved peptides" help="This can increase search time dramatically" truevalue="" falsevalue="--no-cleavage-semi" /> + + <param name="enzyme" type="select" format="text"> + <label>Enzyme</label> + <option value="[R]|{P}">argc - [R]|{P}</option> + <option value="[X]|[D]">aspn - [X]|[D]</option> + <option value="[FLMWY]|{P}">chymotrypsin - [FLMWY]|{P}</option> + <option value="[R]|[X]">clostripain - [R]|[X]</option> + <option value="[M]|{P}">cnbr - [M]|{P}</option> + <option value="[AGILV]|{P}">elastase - [AGILV]|{P}</option> + <option value="[D]|{P}">formicacid - [D]|{P}</option> + <option value="[DE]|{P}">gluc - [DE]|{P}</option> + <option value="[E]|{P}">gluc_bicarb - [E]|{P}</option> + <option value="[W]|[X]">iodosobenzoate - [W]|[X]</option> + <option value="[K]|{P}">lysc - [K]|{P}</option> + <option value="[K]|[X]">lysc-p - [K]|[X]</option> + <option value="[X]|[K]">lysn - [X]|[K]</option> + <option value="[X]|[AKRS]">lysn_promisc - [X]|[AKRS]</option> + <option value="[X]|[X]">nonspecific - [X]|[X]</option> + <option value="[FL]|[X]">pepsina - [FL]|[X]</option> + <option value="[P]|[X]">protein_endopeptidase - [P]|[X]</option> + <option value="[E]|[X]">staph_protease - [E]|[X]</option> + <option value="[FMWY]|{P},[KR]|{P},[X]|[D]">tca - [FMWY]|{P},[KR]|{P},[X]|[D]</option> + <option value="[KR]|{P}" selected="true">trypsin - [KR]|{P}</option> + <option value="[FKLMRWY]|{P}">trypsin/chymotrypsin - [FKLMRWY]|{P}</option> + <option value="[KR]|{P},[M]|{P}">trypsin/cnbr - [KR]|{P},[M]|{P}</option> + <option value="[DEKR]|{P}">trypsin_gluc - [DEKR]|{P}</option> + </param> + + + <param name="fragment_ion_tol" help="Fragment Ion Tolerance in Daltons" type="float" value="0.65" min="0" max="10000" label="Fragment ion tolerance"/> + + <param name="precursor_ion_tol" help="Precursor Ion Tolerance (Da or ppm)" type="float" value="100" min="0" max="10000" label="Precursor ion tolerance"/> + <param name="precursor_tolu" type="select" format="text"> + <label>Precursor Ion Tolerance Units</label> + <option value="ppm">ppm</option> + <option value="Da">Da</option> + </param> + + <param name="allow_multi_isotope_search" type="boolean" label="Allow multi-isotope search" help="This allows peptide candidates in windows around -1 Da and -2 Da from the acquired mass to be considered. Only applicable when the minus/plus window above is set to less than 0.5 Da. Good for accurate-mass instruments for which the reported precursor mass is not corrected to the monoisotopic mass." truevalue="" falsevalue="--strict-monoisotopic-mass"/> + + </inputs> + + + <outputs> + <data format="tandem" name="output" metadata_source="input_file" label="X!Tandem_vs_${database.dbkey if $database.has_key('dbkey') else $database.fasta_file.display_name}.${input_file.display_name}.${input_file.display_name}.tandem"/> + </outputs> + + + <help> + +**What it does** + +Runs an MS/MS database search using the X!Tandem search engine. Output is in the form of a pepXML file containing identified peptides along with their raw search scores. + +---- + +**References** + +Please see http://www.thegpm.org/GPM/references.html for details of references describing the X!Tandem search engine. + + </help> + +</tool>
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/tool-data/pepxml_databases.loc.sample Sun Jun 08 00:18:26 2014 -0400 @@ -0,0 +1,13 @@ +#This file lists the names of protein databases installed locally in protk. +# These are used by omssa and x!tandem as well as the "mascot to pepxml" tool +# In order to combine search results with Interprophet searches must be run against an identical database +# +# Entries should follow the be structured as follows +# Display_name omssa_tandem_dbname dbkey +# +# +Swissprot spall_ spall spall_ +Combined PlasmboDB (falciparum) and Swissprot Human plasmodb_pfalciparum_sphuman_ plasmodb_pfalciparum_sphuman plasmodb_pfalciparum_sphuman_ +Swissprot Human sphuman_ sphuman sphuman_ +Combined Swissprot/TRembl Human sptrhuman_ sptrhuman sptrhuman_ +Swissprot Mouse spmouse_ spmouse spmouse_
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/tool-data/tandem_mods.loc.sample Sun Jun 08 00:18:26 2014 -0400 @@ -0,0 +1,6 @@ +#This file lists the names of inbuilt chemical modifications accepted by X!Tandem +# +# +Carbamidomethyl C carbamidomethyl_c_ 57.021464@C carbamidomethyl_c_ +Glycocapture-N glycocapture_n_ 0.998@N!{P}[ST] glycocapture_n_ +Oxidation M oxidation_m_ 15.994915@M oxidation_m_ \ No newline at end of file