# HG changeset patch # User simonalpha # Date 1420496252 18000 # Node ID 9ee2e20c6f1abc11d34df78873362a75deb93831 # Parent 79ed4588f7ae432dab6a9b0173d769bf10b42136 Uploaded diff -r 79ed4588f7ae -r 9ee2e20c6f1a README --- a/README Tue Mar 18 19:46:10 2014 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,7 +0,0 @@ -This package is a galaxy wrapper for the MSGF+ search tool. - -Requirements: -This package depends on the galaxy_protk, protk_msgfplus, protk_proteowizard packages -Please see instructions for those packages before installing - -In addition to basic requirements you must also have unzip and java 6 runtime (or greater) installed diff -r 79ed4588f7ae -r 9ee2e20c6f1a README.md --- a/README.md Tue Mar 18 19:46:10 2014 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,8 +0,0 @@ -## What is it? -Galaxy tool definition file and wrapper scripts for the [MSGF+ Search Engine](http://proteomics.ucsd.edu/Software/MSGFPlus.html). - -## Installation -Install from the main galaxy toolshed at http://toolshed.g2.bx.psu.edu/ - -Depends on command-line scripts and databases available in the [protk ruby gem](https://bitbucket.org/iracooke/protk). - diff -r 79ed4588f7ae -r 9ee2e20c6f1a msgfplus_search.xml --- a/msgfplus_search.xml Tue Mar 18 19:46:10 2014 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,188 +0,0 @@ - - Run an MSGF+ Search - - protk - msgfplus - proteowizard - - - msgfplus_search.rb - #if $database.source_select=="built_in": - --galaxy -d $database.dbkey - #else - --galaxy -d $database.fasta_file - #end if - - --var-mods=' - $variable_mods - #for $custom_variable_mod in $custom_variable_mods: - ,${custom_variable_mod.custom_mod} - #end for - ' - - --fix-mods=' - $fixed_mods - #for $custom_fix_mod in $custom_fix_mods: - ,${custom_fix_mod.custom_mod} - #end for - ' - - $input_file - -o $output - -r - --enzyme=$enzyme - --precursor-ion-tol-units=$precursor_tolu - -v $missed_cleavages - $cleavage_semi - -f $fragment_ion_tol - -p $precursor_ion_tol - --instrument=$instrument - --isotope-error-range=$isotope_error_range - --fragment-method=$fragment_method - --protocol=$protocol - --min-pep-len=$min_pep_len - --max-pep-len=$max_pep_len - --max-pep-charge=$max_pep_charge - --min-pep-charge=$min_pep_charge - --num-reported-matches=$num_reported_matches - --java-mem=$java_mem - #unless $pepxml_output_use: - --no-pepxml - #end unless - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -**What it does** - -Runs an MS/MS database search using the MSGFPlus search engine. Output is in the form of a pepXML file containing identified peptides along with their raw search scores. - ----- - -**References** - -Please see http://proteomics.ucsd.edu/Software/MSGFPlus.html for details of the MSGFPlus search engine and references describing its algorithm - - - diff -r 79ed4588f7ae -r 9ee2e20c6f1a repository_dependencies.xml --- a/repository_dependencies.xml Tue Mar 18 19:46:10 2014 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,4 +0,0 @@ - - - - diff -r 79ed4588f7ae -r 9ee2e20c6f1a test-data/bsa.fasta --- a/test-data/bsa.fasta Tue Mar 18 19:46:10 2014 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,26 +0,0 @@ ->sp|ALBU_BOVIN| -MKWVTFISLLLLFSSAYSRGVFRRDTHKSEIAHRFKDLGEEHFKGLVLIA -FSQYLQQCPFDEHVKLVNELTEFAKTCVADESHAGCEKSLHTLFGDELCK -VASLRETYGDMADCCEKQEPERNECFLSHKDDSPDLPKLKPDPNTLCDEF -KADEKKFWGKYLYEIARRHPYFYAPELLYYANKYNGVFQECCQAEDKGAC -LLPKIETMREKVLASSARQRLRCASIQKFGERALKAWSVARLSQKFPKAE -FVEVTKLVTDLTKVHKECCHGDLLECADDRADLAKYICDNQDTISSKLKE -CCDKPLLEKSHCIAEVEKDAIPENLPPLTADFAEDKDVCKNYQEAKDAFL -GSFLYEYSRRHPEYAVSVLLRLAKEYEATLEECCAKDDPHACYSTVFDKL -KHLVDEPQNLIKQNCDQFEKLGEYGFQNALIVRYTRKVPQVSTPTLVEVS -RSLGKVGTRCCTKPESERMPCTEDYLSLILNRLCVLHEKTPVSEKVTKCC -TESLVNRRPCFSALTPDETYVPKAFDEKLFTFHADICTLPDTEKQIKKQT -ALVELLKHKPKATEEQLKTVMENFVAFVDKCCAADDKEACFAVEGPKLVV -STQTALA ->sp|AMYS_HUMAN| -MKLFWLLFTIGFCWAQYSSNTQQGRTSIVHLFEWRWVDIALECERYLAPK -GFGGVQVSPPNENVAIHNPFRPWWERYQPVSYKLCTRSGNEDEFRNMVTR -CNNVGVRIYVDAVINHMCGNAVSAGTSSTCGSYFNPGSRDFPAVPYSGWD -FNDGKCKTGSGDIENYNDATQVRDCRLSGLLDLALGKDYVRSKIAEYMNH -LIDIGVAGFRIDASKHMWPGDIKAILDKLHNLNSNWFPEGSKPFIYQEVI -DLGGEPIKSSDYFGNGRVTEFKYGAKLGTVIRKWNGEKMSYLKNWGEGWG -FMPSDRALVFVDNHDNQRGHGAGGASILTFWDARLYKMAVGFMLAHPYGF -TRVMSSYRWPRYFENGKDVNDWVGPPNDNGVTKEVTINPDTTCGNDWVCE -HRWRQIRNMVNFRNVVDGQPFTNWYDNGSNQVAFGRGNRGFIVFNNDDWT -FSLTLQTGLPAGTYCDVISGDKINGNCTGIKIYVSDDGKAHFSISNSAED -PFIAIHAESKL \ No newline at end of file diff -r 79ed4588f7ae -r 9ee2e20c6f1a test-data/bsa.mzML --- a/test-data/bsa.mzML Tue Mar 18 19:46:10 2014 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,96 +0,0 @@ - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - RPrt68CEaUDI7236swRrQLecS3FVwmxAdcjNcANFbUBlwi/182NuQL/xtWeWAm9AGm7A54clb0BNSkG3FyJxQJOMnIU9QXFAFCLgEKpScUCe6pCb4fJyQNbiUwAME3RA529CIQJSdUDmllZDYmJ2QFch5SfVQXdAOiNKe4NRd0A2WaMeolJ4QGwE4nX9YXhAG7tE9VZyeUAaNPRPcNN6QDyInSl0JHtAEqCmli1Te0CuDRXj/JJ7QBsS91h6gnxAet/42jOzfEC94xQdyZJ9QEbT2clgMn5Ah78ma9RCf0CAYI4ev1J/QPCiryCNKoBAqiuf5XkxgEDtuyL4H3qAQDI4Sl7dgYBAEVMiiZ66gEBi+IiY0tGAQDMbZJKR2YBAjL6CNCMKgUA0ETY8vUGBQEymCkYlUoFAzzEge71hgUB8D5cc97WBQKYnLPHAuYFArDlAMEfigUBWSPlJ9fGBQP2H9NsX/oFApMLYQlApgkBmFMstLUKCQG2tLxLaWYJAMPDce3ixgkAYsrrVc7mCQHAlOzbCOYNAPrMkQI1Bg0Ang6PkFWqDQOrPfqRIgoNAdZMYBBaKg0BaL4ZyIrqDQGIQWDm0woNANUHUfcDJg0AMAiuHVgqEQCzUmubdUoRAL6NYbilqhEDXwFYJlpqEQGjon+CiooRA9Pi9TT/ShEBrZcIvNdqEQBqjdVR16oRAs5jYfBzyhEBx5ldzwFGFQIz4Tsx6eoVAhPBo4wiKhUCCHJQwE5KFQCUGgZUD0oVAy9b6IuHZhUBeukkMAmKGQM11Gmkp8oZA1xcJbTnDh0AWwf9WMsuHQJhRLLd0SohAldQJaGJTiEAUyy2thoKIQNuizAbZColAjZyFPa0SiUDLSpNSkGKJQCveyDzymolAS80eaMXqiUB47j1csvKJQONTAIzneopAejarPlfTikAMPPcerlOLQDdPdciNW4tA1EM0usPji0CY3ZOHBauMQD90QX3L845A/+xHigh8j0D7OnDOKPaRQAUXK2oQ+pFAbqMBvCU+kkA= - - - - - - AABIQgAAUEIAAMpCAABkQwAA8EEAACBCAEAHRQAAgEIAACRDAICRQwAAhEIAAE9EAADwQQAAjkIAAAhCAAAEQgAAMEIAAChDAACmQgAA4EEAAJBDAADGQgAA1EIAAHhCAAAEQwAAHEMAAKpCAAAcQgAAgUMAALRCAIDuQwAADEIAAJxCAMCERAAAOEIAADlDAAAAQgAA3kIAAPxCAICfQwAASUMAAAtDAADoQQAA00MAgMNDAADoQQAA+UMAAOBBAABUQgAAH0MAAExCAICFQwAA+EEAABxCAACMQgAAIEIAAKhCAIDVQwAAKEMAAFpEAAAIQgAABEIAAOBBAAAMQgAA4EEAAIpCAAA1QwAA+EIAAFBCAADoQQAAEEIAACRCAIC8QwAAFUQAAKRDAAAkQgAAgUMAAAhCAIDFQwAA9kIAAOhBAADEQgAAFEMAAAxCAADUQgAAO0MAAApDAADgQQAA8EEAAANDAEAmRAAACEIAAL5CAAASRAAAAEIAABFDAEBQRA== - - - - - - - - - 2685 - - - 7058 - b76171188a63cfad075d3738a172b15f1f9e0c4c - diff -r 79ed4588f7ae -r 9ee2e20c6f1a test-data/bsa.mzid --- a/test-data/bsa.mzid Tue Mar 18 19:46:10 2014 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,123 +0,0 @@ - - - - - - - - - - - - - - - - - - - - YICDNQDTISSK - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - diff -r 79ed4588f7ae -r 9ee2e20c6f1a tool-data/msgfplus_mods.loc.sample --- a/tool-data/msgfplus_mods.loc.sample Tue Mar 18 19:46:10 2014 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,50 +0,0 @@ -#This file lists the names of inbuilt chemical modifications accepted by msgfplus -#Each entry consists of 4 tab separated fields like this -# -# -#Modification strings should conform to the standard MSGFPlus syntax with the following exception -#The ModType field is overridden by the msgfplus_search.rb tool. In other words any of these mods -#May be passed to the tool as a variable or fixed mod and the tool will substitute the appropriate ModType -#value -# -#Standard MSGFPlus syntax is -# -# To input a modification, use the following command: -# Mass or CompositionStr, Residues, ModType, Position, Name (all the five fields are required). -# CompositionStr (C[Num]H[Num]N[Num]O[Num]S[Num]P[Num]) -# - C (Carbon), H (Hydrogen), N (Nitrogen), O (Oxygen), S (Sulfer) and P (Phosphorus) are allowed. -# - Atom can be omitted. The sequence of atoms must be followed. -# - Negative numbers are allowed. -# - E.g. C2H2O1 (valid), H2C1O1 (invalid) -# Mass can be used instead of CompositionStr. It is important to specify accurate masses (integer masses are insufficient). -# - E.g. 15.994915 -# Residues: affected amino acids (must be upper letters) -# - Must be uppor letters or * -# - Use * if this modification is applicable to any residue. -# - * should not be "anywhere" modification (e.g. "15.994915, *, opt, any, Oxidation" is not allowed.) -# - E.g. NQ, * -# ModType: "fix" for fixed modifications, "opt" for variable modifications (case insensitive) -# Position: position in the peptide where the modification can be attached. -# - One of the following five values should be used: -# - any (anywhere), N-term (peptide N-term), C-term (peptide C-term), Prot-N-term (protein N-term), Prot-C-term (protein C-term) -# - Case insensitive -# - "-" can be omitted -# - E.g. any, Any, Prot-n-Term, ProtNTerm => all valid -# Name: name of the modification (Unimod PSI-MS name) -# - For proper mzIdentML output, this name should be the same as the Unimod PSI-MS name -# - E.g. Phospho, Acetyl -#C2H3N1O1,C,fix,any,Carbamidomethyl # Fixed Carbamidomethyl C -# Variable Modifications (default: none) -#O1,M,opt,any,Oxidation # Oxidation M -#15.994915,M,opt,any,Oxidation # Oxidation M (mass is used instead of CompositionStr) -#H-1N-1O1,NQ,opt,any,Deamidated # Negative numbers are allowed. -#C2H3NO,*,opt,N-term,Carbamidomethyl # Variable Carbamidomethyl N-term -#H-2O-1,E,opt,N-term,Pyro_glu # Pyro-glu from E -#H-3N-1,Q,opt,N-term,Pyro-glu # Pyro-glu from Q -#C2H2O,*,opt,Prot-N-term,Acetyl # Acetylation Protein N-term -#C2H2O1,K,opt,any,Acetyl # Acetylation K -#CH2,K,opt,any,Methy # Methylation K -#HO3P,STY,opt,any,Phospho # Phosphorylation STY - -Carbamidomethyl C carbamidomethyl_c_ C2H3N1O1,C,opt,any,Carbamidomethyl carbamidomethyl_c_ -Oxidation M oxidation_m_ O1,M,opt,any,Oxidation oxidation_m_ \ No newline at end of file diff -r 79ed4588f7ae -r 9ee2e20c6f1a tool-data/pepxml_databases.loc.sample --- a/tool-data/pepxml_databases.loc.sample Tue Mar 18 19:46:10 2014 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,13 +0,0 @@ -#This file lists the names of protein databases installed locally in protk. -# These are used by omssa and x!tandem as well as the "mascot to pepxml" tool -# In order to combine search results with Interprophet searches must be run against an identical database -# -# Entries should follow the be structured as follows -# Display_name omssa_tandem_dbname dbkey -# -# -Swissprot spall_ spall spall_ -Combined PlasmboDB (falciparum) and Swissprot Human plasmodb_pfalciparum_sphuman_ plasmodb_pfalciparum_sphuman plasmodb_pfalciparum_sphuman_ -Swissprot Human sphuman_ sphuman sphuman_ -Combined Swissprot/TRembl Human sptrhuman_ sptrhuman sptrhuman_ -Swissprot Mouse spmouse_ spmouse spmouse_ diff -r 79ed4588f7ae -r 9ee2e20c6f1a tool_dependencies.xml --- a/tool_dependencies.xml Tue Mar 18 19:46:10 2014 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,12 +0,0 @@ - - - - - - - - - - - -