diff myrimatch.xml @ 2:4bb0872e2b5f draft

planemo upload for repository https://github.com/galaxyproteomics/tools-galaxyp/tools/bumbershoot/myrimatch commit 98f3323d4b92a4a3668788b3e1bad1a6529fd6df-dirty
author galaxyp
date Thu, 02 Jun 2016 18:32:04 -0400
parents cedaffdc5e40
children c5e2f015165d
line wrap: on
line diff
--- a/myrimatch.xml	Tue Sep 15 17:50:24 2015 -0400
+++ b/myrimatch.xml	Thu Jun 02 18:32:04 2016 -0400
@@ -24,13 +24,19 @@
         #for $static_mod in $StaticMods
           #set $static_mods_str = $static_mods_str + " " + str($static_mod.aa) + " " + str($static_mod.mass)
         #end for
-        #set $static_mods_str = $static_mods_str.lstrip()
+        #for $mod in str($common_fixed_modifications).split(",")
+          #set $static_mods_str = $static_mods_str + " " + $mod.replace("_", " ")
+        #end for
+        #set $static_mods_str = $static_mods_str.strip()
 
         #set $dynamic_mods_str = ""
         #for $dynamic_mod in $DynamicMods
             #set $dynamic_mods_str = $dynamic_mods_str + " " + str($dynamic_mod.motif) + " * " + str($dynamic_mod.mass)
         #end for
-        #set $dynamic_mods_str = $dynamic_mods_str.lstrip()
+        #for $mod in str($common_variable_modifications).split(",")
+          #set $dynamic_mods_str = $dynamic_mods_str + " " + $mod.replace("_", " ")
+        #end for
+        #set $dynamic_mods_str = $dynamic_mods_str.strip()
 
         ln -s '$input' '${input_name}' &&
         ln -s '$ProteinDatabase' '${db_name}' &&
@@ -71,7 +77,7 @@
 ]]>
     </command>
     <inputs>
-          <param name="input" type="data" format="mzml,mzxml,mgf,ms2,mz5" label="Input File"/>
+          <param name="input" type="data" format="mzml,mzxml,mgf,ms2,h5" label="Input Raw MS File(s)"/>
           <param argument="-OutputFormat" type="select" label="Output Type" help="The file format to use for results of the search.">
               <option value="pepXML">pepXML</option>
               <option value="mzid">mzIdentML</option>
@@ -83,6 +89,7 @@
                <option value="Trypsin">Trypsin (normal trypsin cut, disallows cutting when the site is before a proline)</option>
                <option value="Chymotrypsin">Chymotrypsin (allows cut after F,Y,W,L. Disallows cutting before proline)</option>
                <option value="TrypChymo">TrypChymo (combines "Trypsin/P" and "Chymotrypsin" cleavage rules)</option>
+               <option value="glutamyl endopeptidase">Glu-C</option>
                <option value="Lys-C">Lys-C</option>
                <option value="Lys-C/P">Lys-C/P (Lys-C, disallowing cutting before proline)</option>
                <option value="Asp-N">Asp-N</option>
@@ -95,14 +102,42 @@
               <option value="1" selected="true">Semi-specific (at least one terminus must match cleavage rules)</option>
               <option value="0">Non-specific (neither terminus is required to match cleavage rules)</option>
           </param>
-          <param argument="-MaxMissedCleavages" type="integer" value="2" label="Maximum Missed Cleavages" help="Candidate peptides with more than this number of uncleaved cleavage sites will be skipped." />
-          <repeat name="StaticMods" title="Static Modifications" help="Modifications that are always applied to an amino acid. (-StaticMods)">
+          <param argument="-MaxMissedCleavages" type="integer" min="0" value="2" label="Maximum Missed Cleavages" help="Candidate peptides with more than this number of uncleaved cleavage sites will be skipped." />
+
+        <param name="common_fixed_modifications" type="select" label="Common Static Modifications" multiple="true" help="Occurs in known places on peptide sequence. Hold the appropriate key while clicking to select multiple items">
+            <option value="C_57.021464" selected="true">Carbamidomethyl C</option>
+            <option value="(_144.102063">iTRAQ 4-plex N-term</option>
+            <option value="K_144.102063">iTRAQ 4-plex K</option>
+            <option value="(_225.155833">TMT 2-plex N-term</option>
+            <option value="K_225.155833">TMT 2-plex K</option>
+            <option value="(_229.162932">TMT 6-or-10-plex N-term</option>
+            <option value="K_229.162932">TMT 6-or-10-plex K</option>
+            <sanitizer invalid_char=""><valid initial="string.printable"><add value="("/><add value=")"/><add value=","/><add value="-"/><add value="_"/></valid><mapping initial="none"></mapping></sanitizer>
+        </param>
+        <param name="common_variable_modifications" type="select" label="Common Dynamic Modifications" multiple="true" help="Can occur anywhere on the peptide sequence; adds additional error to search score. Hold the appropriate key while clicking to select multiple items">
+            <option value="K_*_42.010565">Acetylation K</option>
+            <option value="(_*_42.010565">Acetylation Protein N-term</option>
+            <option value="C_*_57.021464">Carbamidomethyl C</option>
+            <option value="(_*_57.021464">Carbamidomethyl N-term</option>
+            <option value="N_*_0.984016">Deamidation N</option>
+            <option value="Q_*_0.984016">Deamidation Q</option>
+            <option value="K_*_14.015650">Methylation K</option>
+            <option value="M_*_15.994915" selected="true">Oxidation M</option>
+            <option value="S_*_97.976896">Phosphorylation S</option>
+            <option value="T_*_97.976896">Phosphorylation T</option>
+            <option value="Y_*_97.976896">Phosphorylation Y</option>
+            <option value="(E_*_-18.010565">Pyro-glu from E</option>
+            <option value="(Q_*_-17.026549">Pyro-glu from Q</option>
+            <sanitizer invalid_char=""><valid initial="string.printable"><add value="("/><add value=")"/><add value=","/><add value="_"/><add value="*"/><add value="-"/></valid><mapping initial="none"></mapping></sanitizer>
+        </param>
+
+          <repeat name="StaticMods" title="Custom Static Modifications" help="Modifications that are always applied to an amino acid. (-StaticMods)">
               <param name="aa" type="text" label="Amino Acid">
                   <sanitizer><valid initial="string.ascii_uppercase"><remove value="B"/><remove value="J"/><remove value="O"/><remove value="Z"/></valid></sanitizer>
               </param>
               <param name="mass" type="float" label="Mass" value="0" />
           </repeat>
-          <repeat name="DynamicMods" title="Dynamic Modifications" help="Modifications that can either be present or absent on an amino acid. (-DynamicMods)">
+          <repeat name="DynamicMods" title="Custom Dynamic Modifications" help="Modifications that can either be present or absent on an amino acid. (-DynamicMods)">
               <param name="motif" type="text" label="Amino Acid Motif">
                   <sanitizer>
                       <valid initial="string.ascii_uppercase">
@@ -117,7 +152,8 @@
               </param>
               <param name="mass" type="float" label="Mass" value="0" />
           </repeat>
-          <param argument="-MaxDynamicMods" type="integer" value="4" label="Maximum Dynamic Mods" help="Candidate peptides with more than this number of dynamic modifications will be skipped." />
+
+          <param argument="-MaxDynamicMods" type="integer" min="0" value="4" label="Maximum Dynamic Mods" help="Candidate peptides with more than this number of dynamic modifications will be skipped." />
           <section name="tolerance_options" title="M/Z Tolerance Options" expanded="True">
               <conditional name="precursor_tolerance">
                   <param argument="-PrecursorMzToleranceRule" type="select" label="Precursor Mass Type" help="For data from Thermo instruments, using the 'auto' setting on a will automatically choose monoisotopic or average mass values, for other instruments monoisotopic or average should be chosen.">
@@ -126,40 +162,40 @@
                       <option value="mono">Monoisotopic</option>
                   </param>
                   <when value="auto">
-                      <param argument="-MonoPrecursorMzTolerance" type="float" value="10" label="Monoisotopic Precursor m/z Tolerance" help="This tolerance will be used for spectra that are determined to have monoisotopic precursors. MonoisotopeAdjustmentSet is applied to these." />
+                      <param argument="-MonoPrecursorMzTolerance" type="float" min="0.000001" value="10" label="Monoisotopic Precursor m/z Tolerance" help="This tolerance will be used for spectra that are determined to have monoisotopic precursors. MonoisotopeAdjustmentSet is applied to these." />
                       <param name="mono_precursor_mz_tolerance_units" type="select" label="Monoisotopic Precursor m/z Tolerance Units">
                           <option value="ppm">Parts per million</option>
                           <option value="daltons">Daltons</option>
                       </param>
-                      <param argument="-AvgPrecursorMzTolerance" type="float" value="1.25" label="Average Precursor m/z Tolerance" help="This tolerance will be used for spectra that are determined to have average mass precursors. MonoisotopeAdjustmentSet is not applied to these." />
+                      <param argument="-AvgPrecursorMzTolerance" type="float" min="0.000001" value="1.25" label="Average Precursor m/z Tolerance" help="This tolerance will be used for spectra that are determined to have average mass precursors. MonoisotopeAdjustmentSet is not applied to these." />
                       <param name="avg_precursor_mz_tolerance_units" type="select" label="Average Precursor m/z Tolerance Units">
                           <option value="ppm">Parts per million</option>
                           <option value="daltons" selected="true">Daltons</option>
                       </param>
                   </when>
                   <when value="avg">
-                      <param argument="-AvgPrecursorMzTolerance" type="float" value="1.25" label="Average Precursor m/z Tolerance" help="This tolerance will be used for all spectra, but MonoisotopeAdjustmentSet will never be applied." />
+                      <param argument="-AvgPrecursorMzTolerance" type="float" min="0.000001" value="1.25" label="Average Precursor m/z Tolerance" help="This tolerance will be used for all spectra, but MonoisotopeAdjustmentSet will never be applied." />
                       <param name="avg_precursor_mz_tolerance_units" type="select" label="Average Precursor m/z Tolerance Units">
                           <option value="ppm">Parts per million</option>
                           <option value="daltons" selected="true">Daltons</option>
                       </param>
                   </when>
                   <when value="mono">
-                      <param argument="-MonoPrecursorMzTolerance" type="float" value="10" label="Monoisotopic Precursor m/z Tolerance" help="This tolerance will be used for all spectra, and MonoisotopeAdjustmentSet is likewise applied to all spectra." />
+                      <param argument="-MonoPrecursorMzTolerance" type="float" min="0.000001" value="10" label="Monoisotopic Precursor m/z Tolerance" help="This tolerance will be used for all spectra, and MonoisotopeAdjustmentSet is likewise applied to all spectra." />
                       <param name="mono_precursor_mz_tolerance_units" type="select" label="Monoisotopic Precursor m/z Tolerance Units">
                           <option value="ppm">Parts per million</option>
                           <option value="daltons">Daltons</option>
                       </param>
                   </when>
               </conditional>
-              <param argument="-FragmentMzTolerance" type="float" value="0.5" label="Fragment m/z Tolerance" help="This tolerance is used for matching to fragment ions." />
+              <param argument="-FragmentMzTolerance" type="float" min="0.000001" value="0.5" label="Fragment m/z Tolerance" help="This tolerance is used for matching to fragment ions." />
               <param name="fragment_mz_tolerance_units" type="select" label="Fragment m/z Tolerance Units">
                   <option value="ppm">Parts per million</option>
                   <option value="daltons" selected="true">Daltons</option>
               </param>
           </section>
           <section name="advanced" title="Advanced Options" expanded="False">
-              <param argument="-MaxPeakCount" type="integer" value="" optional="true" label="Use Max Peaks" help="Filter out all but the specified number of peaks, keep empty to use all peaks." />
+              <param argument="-MaxPeakCount" type="integer" min="10" value="" optional="true" label="Use Max Peaks" help="Filter out all but the specified number of peaks, keep empty to use all peaks." />
               <conditional name="fragmentation_rule">
                   <param argument="-FragmentationAutoRule" type="boolean" label="Override Fragmentation Rule (Ion Series)" help="If the input file provides mass analyzer information (mzML, mzXML, mz5), MyriMatch can automatically choose the ion series to search on a scan-by-scan basis." />
                   <when value="false" />
@@ -167,11 +203,11 @@
                       <param argument="-FragmentationRule" type="text" label="Fragmentation Rule" help="Specify as a comma-separated list of a, b, c, x, y, z, or z* (z+1), e.g. 'b,y,z'" />
                   </when>
               </conditional>
-              <param argument="-MinPeptideLength" type="integer" value="5" label="Minimum Peptide Length" help="Candidate peptides shorter than this will not be compared against any spectrum." />
-              <param argument="-MaxPeptideLength" type="integer" value="75" label="Maximum Peptide Length" help="Candidate peptides longer than this will not be compared against any spectrum." />
+              <param argument="-MinPeptideLength" type="integer" min="3" value="5" label="Minimum Peptide Length" help="Candidate peptides shorter than this will not be compared against any spectrum." />
+              <param argument="-MaxPeptideLength" type="integer" min="3" value="75" label="Maximum Peptide Length" help="Candidate peptides longer than this will not be compared against any spectrum." />
               <param argument="-UseSmartPlusThreeModel" type="boolean" truevalue="true" falsevalue="false" label="Use Smart Plus 3 Model" help="For +3 and higher precursors, the fragment ions predicted depend on the way this parameter is set. When this parameter is true, then for each peptide bond, an internal calculation is done to estimate the basicity of the b and y fragment sequence. When this parameter is false, however, ALL possible charge distributions for the fragment ions are generated for every peptide bond." checked="true" />
-              <param argument="-NumChargeStates" type="integer" value="3" label="Number of Charge States" help="For spectra with an ambiguous multiple charge state, it will be treated as any charge in the range: [+2,NumChargeStates]." />
-              <param argument="-MaxResultRank" type="integer" value="2" label="Maximum Result Rank" help="The maximum rank of a search result (results with the same score occupy the same rank)." />
+              <param argument="-NumChargeStates" type="integer" min="1" value="3" label="Number of Charge States" help="For spectra with an ambiguous multiple charge state, it will be treated as any charge in the range: [+2,NumChargeStates]." />
+              <param argument="-MaxResultRank" type="integer" min="1" value="2" label="Maximum Result Rank" help="The maximum rank of a search result (results with the same score occupy the same rank)." />
               <param argument="-MonoisotopeAdjustmentSet" type="text" value="[-1,2]" label="Monoisotope Adjustment Set" help="For monoisotopic precursors where the monoisotope may have been incorrectly assigned to a nearby isotope, this range of adjustments will be considered. Instead of trying a wide precursor tolerance for a spectrum, this tries multiple tight tolerances.">
                   <sanitizer invalid_char=""><valid initial="string.digits"><add value="["/><add value="]"/><add value=","/><add value="-"/></valid><mapping initial="none"></mapping></sanitizer>
               </param>
@@ -189,6 +225,8 @@
             <param name="input" value="input/201208-378803.mzML" />
             <param name="ProteinDatabase" value="input/cow.protein.PRG2012-subset.fasta" />
             <param name="DecoyPrefix" value="XXX_" />
+            <param name="common_fixed_modifications" value="" />
+            <param name="common_variable_modifications" value="" />
             <param name="StaticMods_0|aa" value="C" />
             <param name="StaticMods_0|mass" value="58.00548" />
             <param name="DynamicMods_0|motif" value="M" />
@@ -211,8 +249,33 @@
         <test>
             <param name="input" value="input/201208-378803.mzML" />
             <param name="ProteinDatabase" value="input/cow.protein.PRG2012-subset.fasta" />
+            <param name="DecoyPrefix" value="XXX_" />
+            <param name="StaticMods_0|aa" value="C" />
+            <param name="StaticMods_0|mass" value="58.00548" />
+            <param name="DynamicMods_0|motif" value="M" />
+            <param name="DynamicMods_0|mass" value="15.9949" />
+            <param name="DynamicMods_1|motif" value="(Q" />
+            <param name="DynamicMods_1|mass" value="-17.026" />
+            <param name="common_fixed_modifications" value="" />
+            <param name="common_variable_modifications" value="Q_*_0.984016,N_*_0.984016" />
+            <param name="PrecursorMzToleranceRule" value="mono" />
+            <param name="MonoPrecursorMzTolerance" value="50" />
+            <param name="MinTerminiCleavages" value="1" />
+            <param name="MaxMissedCleavages" value="2" />
+            <param name="MaxDynamicMods" value="2" />
+            <param name="NumChargeStates" value="5" />
+            <param name="MaxResultRank" value="3" />
+            <param name="MonoisotopeAdjustmentSet" value="[-1,2]" />
+            <param name="UseSmartPlusThreeModel" value="false" />
+            <output name="output" file="201208-378803-mm.pepXML" lines_diff="14" />
+        </test>
+        <test>
+            <param name="input" value="input/201208-378803.mzML" />
+            <param name="ProteinDatabase" value="input/cow.protein.PRG2012-subset.fasta" />
             <param name="CleavageRules" value="Trypsin" />
             <param name="DecoyPrefix" value="XXX_" />
+            <param name="common_fixed_modifications" value="" />
+            <param name="common_variable_modifications" value="" />
             <param name="PrecursorMzToleranceRule" value="mono" />
             <param name="MonoPrecursorMzTolerance" value="15" />
             <param name="MinTerminiCleavages" value="2" />