comparison ident_params.xml @ 1:fa76abf69433 draft

planemo upload for repository https://github.com/galaxyproteomics/tools-galaxyp/tree/master/tools/peptideshaker commit e09348a0c372d4355c5dda6519e52ff17e0e8621-dirty
author jjohnson
date Fri, 08 Jun 2018 15:58:53 -0400
parents 8b99cb00e1c4
children
comparison
equal deleted inserted replaced
0:8b99cb00e1c4 1:fa76abf69433
6 <import>macros_basic.xml</import> 6 <import>macros_basic.xml</import>
7 </macros> 7 </macros>
8 <requirements> 8 <requirements>
9 <requirement type="package" version="@SEARCHGUI_VERSION@">searchgui</requirement> 9 <requirement type="package" version="@SEARCHGUI_VERSION@">searchgui</requirement>
10 <requirement type="package" version="3.0">zip</requirement> 10 <requirement type="package" version="3.0">zip</requirement>
11 <requirement type="package">JQ</requirement>
11 </requirements> 12 </requirements>
12 <expand macro="stdio" /> 13 <expand macro="stdio" />
13 <command> 14 <command>
14 <![CDATA[ 15 <![CDATA[
15 #set $temp_stderr = "searchgui_stderr" 16 #set $temp_stderr = "searchgui_stderr"
17 18
18 mkdir output; 19 mkdir output;
19 cwd=`pwd`; 20 cwd=`pwd`;
20 export HOME=\$cwd; 21 export HOME=\$cwd;
21 22
22 echo "DB: ${input_database.display_name} sequences: ${input_database.metadata.sequences}"; 23 echo 'DB: ${input_database.display_name} sequences: ${input_database.metadata.sequences}';
24
25 ## copy the input FASTA file to the working folder
26 cp '${input_database}' './input_database.fasta';
27
23 28
24 ##################################################### 29 #####################################################
25 ## generate IdentificationParameters for SearchGUI ## 30 ## generate IdentificationParameters for SearchGUI ##
26 ##################################################### 31 #####################################################
27 (searchgui eu.isas.searchgui.cmd.IdentificationParametersCLI 32 (searchgui eu.isas.searchgui.cmd.IdentificationParametersCLI
28 --exec_dir="\$cwd/${bin_dir}" 33 --exec_dir="./bin/"
29 -out "\$cwd/SEARCHGUI_IdentificationParameters.par" 34 -out './SEARCHGUI_IdentificationParameters_temp.par'
30 35
31 ## SPECTRUM MATCHING PARAMETERS 36 ## SPECTRUM MATCHING PARAMETERS
32 37
33 -db "${input_database}" 38 -db './input_database.fasta'
34 39
35 -frag_tol '${spectrum_matching_options.fragment_tol}' 40 -frag_tol '${spectrum_matching_options.fragment_tol}'
36 -frag_ppm '${spectrum_matching_options.fragment_tol_units}' 41 -frag_ppm '${spectrum_matching_options.fragment_tol_units}'
37 -prec_tol '${spectrum_matching_options.precursor_ion_tol}' 42 -prec_tol '${spectrum_matching_options.precursor_ion_tol}'
38 -prec_ppm '${spectrum_matching_options.precursor_ion_tol_units}' 43 -prec_ppm '${spectrum_matching_options.precursor_ion_tol_units}'
100 ## end if 105 ## end if
101 106
102 107
103 ## PTM LOCALIZATION 108 ## PTM LOCALIZATION
104 109
105 -ptm_score "${advanced_options.ptm_localization_options.ptm_score.ptm_score_selector}" 110 -ptm_score '${advanced_options.ptm_localization_options.ptm_score.ptm_score_selector}'
106 #if $advanced_options.ptm_localization_options.ptm_score.ptm_score_selector == 1 111 #if $advanced_options.ptm_localization_options.ptm_score.ptm_score_selector == 1
107 -score_neutral_losses "${advanced_options.ptm_localization_options.ptm_score.neutral_losses}" 112 -score_neutral_losses '${advanced_options.ptm_localization_options.ptm_score.neutral_losses}'
108 #if str($advanced_options.ptm_localization_options.ptm_score.ptm_threshold) != '' 113 #if str($advanced_options.ptm_localization_options.ptm_score.ptm_threshold) != ''
109 -ptm_threshold "${advanced_options.ptm_localization_options.ptm_score.ptm_threshold}" 114 -ptm_threshold '${advanced_options.ptm_localization_options.ptm_score.ptm_threshold}'
110 #end if 115 #end if
111 #end if 116 #end if
112 -ptm_alignment "${advanced_options.ptm_localization_options.ptm_alignment}" 117 -ptm_alignment '${advanced_options.ptm_localization_options.ptm_alignment}'
113 -ptm_sequence_matching_type "${advanced_options.ptm_localization_options.ptm_sequence_matching_type}" 118 -ptm_sequence_matching_type '${advanced_options.ptm_localization_options.ptm_sequence_matching_type}'
114 119
115 120
116 ## GENE ANNOTATION 121 ## GENE ANNOTATION
117 122
118 $advanced_options.gene_annotation_options.use_gene_mapping 123 $advanced_options.gene_annotation_options.use_gene_mapping
126 ## TODO: PROTEIN INFERENCE 131 ## TODO: PROTEIN INFERENCE
127 132
128 133
129 ## TODO: VALIDATION LEVELS 134 ## TODO: VALIDATION LEVELS
130 135
131 -protein_fdr "${advanced_options.validation_levels_options.protein_fdr}" 136 -protein_fdr '${advanced_options.validation_levels_options.protein_fdr}'
132 -peptide_fdr "${advanced_options.validation_levels_options.peptide_fdr}" 137 -peptide_fdr '${advanced_options.validation_levels_options.peptide_fdr}'
133 -psm_fdr "${advanced_options.validation_levels_options.psm_fdr}" 138 -psm_fdr '${advanced_options.validation_levels_options.psm_fdr}'
134 139
135 140
136 ## FRACTION ANALYSIS 141 ## FRACTION ANALYSIS
137 142
138 -protein_fraction_mw_confidence "${advanced_options.fraction_analysis_options.protein_fraction_mw_confidence}" 143 -protein_fraction_mw_confidence '${advanced_options.fraction_analysis_options.protein_fraction_mw_confidence}'
139 144
140 145
141 ## -- SEARCH ENGINES SPECIFIC PARAMETERS -- 146 ## -- SEARCH ENGINES SPECIFIC PARAMETERS --
142 147
143 148
220 225
221 ## MSGF+ ADVANCED PARAMETERS 226 ## MSGF+ ADVANCED PARAMETERS
222 227
223 #if $advanced_options.searchengines_advanced_options.msgf.msgf_advanced == "yes" 228 #if $advanced_options.searchengines_advanced_options.msgf.msgf_advanced == "yes"
224 -msgf_decoy ${advanced_options.searchengines_advanced_options.msgf.msgf_decoy} 229 -msgf_decoy ${advanced_options.searchengines_advanced_options.msgf.msgf_decoy}
225 -msgf_min_pep_length ${advanced_options.searchengines_advanced_options.msgf.msgf_min_pep_length}
226 -msgf_max_pep_length ${advanced_options.searchengines_advanced_options.msgf.msgf_max_pep_length}
227 -msgf_termini ${advanced_options.searchengines_advanced_options.msgf.msgf_termini}
228 -msgf_num_ptms ${advanced_options.searchengines_advanced_options.msgf.msgf_num_ptms}
229 -msgf_instrument ${advanced_options.searchengines_advanced_options.msgf.msgf_instrument} 230 -msgf_instrument ${advanced_options.searchengines_advanced_options.msgf.msgf_instrument}
230 -msgf_fragmentation ${advanced_options.searchengines_advanced_options.msgf.msgf_fragmentation} 231 -msgf_fragmentation ${advanced_options.searchengines_advanced_options.msgf.msgf_fragmentation}
231 -msgf_protocol ${advanced_options.searchengines_advanced_options.msgf.msgf_protocol} 232 -msgf_protocol ${advanced_options.searchengines_advanced_options.msgf.msgf_protocol}
233 -msgf_termini ${advanced_options.searchengines_advanced_options.msgf.msgf_termini}
234 -msgf_min_pep_length ${advanced_options.searchengines_advanced_options.msgf.msgf_min_pep_length}
235 -msgf_max_pep_length ${advanced_options.searchengines_advanced_options.msgf.msgf_max_pep_length}
236 -msgf_num_ptms ${advanced_options.searchengines_advanced_options.msgf.msgf_num_ptms}
232 -msgf_num_matches ${advanced_options.searchengines_advanced_options.msgf.msgf_num_matches} 237 -msgf_num_matches ${advanced_options.searchengines_advanced_options.msgf.msgf_num_matches}
233 -msgf_additional ${advanced_options.searchengines_advanced_options.msgf.msgf_additional} 238 -msgf_additional ${advanced_options.searchengines_advanced_options.msgf.msgf_additional}
239 #if $advanced_options.searchengines_advanced_options.msgf.msgf_tasks.msgf_tasks_custom == "yes"
240 -msgf_num_tasks ${advanced_options.searchengines_advanced_options.msgf.msgf_tasks.msgf_num_tasks}
241 #end if
234 #end if 242 #end if
235 243
236 244
237 ## MSAMANDA ADVANCED PARAMETERS 245 ## MSAMANDA ADVANCED PARAMETERS
238 246
417 -novor_fragmentation ${advanced_options.searchengines_advanced_options.novor.novor_fragmentation} 425 -novor_fragmentation ${advanced_options.searchengines_advanced_options.novor.novor_fragmentation}
418 -novor_mass_analyzer ${advanced_options.searchengines_advanced_options.novor.novor_mass_analyzer} 426 -novor_mass_analyzer ${advanced_options.searchengines_advanced_options.novor.novor_mass_analyzer}
419 #end if 427 #end if
420 428
421 2> $temp_stderr); 429 2> $temp_stderr);
430
431 ## reading from the original .par file
432 content_par_target_path=`cat ./SEARCHGUI_IdentificationParameters_temp.par`;
433 ## modifying the .par file
434 ## First we establish the new content for the path: .searchParameters.fastaFile.path
435 new_content_par_target_path=`jq '.searchParameters.fastaFile.path = \$newVal' --arg newVal './input_database.fasta' <<< "\$content_par_target_path"`;
436 ## Secondly, for .proteinInferencePreferences.proteinSequenceDatabase.path
437 new_content_par_target_path=`jq '.proteinInferencePreferences.proteinSequenceDatabase.path = \$newVal' --arg newVal './input_database.fasta' <<< "\$new_content_par_target_path"`;
438
439 ## we generate a new .par file filled with the new fasta path.
440 echo 'Final identification parameters file: ';
441 #set $new_par_target_path = './SEARCHGUI_IdentificationParameters.par';
442 echo $new_par_target_path;
443 echo "\$new_content_par_target_path" >> $new_par_target_path;
444
445 ## compress both parameters and fasta file for the output
446 (zip ./IdentificationParametersAndFasta.zip ./SEARCHGUI_IdentificationParameters.par 2>> $temp_stderr)
447
448 &&
449
450 (zip -u ./IdentificationParametersAndFasta.zip ./input_database.fasta 2>> $temp_stderr);
422 451
423 exit_code_for_galaxy=\$?; 452 exit_code_for_galaxy=\$?;
424 cat $temp_stderr 2>&1; 453 cat $temp_stderr 2>&1;
425 (exit \$exit_code_for_galaxy) 454 (exit \$exit_code_for_galaxy)
426 ]]> 455 ]]>
805 <option value="no" selected="True">Default</option> 834 <option value="no" selected="True">Default</option>
806 </param> 835 </param>
807 <when value="no" /> 836 <when value="no" />
808 <when value="yes"> 837 <when value="yes">
809 <param name="msgf_decoy" type="boolean" truevalue="1" falsevalue="0" checked="false" 838 <param name="msgf_decoy" type="boolean" truevalue="1" falsevalue="0" checked="false"
810 label="MSGF: Search Decoys" help="If yes then a decoy database will be generated and searched. Assumed input database contains no decoys"/> 839 label="MSGF: Search Decoy Database" help="If yes then a decoy database will be generated and searched. Assumed input database contains no decoys"/>
811 <param name="msgf_min_pep_length" type="integer" value="6" 840 <param name="msgf_instrument" label="MSGF: MS/MS Detector" type="select" help="Identifier of the instrument to generate MS/MS spectra (used to determine the scoring model)">
812 label="MSGF: Minimum Peptide Length" help="Minimum length for a peptide to be considered"/> 841 <option value="0" >Low-res LCQ/LTQ</option>
813 <param name="msgf_max_pep_length" type="integer" value="30" 842 <option value="1" >Orbitrap/FTICR</option>
814 label="MSGF: Maximum Peptide Length" help="Maximum length for a peptide to be considered"/>
815 <param name="msgf_termini" type="select" format="txt"
816 label="MSGF: Number of tolerable termini" help="Searches will take much longer if selecting a value other than 2">
817 <option value="0">0 (ie non-specific cleavage)</option>
818 <option value="1">1 (ie semi-tryptic cleavage)</option>
819 <option value="2" selected="true">2 (ie fully-tryptic cleavage)</option>
820 </param>
821 <param name="msgf_num_ptms" label="MSGF: Max PTMs per peptide" type="integer" value="2"/>
822
823 <param name="msgf_instrument" label="MSGF: Instrument type" type="select" help="Identifier of the instrument to generate MS/MS spectra (used to determine the scoring model)">
824 <option value="0" selected="True">Low-res LCQ/LTQ</option>
825 <option value="1" >High-res LTQ</option>
826 <option value="2" >TOF</option> 843 <option value="2" >TOF</option>
827 <option value="3" >Q-Exactive</option> 844 <option value="3" selected="True">Q-Exactive</option>
828 </param> 845 </param>
829 <param name="msgf_fragmentation" label="MSGF: Fragmentation type" type="select" help="Fragmentation method identifier (used to determine the scoring model)"> 846 <param name="msgf_fragmentation" label="MSGF: Fragmentation method" type="select" help="Fragmentation method identifier (used to determine the scoring model)">
830 <option value="0" selected="True">As written in the spectrum or CID if no info</option> 847 <option value="0" >As written in the spectrum or CID if no info</option>
831 <option value="1" >CID</option> 848 <option value="1" >CID</option>
832 <option value="2" >ETD</option> 849 <option value="2" >ETD</option>
833 <option value="3" >HCD</option> 850 <option value="3" selected="True">HCD</option>
834 </param> 851 <option value="4" >UVPD</option>
835 <param name="msgf_protocol" label="MSGF: Protocol type" type="select" help="Protocol identifier. Protocols are used to enable scoring parameters for enriched and/or labeled samples"> 852 </param>
853 <param name="msgf_protocol" label="MSGF: Protocol" type="select" help="Protocol identifier. Protocols are used to enable scoring parameters for enriched and/or labeled samples">
836 <option value="0" selected="True">Automatic</option> 854 <option value="0" selected="True">Automatic</option>
837 <option value="1" >Phosphorylation</option> 855 <option value="1" >Phosphorylation</option>
838 <option value="2" >iTRAQ</option> 856 <option value="2" >iTRAQ</option>
839 <option value="3" >iTRAQPhospho</option> 857 <option value="3" >iTRAQPhospho</option>
840 <option value="4" >TMT</option> 858 <option value="4" >TMT</option>
841 <option value="5" >Standard</option> 859 <option value="5" >Standard</option>
842 </param> 860 </param>
843 <param name="msgf_num_matches" label="MSGF: Maximum Number of Spectrum Matches" type="integer" value="1" help="Number of peptide matches per spectrum to report" /> 861 <param name="msgf_termini" type="select" format="txt"
844 <param name="msgf_additional" label="MS-GF+ additional features" type="select" help="Additional features to export"> 862 label="MSGF: Enzymatic Terminals" help="Searches will take much longer if selecting a value other than 2">
863 <option value="0">None required</option>
864 <option value="1">At least one</option>
865 <option value="2" selected="true">Both</option>
866 </param>
867 <param name="msgf_min_pep_length" type="integer" value="8"
868 label="MSGF: Minimum Peptide Length" help="Minimum length for a peptide to be considered"/>
869 <param name="msgf_max_pep_length" type="integer" value="30"
870 label="MSGF: Maximum Peptide Length" help="Maximum length for a peptide to be considered"/>
871 <param name="msgf_num_ptms" label="MSGF: Max Variable PTMs per Peptide" type="integer" value="2"/>
872 <param name="msgf_num_matches" label="MSGF: Number of Spectrum Matches" type="integer" value="10" help="Number of peptide matches per spectrum to report" />
873 <param name="msgf_additional" label="MS-GF+ additional Output" type="select" help="Additional features to export">
845 <option value="0" selected="True">output basic scores only</option> 874 <option value="0" selected="True">output basic scores only</option>
846 <option value="1" >output additional features</option> 875 <option value="1" >output additional features</option>
847 </param> 876 </param>
877 <conditional name="msgf_tasks">
878 <param name="msgf_tasks_custom" type="select" label="Number of tasks to use on the threads">
879 <option value="yes">Custom</option>
880 <option value="no" selected="True">Default</option>
881 </param>
882 <when value="no" />
883 <when value="yes">
884 <param name="msgf_num_tasks" type="integer" value="4"
885 label="MSGF: Custom number of tasks to use on the threads"
886 help="Manually set the number of tasks to create for the search. More tasks than threads will reduce the memory requirements of the search, but will be slower (how much depends on the inputs). Check the documentation carefully. "/>
887 </when>
888 </conditional>
848 </when> 889 </when>
849 </conditional> 890 </conditional>
850 891
851 <!-- MS-AMANDA ADVANCED PARAMETERS --> 892 <!-- MS-AMANDA ADVANCED PARAMETERS -->
852 <conditional name="ms_amanda"> 893 <conditional name="ms_amanda">
1220 </section> 1261 </section>
1221 </section> 1262 </section>
1222 1263
1223 </inputs> 1264 </inputs>
1224 <outputs> 1265 <outputs>
1225 <data name="Searchgui_Identification_Parameters" format="par" from_work_dir="SEARCHGUI_IdentificationParameters.par" label="${tool.name}: PAR file on ${on_string}" /> 1266 <!-- <data name="Searchgui_Identification_Parameters" format="par" from_work_dir="SEARCHGUI_IdentificationParameters.par" label="${tool.name}: PAR file on ${on_string}" /> -->
1267 <data name="Identification_Parameters_And_Fasta" format="zip" from_work_dir="IdentificationParametersAndFasta.zip" label="${tool.name}: Compressed PAR and FASTA files on ${on_string}" />
1226 </outputs> 1268 </outputs>
1227 <tests> 1269 <tests>
1228 1270
1229 <!-- Test that default parameters generates a standar par file --> 1271 <!-- Test that default parameters generates a standar par file -->
1230 <test> 1272 <test>
1231 <param name="input_database" value="searchgui_tinydb1_concatenated_target_decoy.fasta" ftype="fasta"/> 1273 <param name="input_database" value="searchgui_tinydb1_concatenated_target_decoy.fasta" ftype="fasta"/>
1232 <output name="Searchgui_Identification_Parameters" file="Identification_Parameters_default.par" ftype="par" compare="sim_size" delta="1000" /> 1274 <output name="Identification_Parameters_And_Fasta" file="IdentificationParametersAndFastaDefault.zip" ftype="zip" compare="sim_size" delta="1000" />
1233 </test> 1275 </test>
1234 <!-- Test specific parameters --> 1276 <!-- Test specific parameters -->
1235 <test> 1277 <test>
1236 <param name="input_database" value="searchgui_tinydb1_concatenated_target_decoy.fasta" ftype="fasta"/> 1278 <param name="input_database" value="searchgui_tinydb1_concatenated_target_decoy.fasta" ftype="fasta"/>
1237 <param name="precursor_ion_tol" value="100"/> 1279 <param name="precursor_ion_tol" value="100"/>
1239 <param name="variable_modifications" value="Oxidation of M"/> 1281 <param name="variable_modifications" value="Oxidation of M"/>
1240 <param name="min_charge" value="1"/> 1282 <param name="min_charge" value="1"/>
1241 <param name="max_charge" value="3"/> 1283 <param name="max_charge" value="3"/>
1242 <param name="xtandem_advanced" value="yes"/> 1284 <param name="xtandem_advanced" value="yes"/>
1243 <param name="xtandem_refine_selector" value="yes"/> 1285 <param name="xtandem_refine_selector" value="yes"/>
1244 <output name="Searchgui_Identification_Parameters" file="Identification_Parameters_specific.par" ftype="par" compare="sim_size" delta="5000" /> 1286 <output name="Identification_Parameters_And_Fasta" file="IdentificationParametersAndFastaSpecific.zip" ftype="zip" compare="sim_size" delta="1000" />
1245 </test> 1287 </test>
1246 1288
1247 </tests> 1289 </tests>
1248 <help> 1290 <help>
1249 **What it does** 1291 **What it does**
1250 1292
1251 Creates a parameters file which can be used independently by SearchGUI or PeptideShaker apps. 1293 Creates a zip file containing:
1252 1294
1253 FASTA file used by this app must be kept in the history as the generated .par file will reference to it. 1295 - A fasta file.
1254 1296 - A parameters file (.par) which can be used independently by SearchGUI or PeptideShaker apps. It makes reference to the previous fasta file.
1255 A FASTA file with decoy sequences is recommended if SearchGUI and PeptideShaker are going to be used. 1297
1298 A FASTA file with decoy sequences generated by FastaCLI is recommended if SearchGUI and PeptideShaker are going to use the output of this tool.
1256 1299
1257 </help> 1300 </help>
1258 <expand macro="citations" /> 1301 <expand macro="citations" />
1259 </tool> 1302 </tool>