Mercurial > repos > iuc > gatk2
changeset 2:28b85e2409ce draft
Uploaded
author | bgruening |
---|---|
date | Sat, 30 Nov 2013 10:36:47 -0500 |
parents | c8752e31f496 |
children | b7ef18eaa9c9 |
files | base_recalibrator.xml indel_realigner.xml print_reads.xml realigner_target_creator.xml tool_dependencies.xml |
diffstat | 5 files changed, 47 insertions(+), 47 deletions(-) [+] |
line wrap: on
line diff
--- a/base_recalibrator.xml Tue Nov 26 06:10:20 2013 -0500 +++ b/base_recalibrator.xml Sat Nov 30 10:36:47 2013 -0500 @@ -1,5 +1,5 @@ <tool id="gatk2_base_recalibrator" name="Base Recalibrator" version="0.0.7"> - <description>on BAM files</description> + <description>calculates covariates used to recalibrate base quality scores of reads</description> <expand macro="requirements" /> <macros> <import>gatk2_macros.xml</import> @@ -20,6 +20,9 @@ --num_cpu_threads_per_data_thread 8 @THREADS@ + ## we set non standards at every run and the user can choose which ones are preferred + ## in our select box both standard options (ContextCovariate, CycleCovariate) are selected by default + --no_standard_covs #if $reference_source.reference_source_selector != "history": -R "${reference_source.ref_file.fields.path}" @@ -28,15 +31,11 @@ --BQSR "${input_recal}" #end if --out "${output_recal}" - ${standard_covs} #if str( $covariates ) != "None": #for $cov in str( $covariates ).split( ',' ): -cov "${cov}" #end for #end if - #if $plot_pdf: - --plot_pdf_file $output_pdf - #end if ' #set $snp_dataset_provided = False @@ -118,26 +117,25 @@ Please be aware that one should only run recalibration with the covariates file created on the same input bam(s). </help> </param> - <param name="standard_covs" type="boolean" truevalue="" falsevalue="--no_standard_covs" checked="false" label="Do not use the standard set of covariates in addition to the ones selected" help="--no_standard_covs/-noStandard" /> + <param name="covariates" type="select" multiple="True" display="checkboxes" label="Covariates to be used in the recalibration" help="-cov,--covariate &lt;covariate&gt;" > <!-- might we want to load the available covariates from an external configuration file, since additional ones can be added to local installs? --> - <option value="ReadGroupCovariate" /> + <option value="ContextCovariate" selected="true"/> + <option value="CycleCovariate" selected="true"/> + <option value="RepeatLengthCovariate" /> + <option value="RepeatUnitCovariate" /> + <option value="RepeatUnitAndLengthCovariate" /> + <!-- + Note: ReadGroupCovariate and QualityScoreCovariate are required covariates and will + be added for the user regardless of whether or not they were specified. <option value="QualityScoreCovariate" /> - <option value="CycleCovariate" /> - <option value="ContextCovariate" /> - <!-- covariates below were pulled from list option --> - <option value="HomopolymerCovariate" /> - <option value="GCContentCovariate" /> - <option value="MappingQualityCovariate" /> - <option value="MinimumNQSCovariate" /> - <option value="PositionCovariate" /> - <option value="PrimerRoundCovariate" /> - <option value="TileCovariate" /> + <option value="ReadGroupCovariate" /> + --> </param> - <repeat name="rod_bind" title="Binding for reference-ordered data" help="-knownSites,--knownSites &lt;knownSites&gt;"> + <repeat name="rod_bind" title="Known Variants" help="Using data sets of known variants (-knownSites,--knownSites &lt;knownSites&gt;)"> <conditional name="rod_bind_type"> - <param name="rod_bind_type_selector" type="select" label="Binding Type"> + <param name="rod_bind_type_selector" type="select" label="Variant Type"> <option value="dbsnp" selected="True">dbSNP</option> <option value="snps">SNPs</option> <option value="indels">INDELs</option> @@ -145,24 +143,24 @@ <option value="custom">Custom</option> </param> <when value="dbsnp"> - <param name="input_rod" type="data" format="vcf,gatk_dbsnp,bed" label="ROD file" /> + <param name="input_rod" type="data" format="vcf,gatk_dbsnp,bed" label="Variant file" /> </when> <when value="snps"> - <param name="input_rod" type="data" format="vcf,gatk_dbsnp,bed" label="ROD file" /> + <param name="input_rod" type="data" format="vcf,gatk_dbsnp,bed" label="Variant file" /> </when> <when value="indels"> - <param name="input_rod" type="data" format="vcf,gatk_dbsnp,bed" label="ROD file" /> + <param name="input_rod" type="data" format="vcf,gatk_dbsnp,bed" label="Variant file" /> </when> <when value="mask"> - <param name="input_rod" type="data" format="vcf,gatk_dbsnp,bed" label="ROD file" /> + <param name="input_rod" type="data" format="vcf,gatk_dbsnp,bed" label="Variant file" /> </when> <when value="custom"> - <param name="custom_rod_name" type="text" value="Unknown" label="ROD Name"/> - <param name="input_rod" type="data" format="vcf,gatk_dbsnp,bed" label="ROD file" /> + <param name="custom_rod_name" type="text" value="Unknown" label="Customer's variant file"/> + <param name="input_rod" type="data" format="vcf,gatk_dbsnp,bed" label="Variant file" /> </when> </conditional> </repeat> - <param name="plot_pdf" type="boolean" truevalue="--plot_pdf_file" falsevalue="" checked="False" label="Output recalibration plots pdf"/> + <expand macro="gatk_param_type_conditional" /> <conditional name="analysis_param_type"> @@ -243,9 +241,6 @@ <outputs> <data format="gatk_report" name="output_recal" label="${tool.name} on ${on_string} (Covariate File)" /> <data format="txt" name="output_log" label="${tool.name} on ${on_string} (log)" /> - <data format="pdf" name="output_pdf" label="${tool.name} on ${on_string} (plot_pdf_file)"> - <filter>plot_pdf == True</filter> - </data> </outputs> <tests> <test>
--- a/indel_realigner.xml Tue Nov 26 06:10:20 2013 -0500 +++ b/indel_realigner.xml Sat Nov 30 10:36:47 2013 -0500 @@ -87,26 +87,26 @@ </when> </conditional> <param name="target_intervals" type="data" format="gatk_interval,bed,picard_interval_list" label="Restrict realignment to provided intervals" help="-targetIntervals,--targetIntervals &lt;targetIntervals&gt;" /> - <repeat name="rod_bind" title="Binding for reference-ordered data" help="-known,--knownAlleles &lt;knownAlleles&gt;"> + <repeat name="rod_bind" title="Known Variants" help="Using data sets of known variants (-known,--knownAlleles &lt;knownAlleles&gt;)"> <conditional name="rod_bind_type"> - <param name="rod_bind_type_selector" type="select" label="Binding Type"> + <param name="rod_bind_type_selector" type="select" label="Variant Type"> <option value="dbsnp" selected="True">dbSNP</option> <option value="snps">SNPs</option> <option value="indels">INDELs</option> <option value="custom">Custom</option> </param> <when value="dbsnp"> - <param name="input_rod" type="data" format="vcf" label="ROD file" /> + <param name="input_rod" type="data" format="vcf" label="Variant file (VCF format)" /> </when> <when value="snps"> - <param name="input_rod" type="data" format="vcf" label="ROD file" /> + <param name="input_rod" type="data" format="vcf" label="Variant file (VCF format)" /> </when> <when value="indels"> - <param name="input_rod" type="data" format="vcf" label="ROD file" /> + <param name="input_rod" type="data" format="vcf" label="Variant file (VCF format)" /> </when> <when value="custom"> - <param name="custom_rod_name" type="text" value="Unknown" label="ROD Name"/> - <param name="input_rod" type="data" format="vcf" label="ROD file" /> + <param name="custom_rod_name" type="text" value="Unknown" label="Customer's variant file"/> + <param name="input_rod" type="data" format="vcf" label="Variant file (VCF format)" /> </when> </conditional> </repeat>
--- a/print_reads.xml Tue Nov 26 06:10:20 2013 -0500 +++ b/print_reads.xml Sat Nov 30 10:36:47 2013 -0500 @@ -73,7 +73,8 @@ #end if </command> <inputs> - <param name="input_recal" type="data" format="csv" optional="true" label="Covariates table recalibration file" help="-BQSR,--BQSR &lt;recal_file&gt;" /> + <param name="input_recal" type="data" format="gatk_report" optional="true" label="Covariates table recalibration file" + help="The input covariates table file which enables on-the-fly base quality score recalibration (intended for use with BaseRecalibrator files) (-BQSR,--BQSR)" /> <conditional name="reference_source"> <expand macro="reference_source_selector_param" /> <when value="cached"> @@ -212,7 +213,7 @@ **Inputs** -GenomeAnalysisTK: PrintReads accepts an aligned BAM and a recalibration CSV input files. +GenomeAnalysisTK: PrintReads accepts an aligned BAM and a recalibration (gatk_report) input files. **Outputs** @@ -235,7 +236,7 @@ exception_if_no_tile If provided, TileCovariate will throw an exception when no tile can be found. The default behavior is to use tile = -1 solid_recal_mode How should we recalibrate solid bases in whichthe reference was inserted? Options = DO_NOTHING, SET_Q_ZERO, SET_Q_ZERO_BASE_N, or REMOVE_REF_BIAS (DO_NOTHING|SET_Q_ZERO|SET_Q_ZERO_BASE_N|REMOVE_REF_BIAS) solid_nocall_strategy Defines the behavior of the recalibrator when it encounters no calls in the color space. Options = THROW_EXCEPTION, LEAVE_READ_UNRECALIBRATED, or PURGE_READ (THROW_EXCEPTION|LEAVE_READ_UNRECALIBRATED|PURGE_READ) - recal_file Filename for the input covariates table recalibration .csv file + recal_file Filename for the input covariates table recalibration .gatk_report file out The output BAM file bam_compression Compression level to use for writing BAM files disable_bam_indexing Turn off on-the-fly creation of indices for output BAM files.
--- a/realigner_target_creator.xml Tue Nov 26 06:10:20 2013 -0500 +++ b/realigner_target_creator.xml Sat Nov 30 10:36:47 2013 -0500 @@ -74,26 +74,26 @@ </when> </conditional> - <repeat name="rod_bind" title="Binding for reference-ordered data" help="-known,--known &lt;known&gt;"> + <repeat name="rod_bind" title="Known Variants" help="Using data sets of known variants (-known,--known &lt;known&gt;)"> <conditional name="rod_bind_type"> - <param name="rod_bind_type_selector" type="select" label="Binding Type"> + <param name="rod_bind_type_selector" type="select" label="Variant Type"> <option value="dbsnp" selected="True">dbSNP</option> - <option value="snps">SNPs</option> + <option value="snps">SNPs</option> <option value="indels">INDELs</option> <option value="custom">Custom</option> </param> <when value="dbsnp"> - <param name="input_rod" type="data" format="vcf" label="ROD file" /> + <param name="input_rod" type="data" format="vcf" label="Variant file (VCF format)" /> </when> <when value="snps"> - <param name="input_rod" type="data" format="vcf" label="ROD file" /> + <param name="input_rod" type="data" format="vcf" label="Variant file (VCF format)" /> </when> <when value="indels"> - <param name="input_rod" type="data" format="vcf" label="ROD file" /> + <param name="input_rod" type="data" format="vcf" label="Variant file (VCF format)" /> </when> <when value="custom"> - <param name="custom_rod_name" type="text" value="Unknown" label="ROD Name"/> - <param name="input_rod" type="data" format="vcf" label="ROD file" /> + <param name="custom_rod_name" type="text" value="Unknown" label="Customer's variant file" /> + <param name="input_rod" type="data" format="vcf" label="Variant file (VCF format)" /> </when> </conditional> </repeat>
--- a/tool_dependencies.xml Tue Nov 26 06:10:20 2013 -0500 +++ b/tool_dependencies.xml Sat Nov 30 10:36:47 2013 -0500 @@ -4,6 +4,10 @@ <environment_variable action="set_to" name="GATK2_PATH">/please set the path to your GATK2 dir in the corresponding env.sh file/</environment_variable> </set_environment> <!-- + Use GATK2_SITE_OPTIONS to set additional parameters that should be inserted in every GATK2 call. + The intended use case was to prohibit GATK2 to collect and send data. + For example: + -et "NO_ET" -K "/data/gatk2_key_file" ##ET no phone home --> <set_environment version="1.0">