view falco-call.xml @ 59:73eda23fb8fd draft

Uploaded
author stef
date Wed, 25 Feb 2015 08:50:56 -0500
parents e7de191375e6
children 2820aab8b9c8
line wrap: on
line source

<tool id="falco-call" name="falco-call" version="0.0.1">
  
  <requirements>
    
    <requirement type="package" version="0.1.19">samtools</requirement>
    <requirement type="package" version="3.0.3">R</requirement>
    
  </requirements>

  <description>FALCO: Amplicon Analysis Pipeline</description>

  <command interpreter="bash">
    falco-call.sh $falco_cfg;
  </command>

  <stdio>
    <!-- Anything higher than 0 means the bash script didnt finish -->
    <exit_code range="1:" level="fatal" description="Bash script didnt finish correctly, check log" />
  </stdio>
  
  <inputs>
    <!-- ==================== -->
    <!-- General inputs -->
    <!-- ==================== -->
    <conditional name="genomeSource">
      <param name="refGenomeSource" type="select" label="You can select a reference genome from your history or use a built-in index">
        <option value="indexed">Use a built-in index</option>
        <option value="history">Use one from history</option>
      </param>
      <when value="indexed">
        <param name="indices" type="select" label="Select a reference genome">
          <options from_data_table="all_fasta">
            <filter type="sort_by" column="2" />
            <validator type="no_options" message="No indexes are available in table" />
          </options>
        </param>
      </when>
      <when value="history">
        <param name="ownFile" type="data" format="fasta" metadata_name="dbkey" label="Select a reference from history" />
      </when>
    </conditional>

    <param name="jobName" type="text" optional="false" label="Analysis/ouput name" help="Supply a name for the outputs to remind you what they contain" value="TEST">
      <validator type="empty_field" />
      <validator type="regex" message="This field may contain only non-whitespace characters">\S+</validator>
    </param>
    <param name="bam" type="data" multiple="false" optional="false" format="bam" label="Input BAM" help="Select BAM file" />

    <param format="tsv" name="filter_file" optional="True" type="data" label="FILTER File" help="When left empty, default list of genomic positions is used"/>
    <param format="txt" name="manifest_file" optional="True" type="data" label="MANIFEST File" help="When left empty, default Cancer Panel is used"/>

    <!-- ==================== -->
    <!-- Option to use your own bin annotations -->
    <!-- ==================== -->
  
  </inputs>
  
  <!-- ==================== -->
  <!-- This config is sourced by tool -->
  <!-- ==================== -->
  <configfiles>
    <configfile name="falco_cfg">
      filter_file=$filter_file
      manifest_file=$manifest_file
      bam_file=$bam
      bam_name=$bam.name
      html_out=$html_output
      vcf_out=$vcf_output
      qc_ann_qual_out=$qc_ann_qual_output
      qc2_ann_txt_out=$qc2_ann_txt_output
      qc_targets_txt_out=$qc_targets_txt_output

      out_path=${html_output.files_path}
      job_name=$jobName
      ## reference source
      REF_SOURCE="${genomeSource.refGenomeSource}"
      #if $genomeSource.refGenomeSource == "history":
        ##build index on the fly
        REF_FILE="${genomeSource.ownFile}"
        DB_KEY="${dbkey}"
      #else:
        ##use precomputed indexes
        REF_FILE="${genomeSource.indices.fields.path}"
      #end if
    </configfile>
  </configfiles>

  <!-- ==================== -->
  <!-- Main output is an html based report, additional on request -->
  <!-- ==================== -->
  <outputs>
    <data format="html" name="html_output" label="FALCO-calling (${jobName})" />
    <data format="vcf" name="vcf_output" label="FALCO-calling (${jobName}): VCF" />
    <data format="txt" name="qc_ann_qual_output" label="FALCO-calling (${jobName}): qc_ann_qual" />
    <data format="txt" name="qc2_ann_txt_output" label="FALCO-calling (${jobName}): qc2_ann" />
    <data format="txt" name="qc_targets_txt_output" label="FALCO-calling (${jobName}): qc_targets" />
  </outputs>

  <!-- ==================== -->
  <!-- Tests still to be done -->
  <!-- ==================== -->

  <!-- 
  <tests>
    <test>
      <param name="input1" value="input1" />   
      <param name="input2" value="input2" />   
    </test>
  </tests>
  -->

  <help>
.. class:: infomark

**Introduction**

This tool is a wrapper for the variant caller FALCO_ which is part of the Amplicon Analysis Pipeline (AAP)

.. _FALCO: https://github.com/tgac-vumc/falco/

Calls and annotates genomic variants for each amplicon in a design.

**Notes**

Because each amplicon is considered separate test, if two amplicons overlap this can cause the same variant position to be present twice in the output VCF. This is intentional, you can use this to evaluate the quality of the variant call beyond the amplicon.

-----

**Citation**

For the underlying tool please cite: Daoud Sie et al. Performance of amplicon-based next generation DNA sequencing for diagnostic gene mutation profiling in oncopathology (Cell Oncol 2014 Oct;37(5):353-61). [Pubmed]

.. _Pubmed: http://www.ncbi.nlm.nih.gov/pubmed/25209392

  </help>

</tool>