view tools/clc_assembly_cell/clc_assembler.xml @ 0:7b96d8a3262f draft

Uploaded v0.0.0, wrappers for the CLCbio assembler and mapper only.
author peterjc
date Thu, 31 Oct 2013 07:57:41 -0400
children 6e145e4715a7
line wrap: on
line source

<tool id="clc_assembler" name="CLC assembler" version="0.0.1">
    <!-- One-line summary of what the tool does. -->
    <description>Assembles reads giving a FASTA file</description>
        <!-- External binary this wrapper depends on.
             NOTE(review): no enclosing requirements element is visible around
             this line; confirm it exists in the full file. -->
        <requirement type="binary">clc_assembler</requirement>
    <!-- Runs the assembler with no arguments and keeps only the output lines
         that mention "version" (case-insensitive). The absolute path is
         specific to one installation. -->
    <version_command>/mnt/apps/clcBio/clc-assembly-cell-4.1.0-linux_64/clc_assembler | grep -i version</version_command>
## Emit one set of read options for every entry of the read_group repeat.
#for $rg in $read_group
#if str($rg.segments.type) == "paired"
## Two files: pairing layout and size limits, then -i followed by both files.
-p $rg.segments.placement $rg.segments.dist_mode $rg.segments.min_size $rg.segments.max_size -q -i "$rg.segments.filename1" "$rg.segments.filename2"
#end if
#if str($rg.segments.type) == "interleaved"
## One interleaved file: same pairing options, single file after -q.
-p $rg.segments.placement $rg.segments.dist_mode $rg.segments.min_size $rg.segments.max_size -q "$rg.segments.filename"
#end if
#if str($rg.segments.type) == "none"
-p no -q
## Write out every selected file; an empty loop body would leave the
## "-p no -q" option without any unpaired read files.
#for $f in $rg.segments.filenames
"$f"
#end for
#end if
#end for
-o "$out_fasta"
-v | grep -v "^Progress: "</command>
        <!-- Assume anything other than zero is an error:
             "1:" matches exit codes of 1 and above, ":-1" matches -1 and below.
             NOTE(review): no enclosing stdio element is visible around these
             lines; confirm it exists in the full file. -->
        <exit_code range="1:" />
        <exit_code range=":-1" />
        <!-- One or more groups of reads. Each group selects its own layout
             through the "segments" conditional; the command template loops
             over $read_group and reads the fields of the chosen branch. -->
        <repeat name="read_group" title="Read Group" min="1">
            <conditional name="segments">
                <param name="type" type="select" label="Are these paired reads?">
                    <option value="paired">Paired reads (as two files)</option>
                    <option value="interleaved">Paired reads (as one interleaved file)</option>
                    <option value="none">Unpaired reads (single or orphan reads)</option>
                </param>
                <!-- Paired reads supplied as two separate files. -->
                <when value="paired">
                    <param name="placement" type="select" label="Pairing type (segment placing)">
                        <option value="fb">---&gt; &lt;--- (e.g. Sanger capillary or Solexa/Illumina paired-end library)</option>
                        <option value="bf">&lt;--- ---&gt; (e.g. Solexa/Illumina mate-pair library)</option>
                        <option value="ff">---&gt; ---&gt;</option>
                        <option value="bb">&lt;--- &lt;---</option>
                    </param>
                    <param name="dist_mode" type="select" label="How is the fragment distance measured?">
                        <option value="ss">Start to start (e.g. Sanger capillary or Solexa/Illumina libraries)</option>
                        <option value="se">Start to end</option>
                        <option value="es">End to start</option>
                        <option value="ee">End to end</option>
                    </param>
                    <!-- TODO - min/max validation done via the <code> tag? -->
                    <param name="min_size" type="integer" optional="false" min="0" value=""
                           label="Minimum size of 'good' DNA templates in the library preparation" />
                    <param name="max_size" type="integer" optional="false" min="0" value=""
                           label="Maximum size of 'good' DNA templates in the library preparation" />
                    <param name="filename1" type="data" format="fastq,fasta" required="true" label="Read file one"/>
                    <param name="filename2" type="data" format="fastq,fasta" required="true" label="Read file two"/>
                </when>
                <!-- Paired reads supplied as a single interleaved file; same
                     pairing options as the two-file case. -->
                <when value="interleaved">
                    <param name="placement" type="select" label="Pairing type (segment placing)">
                        <option value="fb">---&gt; &lt;--- (e.g. Sanger capillary or Solexa/Illumina paired-end library)</option>
                        <option value="bf">&lt;--- ---&gt; (e.g. Solexa/Illumina mate-pair library)</option>
                        <option value="ff">---&gt; ---&gt;</option>
                        <option value="bb">&lt;--- &lt;---</option>
                    </param>
                    <param name="dist_mode" type="select" label="How is the fragment distance measured?">
                        <option value="ss">Start to start (e.g. Sanger capillary or Solexa/Illumina libraries)</option>
                        <option value="se">Start to end</option>
                        <option value="es">End to start</option>
                        <option value="ee">End to end</option>
                    </param>
                    <!-- TODO - min/max validation done via the <code> tag? -->
                    <param name="min_size" type="integer" optional="false" min="0" value=""
                           label="Minimum size of 'good' DNA templates in the library preparation" />
                    <param name="max_size" type="integer" optional="false" min="0" value=""
                           label="Maximum size of 'good' DNA templates in the library preparation" />
                    <param name="filename" type="data" format="fastq,fasta" required="true" label="Interleaved read file"/>
                </when>
                <!-- Unpaired reads: one or more files, no pairing options. -->
                <when value="none">
                    <param name="filenames" type="data" format="fastq,fasta" multiple="true" required="true" label="Read file(s)"
                           help="Multiple files allowed, for example several files of orphan reads." />
                </when>
            </conditional>
        </repeat>
        <!-- Word size? -->
        <!-- Bubble size? -->
        <!-- Scaffolding options? -->
        <!-- Minimum contig length? -->
        <!-- AGP / GFF output? -->
    <!-- min/max validation? <code file="" /> -->
        <!-- FASTA file of contigs; the command template passes it to the
             assembler as -o "$out_fasta". -->
        <data name="out_fasta" format="fasta" label="CLCbio assembler contigs (FASTA)" />
        <!-- TODO -->

**What it does**

Runs the ``clc_assembler`` tool giving a FASTA output file. You would then
typically map the same set of reads onto this assembly using ``clc_mapper``
to perform any downstream analysis using the mapped reads.


If you use this Galaxy tool in work leading to a scientific publication please
cite this wrapper as:

Peter J.A. Cock (2013), Galaxy wrapper for the CLC Assembly Cell suite from CLCbio

This wrapper is available to install into other Galaxy Instances via the Galaxy
Tool Shed at