diff cgatools/tools/cgatools_1.6/evidence2sam.xml @ 20:382c50ce0519 draft

Uploaded
author bcrain-completegenomics
date Tue, 04 Sep 2012 18:46:40 -0400
parents
children
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/cgatools/tools/cgatools_1.6/evidence2sam.xml	Tue Sep 04 18:46:40 2012 -0400
@@ -0,0 +1,229 @@
+<tool id="cg_evidence2sam" name="evidence2sam(beta) 1.6" version="1.0.0">
+<!--
+This tool creates a GUI for the evidence2sam function of cgatools from Complete Genomics, Inc.
+written 8-31-2012 by bcrain@completegenomics.com
+-->
+
+  <description>converts evidence mappings to SAM format</description>
+  
+  <command>
+<!-- print version of cgatools to STDOUT-->
+cgatools | head -1;
+
+<!-- print command lines to STDOUT-->
+echo "cgatools evidence2sam --beta
+--reference $crr.fields.path
+--output $output
+--evidence-dnbs $data_sources.input
+--consistent-mapping-range $range
+#if $region.selectregion == "yes"
+--extract-genomic-region $region.coordinates
+#end if
+$duplicates
+$mates
+$intervals
+$skip
+$svcandidates
+$unmapped
+$primary
+";
+
+<!-- execute cgatools-->
+cgatools evidence2sam --beta
+--reference $crr.fields.path
+--evidence-dnbs $data_sources.input
+#if $region.selectregion == "yes"
+	--extract-genomic-region $region.coordinates
+#end if
+$duplicates
+$mates
+$intervals
+$skip
+$svcandidates
+$unmapped
+$primary
+--consistent-mapping-range $range
+--output $output
+  </command>
+
+  <outputs>
+    <data format="tabular" name="output" label="${tool.name} output"/>
+  </outputs>
+  
+  <inputs>
+		<!--form field to select crr file-->
+		<param name="crr" type="select" label="Reference genome (.crr file)">
+			<options from_data_table="cg_crr_files" />
+		</param>
+	
+		<!--conditional to select input file-->
+  	<conditional name="data_sources">
+      <param name="data_source" type="select" label="Where is the input evidence file?">
+        <option value="in">imported into Galaxy</option>
+        <option value="out" selected="true">located outside Galaxy (data on server or mounted drive)</option>
+      </param>
+      
+			<!--form field to select evidence files-->
+      <when value="in">
+				<param name="input" type="data" format="tabluar" label="EvidenceDnbs file">
+					<validator type="dataset_ok_validator" />
+					<validator type="dataset_metadata_in_file" filename="cg_crr_files.loc"
+					 metadata_name="dbkey" metadata_column="1"
+					 message="cgatools is not currently available for this build."/>
+				</param>
+			</when>
+			
+			<!--form field to enter external input file-->
+      <when value="out">
+				<param name="input" type="text" label="EvidenceDnbs file (/path/file)" size="40" help="e.g. /harddrive/GS00000XXXX-DID/GS00000YYYY-ASM/GS00123-DNA_G01_2000/ASM/EVIDENCE/evidenceDnbs-chr21-GS00000YYYY-ASM.tsv.bz2">
+					<validator type="empty_field" message="You must supply an evidenceDnbs file"/>
+				</param>
+			</when>
+		</conditional>
+
+		<!--form field to select chromosomal region-->
+		<conditional name="region">
+			<param name="selectregion" type="select" label="Do you what to extract specific genomic region?">
+				<option value="no" selected="true">no</option>
+				<option value="yes">yes</option>
+			</param>
+
+			<when value="yes">
+				<param name="coordinates" type="text" label="Enter genomic coordinates to avoid converting the entire file (chr,from,to)" size="40" help="Specify the region as a half-open interval chr,from,to (e.g. chrX,15203639,15412498)"/>
+			</when>
+		</conditional>
+		
+		<!--form field to select duplicate handling-->
+		<param name="duplicates" type="select" label="Keep local duplicates of DNB mappings (default no)" help="All the output SAM records will be marked as 'not primary' if this option is used.">
+			<option value="" selected="true">no</option>
+			<option value="--keep-duplicates">yes</option>
+		</param>
+
+		<!--form field to generate mate sequence-->
+		<param name="mates" type="select" label="Generate mate sequence (R2) and score (Q2) tags (default no)">
+			<option value="" selected="true">no</option>
+			<option value="--add-mate-sequence">yes</option>
+		</param>
+
+		<!--form field to generate interval ids-->
+		<param name="intervals" type="select" label="Generate interval id (ZI:I) and allele id (ZA:I) tags (default no)">
+			<option value="" selected="true">no</option>
+			<option value="--add-allele-id">yes</option>
+		</param>
+
+		<!--form field to skip not mapped reads-->
+		<param name="skip" type="select" label="Skip not mapped records (default no)">
+			<option value="" selected="true">no</option>
+			<option value="--skip-not-mapped">yes</option>
+		</param>
+
+		<!--form field to skip not mapped reads-->
+		<param name="svcandidates" type="select" label="Mate unique single arm mappings in SAM including those on different stands and chromosomes (default no)">
+			<option value="" selected="true">no</option>
+			<option value="--mate-sv-candidates">yes</option>
+		</param>
+
+		<!--form field to skip not mapped reads-->
+		<param name="unmapped" type="select" label="Generate mate sequence and score tags for inconsistent mappings only (default no)">
+			<option value="" selected="true">no</option>
+			<option value="--add-unmapped-mate-info">yes</option>
+		</param>
+
+		<!--form field to skip not mapped reads-->
+		<param name="primary" type="select" label="Use primary mappings only (default no)" help="Report only the best mappings">
+			<option value="" selected="true">no</option>
+			<option value="--primary-mappings-only">yes</option>
+		</param>
+
+		<param name="range" type="integer" value="1300" label="Maximum distance between consistent mates (default 1300)">
+			<validator type="empty_field" message="You must enter a value, the default is 1300" />
+		</param>
+  </inputs>
+
+	<stdio>
+		<regex match="failed" source="stderr" level="fatal"/>
+		<regex match="error" source="stderr" level="fatal"/>
+		<regex match="Export the sequence:" source="stderr" level="warning" description="Finished:" />
+	</stdio>
+
+  <help>
+  
+**What it does**
+
+This tool uses cgatools evidence2sam to convert Complete Genomics evidence mappings to SAM format
+
+**cgatools 1.6.0 Documentation**
+
+Userguide: http://cgatools.sourceforge.net/docs/1.6.0/cgatools-user-guide.pdf
+
+Release notes: http://cgatools.sourceforge.net/docs/1.6.0/cgatools-release-notes.pdf
+
+**Command line reference**::
+
+		COMMAND NAME
+				evidence2sam - Converts CGI variant evidence data into SAM format.
+		
+		DESCRIPTION
+				The evidence2sam converter takes as input evidence mapping files 
+				(evidenceDnbs-*) and generates one SAM file as an output. The output is 
+				sent into stdout by default. By default, all the evidence mapping records 
+				from the input are converted into a pair of corresponding SAM records - one
+				record for each HalfDNB. The negative gaps in CGI mappings are represented 
+				using GS/GQ/GC tags.
+		
+		OPTIONS
+			-h [ --help ] 
+						Print this help message.
+		
+			--beta 
+						This is a beta command. To run this command, you must pass the --beta 
+						flag.
+		
+			-e [ --evidence-dnbs ] arg
+						Input evidence dnbs file.
+		
+			-s [ --reference ] arg
+						Reference file.
+		
+			-o [ --output ] arg (=STDOUT)
+						The output SAM file (may be omitted for stdout).
+		
+			-r [ --extract-genomic-region ] arg
+						defines a region as a half-open interval 'chr,from,to'.
+		
+			--keep-duplicates 
+						Keep local duplicates of DNB mappings.All the output SAM records will 
+						be marked as not primary if this option is used.
+		
+			--add-allele-id 
+						Generate interval id and allele id tags.
+		
+			--skip-not-mapped 
+						Skip not mapped records
+		
+			--add-mate-sequence 
+						Generate mate sequence and score tags.
+		
+			--mate-sv-candidates 
+						Inconsistent mappings are normally converted as single arm mappings 
+						with no mate information provided. If the option is used map2sam will 
+						mate unique single arm mappings in SAM including those on different 
+						stands and chromosomes. To distinguish these "artificially" mated 
+						records a tag "XS:i:1" is used. The MAPQ provided for these records is 
+						a single arm mapping weight.
+		
+			--add-unmapped-mate-info 
+						works like add-mate-sequence, but is applied to inconsistent mappings 
+						only
+		
+			--primary-mappings-only 
+						report only the best mappings
+		
+			--consistent-mapping-range arg (=1300)
+						limit the maximum distance between consistent mates
+		
+		
+		SUPPORTED FORMAT_VERSION
+				0.3 or later
+  </help>
+</tool>