diff assembly_stats_txt.xml @ 0:67b2a782bcfc default tip

Migrated tool version 1.0.1 from old tool shed archive to new tool shed repository
author konradpaszkiewicz
date Tue, 07 Jun 2011 15:48:22 -0400
parents
children
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/assembly_stats_txt.xml	Tue Jun 07 15:48:22 2011 -0400
@@ -0,0 +1,52 @@
+<tool id="assemblystats" name="assemblystats" version="1.0.1">
+	<description>Summarise an assembly (e.g. N50 metrics)</description>
+	<command interpreter="python">
+	  assembly_stats_txt.py 
+           '$type' '$stats.extra_files_path'
+           '$type'
+           '$bucket'
+	   '$input'
+   	    '$stats'
+    '$sortedcontigs'
+    '$histogrampng' 
+    '$summedcontigspng'
+    '$histogramdata' 
+    '$summedcontigdata' 
+
+	</command>
+        <inputs>
+          <param label="Type of read" name="type" type="select" help="Is this from an genomic (contig) or transcriptomic assembly (isotig) or are these raw reads (read)">
+                        <option value="contig" selected="yes">Contig (if from genomic assembly)</option>
+                        <option value="isotig">Isotig (if from transcriptomic assembly)</option>
+			<option value="read">Raw reads from sequencer in FASTA format (useful for 454 data)</option>
+
+          </param>
+          <param name="bucket" type="boolean" label="Output histogram with bin sizes=1" truevalue="-b" falsevalue="" help="Use this to specify whether or not bin sizes of 1 should be used when plotting histograms"/>
+	 <param format="fasta" name="input" type="data" label="Source file in FASTA format"/>
+
+        </inputs>
+	<outputs>
+		 <data format="tabular" name="stats" label="Assembly statistics"/>
+		 <data format="fasta" name="sortedcontigs" label="Sorted contigs" />
+		<data format="png" name="histogrampng" label="Histogram of contig sizes"/>
+		<data format="png" name="summedcontigspng" label="Cumulative sum of contig sizes"/>
+		<data format="tabular" name="histogramdata" label="Histogram data"/>
+		<data format="tabular" name="summedcontigdata" label="Cumulative sum of contig size data"/>
+	</outputs>
+	<requirements>
+	</requirements>
+	<help>
+**Summarise assembly overview** 
+
+This script is used to give summary statistics of an assembly or set of reads. Typically this is run after an assembly to evaluate gross features.
+
+
+# Gives back
+# - N50
+# - num of contigs > 1 kb
+# - num of contigs
+# - Read or Contig Histogram and graphs.
+# - Summed contig length (by number of contigs, in sorted order)
+	</help>
+
+</tool>