changeset 18:a47f03c50780 draft

Uploaded
author nikos
date Tue, 09 Sep 2014 10:28:01 -0400
parents 0847315fa035
children fc7f090fd00b
files bedClip.sh bedClip.xml bedExtendRanges.xml bigWigSummary.xml bigwig2summary.sh bigwig2summary.xml faCount.xml test-data/.DS_Store test-data/._.DS_Store test-data/1.bed test-data/1.bigwig test-data/1.fasta test-data/1.tabular test-data/1.txt test-data/2.bed test-data/2.tabular test-data/3.bed test-data/3.tabular test-data/4.bed test-data/4.tabular test-data/test-data/1.fasta test-data/test-data/3.tabular test-data/test-data/4.tabular tool_dependencies.xml
diffstat 24 files changed, 151 insertions(+), 596 deletions(-) [+]
line wrap: on
line diff
--- a/bedClip.sh	Tue Sep 09 10:22:40 2014 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,3 +0,0 @@
-#!/bin/bash
-
-bedClip $1 <(fetchChromSizes $2 2> /dev/null) $3
--- a/bedClip.xml	Tue Sep 09 10:22:40 2014 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,65 +0,0 @@
-<tool id="bedClip" name="bedClip">
-    <description> Remove lines from bed file that refer to off-chromosome places.</description>
-    <requirements>
-        <requirement type="package" version="1.0">fetchChromSizes</requirement>
-        <requirement type="package" version="1.0">bedClip</requirement>
-    </requirements>
-    <command interpreter="bash"> 
-	## Set genome assembly 
-
-	#set $Genome = str( $genome_cond.genome )
-	#if str( $genome_cond ) == 'OTHER':
-		#set $Genome = str( $genome_cond.genome_other )
-	#end if
-	
-	bedClip.sh $input $Genome $output
-    </command>
-    <inputs>
-        <param name="input" type="data" format="bed" label="Input"/>
-        <conditional name="genome_cond">
-	    <param name="genome" type="select" label="Genome Assembly">
-        	<option value="hg19">Human (Homo sapiens): hg19</option>
-	        <option value="hg18">Human (Homo sapiens): hg18</option>
-        	<option value="mm10">Mouse (Mus musculus): mm10</option>
-	        <option value="mm9">Mouse (Mus musculus): mm9</option>
-        	<option value="ce10">C. elegans: ce10</option>
-	        <option value="ce6">C. elegans: ce6</option>
-        	<option value="dm3">D. melanogaster: dm3</option>
-	        <option value="OTHER">Other</option>
-            </param>
-	    <when value="OTHER">
-        	<param name="genome_other" type="text" label="Other genome assemly"/>
-      	    </when>
-	    <when value="hg19" type="text" />
-      	    <when value="hg18" type="text" />
-      	    <when value="mm10" type="text" />
-      	    <when value="mm9" type="text" />
-	    <when value="ce10" type="text" />
-	    <when value="ce6" type="text" />
-	    <when value="dm3" type="text" />
-	</conditional>
-
-    </inputs>
-  
-    <outputs>
-        <data format="input" name="output"/> 
-    </outputs>
-    
-    <tests>
-        <test>
-            <param name="input" value="3.bed" />
-            <param name="genome" value="hg19" />
-            <output name="output" file="1.bed" />
-        </test>
-    </tests>
-
-    <help>
-**What it does**
-bedClip - Remove lines from bed file that refer to off-chromosome places.
-
-**Usage**
-
-  bedClip input.bed chrom.sizes output.bed
-
-    </help>
-</tool>
--- a/bedExtendRanges.xml	Tue Sep 09 10:22:40 2014 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,82 +0,0 @@
-<tool id="bedExtendRanges" name="bedExtendRanges">
-    <description> Extend length of entries in bed 6+. </description>
-    <requirements>
-        <requirement type="package" version="1.0">bedExtendRanges</requirement>
-    </requirements>
-    <command> 
-	## Set genome assembly 
-
-	#set $Genome = str( $genome_cond.genome )
-	#if str( $genome_cond ) == 'OTHER':
-		#set $Genome = str( $genome_cond.genome_other )
-	#end if
-	
-	bedExtendRanges -user=genome -host=genome-mysql.cse.ucsc.edu $Genome $length $input 2> /dev/null > $output
-    </command>
-    <inputs>
-        <param name="input" type="data" format="bed" label="Input"/>
-        <conditional name="genome_cond">
-            <param name="genome" type="select" label="Genome Assembly (-g)">
-	        <option value="hg19">Human (Homo sapiens): hg19</option>
-        	<option value="hg18">Human (Homo sapiens): hg18</option>
-	        <option value="mm10">Mouse (Mus musculus): mm10</option>
-        	<option value="mm9">Mouse (Mus musculus): mm9</option>
-        	<option value="ce10">C. elegans: ce10</option>
-	        <option value="ce6">C. elegans: ce6</option>
-	        <option value="dm3">D. melanogaster: dm3</option>
-        	<option value="OTHER">Other</option>
-            </param>
-            <when value="OTHER">
-      		<param name="genome_other" type="text" label="Other genome assemly"/>
-            </when>
-      	    <when value="hg19" type="text" />
-            <when value="hg18" type="text" />
-      	    <when value="mm10" type="text" />
-            <when value="mm9" type="text" />
-            <when value="ce10" type="text" />
-            <when value="ce6" type="text" />
-            <when value="dm3" type="text" />
-    	</conditional>
-        <param name="length" type="integer" value="0" label="Length extension (base-pairs)" />
-
-    </inputs>
-  
-    <outputs>
-        <data format="input" name="output"/> 
-    </outputs>
-
-    <tests>
-	<test>
-	    <param name="input" value="2.bed" />
-	    <param name="genome" value="hg19" />
-	    <param name="length" value="5000" />
-	    <output name="output" file="4.bed" />
-	</test>
-    </tests>
-
-    <help>
-
-**What it does**
-
-bedExtendRanges_ - extend length of entries in bed 6+ data to be at least the given length,
-taking strand directionality into account.
-
-.. _bedExtendRanges: http://hgdownload.cse.ucsc.edu/admin/exe/linux.x86_64/bedExtendRanges
-
-**Usage**
-
-   bedExtendRanges database length files(s)
-
-**Example**
-
-  * bedExtendRanges -user=genome -host=genome-mysql.cse.ucsc.edu hg18 250 stdin
-
-  will transform:
-    chr1 500 525 . 100 +
-    chr1 1000 1025 . 100 -
-  to:
-    chr1 500 750 . 100 +
-    chr1 775 1025 . 100 -
-
-    </help>
-</tool>
--- a/bigWigSummary.xml	Tue Sep 09 10:22:40 2014 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,43 +0,0 @@
-<tool id="bigWigSummary" name="bigWigSummary">
-    <description> Extract summary information from a bigWig file. </description>
-    <command> 
-	bigWigSummary $input $chrom $start $end $dataPoints -type=$type> $output
-    </command>
-    <inputs>
-        <param name="input" type="data" format="bigwig" label="Input"/>
-        <param name="chrom" type="text" value="chr" label="Chromosome" help="E.g. 'chr7'"/>
-        <param name="start" type="integer" value="" label="Start coordinate" help="BED format (0-based)."/>
-        <param name="end" type="integer" value="" label="End coordinate" help="BED format (0-based)."/>    
-        <param name="dataPoints" type="integer" value="1" label="Number of (equal) parts to break down the selected region."  help="Choose 1 for simple summary."/>
-        <param name="type" type="select" label="Operation">
-	    <option value="mean">Average value in region (default)</option>
-            <option value="min">Minimum value in region</option>
-            <option value="max">Maximum value in region</option>
-            <option value="std">Standard deviation in region</option>
-            <option value="coverage">Percentage of region that is covered</option>
-        </param>
-    </inputs>
-  
-    <outputs>
-        <data format="text" name="output"/> 
-    </outputs>
-
-    <tests>
-	<test>
-	    <param name="input" value="1.bigwig" />
-	    <param name="chrom" value="chr21" />
-	    <param name="start" value="10000000" />
-            <param name="end" value="50000000" />
-	    <param name="dataPoints" value="3" />
-	    <param name="type" value="std" />
-	    <output name="output" file="1.txt" />
-	</test>
-    </tests>
-    <help>
-
-**Usage**
-  * bigWigSummary file.bigWig chrom start end dataPoints
-  * Get summary data from bigWig for indicated region, broken into dataPoints equal parts.  (Use dataPoints=1 for simple summary.)
-
-    </help>
-</tool>
--- a/bigwig2summary.sh	Tue Sep 09 10:22:40 2014 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,131 +0,0 @@
-#!/bin/bash
-# $Id: bigwig2summary_stdout 34 2014-02-20 08:31:20Z jens $
-
-#USE IN GALAXY
-#This script extract summary values (mean, min, max, std or coverage) from a bigwig file for a number of equal sized bins across genomic regions given in bed file.
-#If the bed file contains 6 columns (or more), column 6 is expected to contain strand information. Summary values from a negative strand will be reversed.
-
-########################################
-#bigwigSummary has 3 non-standard outputs:
-#1) n/a #(no data in bin)
-#2) no data #(no data in entire region)
-#3) <number> is not a valid option (typically if negative coordinate)
-
-#Default settings & input parsing. "" indicates required user input.
-nbins=1
-rm_header_line=0
-summary_type=mean
-
-#parse input
-while getopts hef:b:o:n:t: myarg
-do	case "$myarg" in
-	h)	echo "Usage: bigwig2summary_stdout -f <BIGWIG_FILE> -b <BED_FILE> -o <ASSEMBLY> -n <NUMBER OF BINS> -t <SUMMARY TYPE> -e"
-	        echo "Corrects for strand if bed-file has 6 columns or more. Col 6 assumed to contain strand infomation"
-		exit ;;
-	f)	bigwig_file="$OPTARG" ;;
-	b)	bed_file="$OPTARG" ;; #must be tab separated without header
-	o)	org_assembly="$OPTARG" ;;
-	n)	nbins="$OPTARG" ;;
-	t)	summary_type="$OPTARG" ;;
-	e)	rm_header_line=2 ;; #flag. if -e then first line is removed
-	[?])	echo "Usage: bigwig2summary_stdout -f <BIGWIG_FILE> -b <BED_FILE> -o <ASSEMBLY> -n <NUMBER OF BINS> -t <SUMMARY TYPE> -e"
-	        echo "Corrects for strand if bed-file has 6 columns or more. Col 6 assumed to contain strand infomation"
-		exit 1 ;;
-	esac
-done
-
-###################################################
-###VALIDATE INPUT
-###################################################
-
-#get chromosome sizes from bigwig file. bigwig file does not contain name of genome assembly.
-org_assembly_file=`mktemp -u`
-fetchChromSizes $org_assembly 2>/dev/null > $org_assembly_file
-if [ $? -ne 0 ]; then 
-  echo "ERROR: Organism genome assembly does not exist" 
-  rm $org_assembly_file
-  exit
-fi
-
-#check input bed_file. bedClip only checks first 3 columns!
-if [ `bedClip -verbose=2 <(tail -n +${rm_header_line} $bed_file) $org_assembly_file /dev/null 2>&1 | wc -l` -gt 0 ]; then
-  echo -e "ERROR: Input bed file is not in proper format!\nTry 'bedClip' to find lines causing error"
-  echo "Make sure that bigwig and bed files are using the same genome assembly"
-  exit 1
-fi
-
-#make string of "nbins" 0's to insert in regions, where no reads are found
-if [ $nbins -gt 1 ]; then
-  seq_string=`seq 1 $nbins`
-  zero_string=`printf "0\t%.s" {$seq_string} | perl -pe "s/\t$//"` 
-fi
-
-#make sure the given summary type exists
-if [ `echo $summary_type | egrep "(mean|max|min|std|coverage)" | wc -l` -ne 1 ]; then
-  echo "ERROR: Summary type must be: mean, max, min, std or coverage. Default is 'mean'"
-  exit 1
-fi
-
-#determine number of fields in bed_file
-if [ `tail -n +${rm_header_line} $bed_file | awk '{print NF}' | uniq | wc -l` -eq 1 ]; then
-  nfields_bed=`tail -n +${rm_header_line} $bed_file | awk '{print NF}' | uniq`
-else
-  echo "ERROR: Bed file does not have constant number of line columns"
-  exit 1
-fi  
-
-if [[ $nbins -gt 1 && $nfields_bed -ge 6 ]]; then
-  strand_uniq_chars=`tail -n +${rm_header_line} $bed_file | cut -f6 | sort -u | perl -pe "s/\n//"`
-  if [[ $strand_uniq_chars != "+-" && $strand_uniq_chars != "-+" ]] ; then
-    echo "ERROR: Column 6 in bed file must only contain '+' or '-' characters"
-    exit 1
-  fi
-fi 
-
-###################################################
-###EXTRACT DENSITIES FROM NORMALIZED BIGWIG FILE
-###################################################
-
-
-#if more than 1 bin AND >= 6 fields (i.e. has strand column)
-if [[ $nbins -gt 1 && $nfields_bed -ge 6 ]]; then
-
-  #cut columns 1-3+6 | rm header if flag set
-  cut -f1-3,6 $bed_file | tail -n +${rm_header_line} | while read -r line; do
-  
-    #read 4 fields into variables
-    read -r cur_chr cur_start cur_end cur_strand <<<"$line"
-    #run bigWigSummary. Combine stdout and stderr | treat exceptions and errors after 'done'
-    bigWigSummary $bigwig_file $cur_chr $cur_start $cur_end $nbins -type=${summary_type} 2>&1 | perl -pe "s/no data.+$/${zero_string}/" | awk 'BEGIN{OFS="\t"}{ if("'"$cur_strand"'"=="-") { for (i=NF; i>0; i--) { printf("%s\t",$i) } printf("\n") } else { print $0 } }'
-  done | perl -pe "s/n\/a/0/g" | perl -pe "s/^\t?0\t?$/${zero_string}/" | perl -pe "s/ +/\t/g"  | perl -pe "s/\t$//" |  sed '/^$/d'
-
-#if more than 1 bin AND less than 6 fields (i.e. no strand column)
-elif [[ $nbins -gt 1 && $nfields_bed -lt 6 ]]; then
-
-  #cut columns 1-3 | rm header if flag set
-  cut -f1-3 $bed_file | tail -n +${rm_header_line} | while read -r line; do
-  
-    #read 3 fields into variables
-    read -r cur_chr cur_start cur_end <<<"$line"
-    #run bigWigSummary. Combine stdout and stderr | treat exceptions and errors after 'done'
-    bigWigSummary $bigwig_file $cur_chr $cur_start $cur_end $nbins -type=${summary_type} 2>&1 
-  
-  done | perl -pe "s/n\/a/0/g" | perl -pe "s/no data.+$/${zero_string}/" | perl -pe "s/^\t?0\t?$/${zero_string}/" | perl -pe "s/ +/\t/g" | sed '/^$/d'
-
-
-#if 1 bin. Strand column irrelevant 
-else
-
-  cut -f1-3 $bed_file | tail -n +${rm_header_line} | while read -r line; do
-  
-    read -r cur_chr cur_start cur_end <<<"$line"
-    bigWigSummary $bigwig_file $cur_chr $cur_start $cur_end 1 -type=${summary_type} 2>&1
-    
-  done | perl -pe "s/no data.+$/0/" | perl -pe "s/n\/a/0/g" | sed '/^$/d'
-  
-fi 
-  
-
-
-  
-  
--- a/bigwig2summary.xml	Tue Sep 09 10:22:40 2014 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,106 +0,0 @@
-<tool id="bigwig2_summary" name="bigWig2Summary">
-    <description> Extract summary information from a bigWig file across multiple genomic regions specified by the user. </description>
-    <requirements>
-        <requirement type="package" version="1.0">bigWigSummary</requirement>
-        <requirement type="package" version="1.0">fetchChromSizes</requirement>
-        <requirement type="package" version="1.0">bedClip</requirement>
-    </requirements>
-    <command interpreter="bash"> 
-	bigwig2summary.sh -f $input_bw -b $input_bed -n $bins -o $assembly -t $type $header > $output
-    </command>
-    <inputs>
-        <param name="input_bw" type="data" format="bigwig" label="Extract summary from" help="bigWig format."/>
-        <param name="input_bed" type="data" format="tabular" label="using genomic regions in" help="TAB delimited BED-like file."/>
-        <param name="bins" type="integer" value="1" label="Number of bins" help="Postitive integer"/>
-        <param name="assembly" type="text" label="Orgamism assembly" help="E.g. hg19" />
-        <param name="header" type="boolean" checked="False" truevalue="-e" falsevalue=" " label="Does the genomic region file contain a header?" />    
-        <param name="type" type="select" label="Operation" help="">
-	    <option value="mean">Average value in region (default)</option>
-            <option value="min">Minimum value in region</option>
-            <option value="max">Maximum value in region</option>
-            <option value="std">Standard deviation in region</option>
-            <option value="coverage">Percentage of region that is covered</option>
-        </param>
-    </inputs>
-  
-    <outputs>
-        <data format="tabular" name="output"/> 
-    </outputs>
-
-    <tests>
-        <test>
-	    <param name="input_bw" value="1.bigwig" />
-	    <param name="input_bed" value="1.bed" />
-	    <param name="bins" value="3" />
-	    <param name="assembly" value="hg19" />
-	    <param name="header" value="true" />
-	    <output name="output" file="1.tabular" />
-        </test>
-        <test>
-            <param name="input_bw" value="1.bigwig" />
-            <param name="input_bed" value="2.bed" />
-            <param name="bins" value="5" />
-            <param name="assembly" value="hg19" />
-            <param name="header" value="true" />
-            <output name="output" file="2.tabular" />
-        </test>
-    </tests>
-
-    <help>
-
-This tool extracts summary values (mean, min, max, std or coverage) from a **bigWig** file for a number of equal sized bins across genomic regions given in an a "BED-like" file.
-
-The script this tool is based on is written by Jens Vilstrup Johansen and uses bigWigSummary_, bedClip_ and fetchChromSizes_.
-
-.. _bigWigSummary: http://hgdownload.cse.ucsc.edu/admin/exe/linux.x86_64/bigWigSummary 
-
-.. _bedClip: http://hgdownload.cse.ucsc.edu/admin/exe/linux.x86_64/bedClip
-
--- _fetchChromSizes: http://hgdownload.cse.ucsc.edu/admin/exe/linux.x86_64/fetchChromSizes
-
------
-
-.. class:: infomark
-
-The file contaning the genomic region must be TAB-delimited with at list 3 columns representing Chromosome, ChrStart and ChrEnd. If the file contains 6 columns (or more), column 6 is expected to contain strand information. Summary values from a negative strand will be reversed.
- 
------
-
-**Example 1**
-
-Input BED file::
-
-  chr19   50178708        50180708
-  chr6    90348174        90350174
-  chr16   58495848        58497848
-  chr5    180580242       180582242
-  chr9    120177017       120179017  
-
-Extract summary (*#* of bins = 3):: 
-
-  0		0		0
-  0.144886	0		0
-  0.507327	1.14649		1.38456
-  0.221471	0.144886	0.309857
-  0.348944	0.426638	0.244495
-
-**Example 2**
-
-Input BED file (with strand information)::
-
-  chr19	  50178708	50180708	NM_198318	0	+	PRMT1
-  chr6	  90348174	90350174	NM_020466	0	-	LYRM2
-  chr16	  58495848	58497848	NM_020465	0	+	NDRG4
-  chr5 	  180580242	180582242	NM_206880	0	+	OR2V2
-  chr9    120177017     120179017       NM_014010       0       -	ASTN2
-
-Extract summary (*#* of bins = 3)::
-
-  0		0		0
-  0		0		0.144886
-  0.507327	1.14649		1.38456
-  0.221471	0.144886	0.309857
-  0.244495	0.426638	0.348944
-
-    </help>
-</tool>
--- a/faCount.xml	Tue Sep 09 10:22:40 2014 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,78 +0,0 @@
-<tool id="faCount" name="faCount">
-    <description> Count base statistics and CpGs in FASTA files.</description>
-    <requirements>
-        <requirement type="package" version="1.0">faCount</requirement>
-    </requirements>
-    <command>
-	faCount $summary $dinuc $strands $input > $output
-    </command>
-
-    <inputs>
-	<param name="input" type="data" format="fasta" label="FASTA file" />
-	<param name="summary" type="boolean" checked="false" falsevalue="" truevalue="-summary" label="Show only summary statistics" />
-	<param name="dinuc" type="boolean" checked="false" falsevalue="" truevalue="-dinuc" label="Include statistics on dinucletoide frequencies" />
-	<param name="strands" type="boolean" checked="false" falsevalue="" truevalue="-strands" label="Count bases on both strands" />
-    </inputs>
-
-    <outputs>
-	<data format="tabular" name="output" />
-    </outputs>
-
-    <tests>
-	<test>
-	    <param name="input" value="1.fasta" />
-	    <output name="output" file="2.tabular" />
-	</test>
-	<test>
-	    <param name="input" value="1.fasta" />
-	    <param name="summary" value="true" />
-	    <param name="dinuc" value="true" />
-	    <param name="strands" value="true" />
-	    <output name="output" file="3.tabular" />
-    	</test>
-    </tests>
-
-    <help>
-**What it does**
-
-faCount_ - Count base statistics and CpGs in FA files.
-
-.. _faCount: http://hgdownload.cse.ucsc.edu/admin/exe/linux.x86_64/faCount
-
-**Usage**
-  
-faCount file(s).fa -summary -dinuc -strands
-
-**Examples**
-
-Example 1::
-
-  faCount 1.fasta
-
-  #seq		len	A	C	G	T	N	cpg
-  HSFAU1	515	125	138	146	106	0	23
-  HSFAU2	514	124	138	146	106	0	25
-  HSFAU3	518	125	139	149	105	0	25
-  HSFAU4	524	128	142	148	106	0	26
-  HSFAU5	518	124	138	147	109	0	25
-  total		2589	626	695	736	532	0	124
-
-Example 2::
-
-  faCount 1.fasta -summary
-
-  #seq		len	A	C	G	T	N	cpg
-  total		2589	626	695	736	532	0	124
-  prcnt		1.0  	0.2418	0.2684	0.2843	0.2055	0.0000	0.0479
-
-Example 3::
-
-  faCount 1.fasta -summary -strands
-  
-  #seq		len	A	C	G	T	N	cpg
-  total		5178	1158	1431	1431	1158	0	248
-  prcnt		1.0  	0.2236	0.2764	0.2764	0.2236	0.0000	0.0479
-
-    </help>
-
-</tool>
Binary file test-data/.DS_Store has changed
Binary file test-data/._.DS_Store has changed
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/1.bed	Tue Sep 09 10:28:01 2014 -0400
@@ -0,0 +1,5 @@
+chr19	50178708	50180708
+chr6	90348174	90350174
+chr16	58495848	58497848
+chr5	180580242	180582242
+chr9	120177017	120179017
Binary file test-data/1.bigwig has changed
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/1.fasta	Tue Sep 09 10:28:01 2014 -0400
@@ -0,0 +1,50 @@
+>HSFAU1
+ttcctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgc
+agctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcg
+cccagatcaaggctcatgtagcctcactggagggcattgccccggaagatcaagtcgtgc
+tcctggcaggccccctggaggatgaggccactctgggccagtgcggggtggaggccc
+tgactaccctggaagtagcaggccgcatgcttggaggtaaagttcatggttccctggccc
+gtgctggaaaagtgagaggtcagactcctaaggtggccaaacaggagaagaagaagaaga
+agacaggtcgggctaagcggcggatgcagtacaaccggcgctttgtcaacgttgtgccca
+cctttggcaagaagaagggccccaatgccaactcttaagtcttttgtaattctggctttc
+tctaataaaaaagccacttagttcagtcaaaaaaaaaa
+>HSFAU2
+ttcctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgc
+agctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcg
+cccagatcaaggctcatgtagcctcactggagggcattgccccggaagatcaagtcgtgc
+tcctggcaggcgcgcccctggaggatgcactctgggccagtgcggggtggaggccc
+tgactaccctggaagtagcaggccgcatgcttggaggtaaagttcatggttccctggccc
+gtgctggaaaagtgagaggtcagactcctaaggtggccaaacaggagaagaagaagaaga
+agacaggtcgggctaagcggcggatgcagtacaaccggcgctttgtcaacgttgtgccca
+cctttggcaagaagaagggccccaatgccaactcttaagtcttttgtaattctggctttc
+tctaataaaaaagccacttagttcagtcaaaaaaaaaa
+>HSFAU3
+ttcctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgc
+agctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcg
+cccagatcaaggctcatgtagcctcactggagggcattgccccggaagatcaagtcgtgc
+tcctggcaggcgcgcccctggaggatgaggccactctgggccagtgcggggtggaggccc
+tgactaccctggaagtagcaggccgcatgcttggaggtaaagttcatggttccctggccc
+gtgctggaaaagtgagaggtcagactcctaagggggccaaacaggagaagaagaagaaga
+agacaggtcgggctaagcggcggatgcagtacaaccggcgctttgtcaacgttgtgccca
+cctttggcaagaagaagggccccaatgccaactcttaagtcttttgtaattctggctttc
+tctaataaaaaagccacttagttcagtcaaaaaaaaaa
+>HSFAU4
+ttcctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgc
+agctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcg
+cccagatcaaggctcatgaaatagcctcactggagggcattgccccggaagatcaagtcgtgc
+tcctggcaggcgcgcccctggaggatgaggccactctgggccagtgcggggtggaggccc
+tgactaccctggaagtagcaggccgcatgcttgcccgaggtaaagttcatggttccctggccc
+gtgctggaaaagtgagaggtcagactcctaaggtggccaaacaggagaagaagaagaaga
+agacaggtcgggctaagcggcggatgcagtacaaccggcgctttgtcaacgttgtgccca
+cctttggcaagaagaagggccccaatgccaactcttaagtcttttgtaattctggctttc
+tctaataaaaaagccacttagttcagtcaaaaaaaaaa
+>HSFAU5
+ttcctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgc
+agctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcg
+cccagatcaaggctcatgtagcctcactggagggcattgccccggaagatcaagtcgtgc
+tcctggcaggcgcgcccctggaggatgaggccactctgggccagtgcggggtggaggccc
+tgactaccctggaagtaggccgcatgctttttggaggtaaagttcatggttccctggccc
+gtgctggaaaagtgagaggtcagactcctaaggtggccaaacaggagaagaagaagaaga
+agacaggtcgggctaagcggcggatgcagtacaaccggcgctttgtcaacgttgtgccca
+cctttggcaagaagaagggccccaatgccaactcttaagtcttttgtaattctggctttc
+tctaataaaaaagccacttagttcagtcaaaaaaaaaa
\ No newline at end of file
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/1.tabular	Tue Sep 09 10:28:01 2014 -0400
@@ -0,0 +1,4 @@
+0.144886	0	0
+0.507327	1.14649	1.38456
+0.221471	0.144886	0.309857
+0.348944	0.426638	0.244495
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/1.txt	Tue Sep 09 10:28:01 2014 -0400
@@ -0,0 +1,1 @@
+0.796113	0.273952	0.437672
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/2.bed	Tue Sep 09 10:28:01 2014 -0400
@@ -0,0 +1,5 @@
+chr19	50178708	50180708	NM_198318	0	+	PRMT1
+chr6	90348174	90350174	NM_020466	0	-	LYRM2
+chr16	58495848	58497848	NM_020465	0	+	NDRG4
+chr5	180580242	180582242	NM_206880	0	+	OR2V2
+chr9	120177017	120179017	NM_014010	0	-	ASTN2
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/2.tabular	Tue Sep 09 10:28:01 2014 -0400
@@ -0,0 +1,4 @@
+0	0	0	0.144886	0
+0.396878	0.970009	1.1091	1.17538	1.40612
+0.203829	0.21262	0.144886	0.409996	0.274558
+0.180424	0.430989	0.458898	0.35171	0.307157
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/3.bed	Tue Sep 09 10:28:01 2014 -0400
@@ -0,0 +1,7 @@
+chr19	50178708	50180708
+chr21	48119895	48139895
+chr6	90348174	90350174
+chr16	58495848	58497848
+chr5	180580242	180582242
+chr17	81194210	81196210
+chr9	120177017	120179017  
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/3.tabular	Tue Sep 09 10:28:01 2014 -0400
@@ -0,0 +1,7 @@
+#seq	len	A	C	G	T	N	cpg
+HSFAU1	515	125	138	146	106	0	23
+HSFAU2	514	124	138	146	106	0	25
+HSFAU3	518	125	139	149	105	0	25
+HSFAU4	524	128	142	148	106	0	26
+HSFAU5	518	124	138	147	109	0	25
+total	2589	626	695	736	532	0	124
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/4.bed	Tue Sep 09 10:28:01 2014 -0400
@@ -0,0 +1,5 @@
+chr19 50178708 50183708 NM_198318 0 + PRMT1
+chr6 90345174 90350174 NM_020466 0 - LYRM2
+chr16 58495848 58500848 NM_020465 0 + NDRG4
+chr5 180580242 180585242 NM_206880 0 + OR2V2
+chr9 120174017 120179017 NM_014010 0 - ASTN2
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/4.tabular	Tue Sep 09 10:28:01 2014 -0400
@@ -0,0 +1,3 @@
+#seq	len	A	C	G	T	N	cpg	AA	AC	AG	AT	CA	CC	CG	CT	GA	GC	GG	GT	TA	TC	TG	TT
+total	5178	1158	1431	1431	1158	0	248	360	238	408	142	328	447	248	408	320	426	447	238	150	320	328	360
+prcnt	1.0  	0.2236	0.2764	0.2764	0.2236	0.0000	0.0479	0.0695	0.0460	0.0788	0.0274	0.0633	0.0863	0.0479	0.0788	0.0618	0.0823	0.0863	0.0460	0.0290	0.0618	0.0633	0.0695
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test-data/1.fasta	Tue Sep 09 10:28:01 2014 -0400
@@ -0,0 +1,50 @@
+>HSFAU1
+ttcctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgc
+agctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcg
+cccagatcaaggctcatgtagcctcactggagggcattgccccggaagatcaagtcgtgc
+tcctggcaggccccctggaggatgaggccactctgggccagtgcggggtggaggccc
+tgactaccctggaagtagcaggccgcatgcttggaggtaaagttcatggttccctggccc
+gtgctggaaaagtgagaggtcagactcctaaggtggccaaacaggagaagaagaagaaga
+agacaggtcgggctaagcggcggatgcagtacaaccggcgctttgtcaacgttgtgccca
+cctttggcaagaagaagggccccaatgccaactcttaagtcttttgtaattctggctttc
+tctaataaaaaagccacttagttcagtcaaaaaaaaaa
+>HSFAU2
+ttcctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgc
+agctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcg
+cccagatcaaggctcatgtagcctcactggagggcattgccccggaagatcaagtcgtgc
+tcctggcaggcgcgcccctggaggatgcactctgggccagtgcggggtggaggccc
+tgactaccctggaagtagcaggccgcatgcttggaggtaaagttcatggttccctggccc
+gtgctggaaaagtgagaggtcagactcctaaggtggccaaacaggagaagaagaagaaga
+agacaggtcgggctaagcggcggatgcagtacaaccggcgctttgtcaacgttgtgccca
+cctttggcaagaagaagggccccaatgccaactcttaagtcttttgtaattctggctttc
+tctaataaaaaagccacttagttcagtcaaaaaaaaaa
+>HSFAU3
+ttcctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgc
+agctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcg
+cccagatcaaggctcatgtagcctcactggagggcattgccccggaagatcaagtcgtgc
+tcctggcaggcgcgcccctggaggatgaggccactctgggccagtgcggggtggaggccc
+tgactaccctggaagtagcaggccgcatgcttggaggtaaagttcatggttccctggccc
+gtgctggaaaagtgagaggtcagactcctaagggggccaaacaggagaagaagaagaaga
+agacaggtcgggctaagcggcggatgcagtacaaccggcgctttgtcaacgttgtgccca
+cctttggcaagaagaagggccccaatgccaactcttaagtcttttgtaattctggctttc
+tctaataaaaaagccacttagttcagtcaaaaaaaaaa
+>HSFAU4
+ttcctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgc
+agctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcg
+cccagatcaaggctcatgaaatagcctcactggagggcattgccccggaagatcaagtcgtgc
+tcctggcaggcgcgcccctggaggatgaggccactctgggccagtgcggggtggaggccc
+tgactaccctggaagtagcaggccgcatgcttgcccgaggtaaagttcatggttccctggccc
+gtgctggaaaagtgagaggtcagactcctaaggtggccaaacaggagaagaagaagaaga
+agacaggtcgggctaagcggcggatgcagtacaaccggcgctttgtcaacgttgtgccca
+cctttggcaagaagaagggccccaatgccaactcttaagtcttttgtaattctggctttc
+tctaataaaaaagccacttagttcagtcaaaaaaaaaa
+>HSFAU5
+ttcctctttctcgactccatcttcgcggtagctgggaccgccgttcagtcgccaatatgc
+agctctttgtccgcgcccaggagctacacaccttcgaggtgaccggccaggaaacggtcg
+cccagatcaaggctcatgtagcctcactggagggcattgccccggaagatcaagtcgtgc
+tcctggcaggcgcgcccctggaggatgaggccactctgggccagtgcggggtggaggccc
+tgactaccctggaagtaggccgcatgctttttggaggtaaagttcatggttccctggccc
+gtgctggaaaagtgagaggtcagactcctaaggtggccaaacaggagaagaagaagaaga
+agacaggtcgggctaagcggcggatgcagtacaaccggcgctttgtcaacgttgtgccca
+cctttggcaagaagaagggccccaatgccaactcttaagtcttttgtaattctggctttc
+tctaataaaaaagccacttagttcagtcaaaaaaaaaa
\ No newline at end of file
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test-data/3.tabular	Tue Sep 09 10:28:01 2014 -0400
@@ -0,0 +1,7 @@
+#seq	len	A	C	G	T	N	cpg
+HSFAU1	515	125	138	146	106	0	23
+HSFAU2	514	124	138	146	106	0	25
+HSFAU3	518	125	139	149	105	0	25
+HSFAU4	524	128	142	148	106	0	26
+HSFAU5	518	124	138	147	109	0	25
+total	2589	626	695	736	532	0	124
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test-data/4.tabular	Tue Sep 09 10:28:01 2014 -0400
@@ -0,0 +1,3 @@
+#seq	len	A	C	G	T	N	cpg	AA	AC	AG	AT	CA	CC	CG	CT	GA	GC	GG	GT	TA	TC	TG	TT
+total	5178	1158	1431	1431	1158	0	248	360	238	408	142	328	447	248	408	320	426	447	238	150	320	328	360
+prcnt	1.0  	0.2236	0.2764	0.2764	0.2236	0.0000	0.0479	0.0695	0.0460	0.0788	0.0274	0.0633	0.0863	0.0479	0.0788	0.0618	0.0823	0.0863	0.0460	0.0290	0.0618	0.0633	0.0695
--- a/tool_dependencies.xml	Tue Sep 09 10:22:40 2014 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,88 +0,0 @@
-<?xml version="1.0"?>
-<tool_dependency>
-    <package name="bigWigSummary" version="1.0">
-        <install version="1.0">
-            <actions>
-                <action type="download_by_url">http://hgdownload.soe.ucsc.edu/admin/exe/linux.x86_64/bigWigSummary</action>
-	        <action type="move_directory_files">
-        	    <source_directory>.</source_directory>
-        	    <destination_directory>$INSTALL_DIR</destination_directory>
-        	</action>
-                <action type="chmod"><file mode="755">$INSTALL_DIR/bigWigSummary</file></action>
-		<action type="set_environment">
-                    <environment_variable name="PATH" action="prepend_to">$INSTALL_DIR</environment_variable>
-                </action>
-	    </actions>
-        </install>
-        <readme>
-        </readme>
-    </package>
-    <package name="bedClip" version="1.0">
-        <install version="1.0">
-            <actions>
-                <action type="download_by_url">http://hgdownload.soe.ucsc.edu/admin/exe/linux.x86_64/bedClip</action>
-                <action type="move_directory_files">
-                    <source_directory>.</source_directory>
-                    <destination_directory>$INSTALL_DIR</destination_directory>
-                </action>
-                <action type="chmod"><file mode="755">$INSTALL_DIR/bedClip</file></action>
-                <action type="set_environment">
-                    <environment_variable name="PATH" action="prepend_to">$INSTALL_DIR</environment_variable>
-                </action>
-            </actions>
-        </install>
-        <readme>
-        </readme>
-    </package>
-    <package name="bedExtendRanges" version="1.0">
-        <install version="1.0">
-            <actions>
-                <action type="download_by_url">http://hgdownload.soe.ucsc.edu/admin/exe/linux.x86_64/bedExtendRanges</action>
-                <action type="move_directory_files">
-                    <source_directory>.</source_directory>
-                    <destination_directory>$INSTALL_DIR</destination_directory>
-                </action>
-                <action type="chmod"><file mode="755">$INSTALL_DIR/bedExtendRanges</file></action>
-                <action type="set_environment">
-                    <environment_variable name="PATH" action="prepend_to">$INSTALL_DIR</environment_variable>
-                </action>
-            </actions>
-        </install>
-        <readme>
-        </readme>
-    </package>
-    <package name="faCount" version="1.0">
-	<install version="1.0">
-	    <actions>
-		<action type="download_by_url">http://hgdownload.soe.ucsc.edu/admin/exe/linux.x86_64/faCount</action>
-		<action type="move_directory_files">
-		    <source_directory>.</source_directory>
-		    <destination_directory>$INSTALL_DIR</destination_directory>
-	        </action>
-		<action type="chmod"><file mode="755">$INSTALL_DIR/faCount</file></action>
-		<action type="set_environment">
-		     <environment_variable name="PATH" action="prepend_to">$INSTALL_DIR</environment_variable>
-                </action>
-	    </actions>
-	</install>
-	<readme>
-	</readme>
-    </package>
-    <package name="fetchChromSizes" version="1.0">
-        <install version="1.0">
-            <actions>
-                <action type="download_by_url">http://hgdownload.soe.ucsc.edu/admin/exe/linux.x86_64/fetchChromSizes</action>
-                <action type="move_directory_files">
-                    <source_directory>.</source_directory>
-                    <destination_directory>$INSTALL_DIR</destination_directory>
-                </action>
-		<action type="chmod"><file mode="755">$INSTALL_DIR/fetchChromSizes</file></action>
-                <action type="set_environment">
-                    <environment_variable name="PATH" action="prepend_to">$INSTALL_DIR</environment_variable>
-                </action>
-            </actions>
-        </install>
-        <readme>
-        </readme>
-    </package>
-</tool_dependency>