Mercurial > repos > jjohnson > snpsift

--- a/snpEff_macros.xml	Thu Oct 23 06:06:25 2014 -0500
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,32 +0,0 @@
-<macros>
-    <xml name="requirements">
-        <requirements>
-            <requirement type="package" version="4.0">snpEff</requirement>
-        </requirements>
-    </xml>
-  <xml name="stdio">
-    <stdio>
-        <exit_code range=":-1"  level="fatal" description="Error: Cannot open file" />
-        <exit_code range="1:"  level="fatal" description="Error" />
-    </stdio>
-  </xml>
-  <token name="@EXTERNAL_DOCUMENTATION@">
-
-For details about this tool, please go to:
-	http://snpeff.sourceforge.net/SnpEff_manual.html
-
-  </token>
-  <token name="@CITATION_SECTION@">------
-
-**Citation**
-
-For the underlying tool, please cite the following two publications:
-
-SnpEff citation:
-"A program for annotating and predicting the effects of single nucleotide polymorphisms, SnpEff: SNPs in the genome of Drosophila melanogaster strain w1118; iso-2; iso-3.", Cingolani P, Platts A, Wang le L, Coon M, Nguyen T, Wang L, Land SJ, Lu X, Ruden DM. Fly (Austin). 2012 Apr-Jun;6(2):80-92. PMID: 22728672 [PubMed - in process]
-
-SnpSift citation:
-"Using Drosophila melanogaster as a model for genotoxic chemical mutational studies with a new program, SnpSift", Cingolani, P., et. al., Frontiers in Genetics, 3, 2012.
-
-  </token>
-</macros>
--- a/snpSift_annotate.xml	Thu Oct 23 06:06:25 2014 -0500
+++ b/snpSift_annotate.xml	Wed Dec 09 14:03:26 2015 -0500
@@ -1,13 +1,15 @@
-<tool id="snpSift_annotate" name="SnpSift Annotate" version="4.0.0">
+<tool id="snpSift_annotate" name="SnpSift Annotate" version="@WRAPPER_VERSION@.0">
     <description>SNPs from dbSnp</description>
     <!--
         You can change the amount of memory used, just change the -Xmx parameter (e.g. use -Xmx2G for 2Gb of memory)
     -->
+    <macros>
+        <import>snpSift_macros.xml</import>
+    </macros>
     <expand macro="requirements" />
-    <macros>
-        <import>snpEff_macros.xml</import>
-    </macros>
-    <command>
+    <expand macro="stdio" />
+    <expand macro="version_command" />
+    <command><![CDATA[
         java -Xmx6G -jar \$SNPEFF_JAR_PATH/SnpSift.jar $annotate_cmd
         #if $annotate.id :
           -id
@@ -15,6 +17,7 @@
           -info "$annotate.info_ids"
         #end if
         -q $dbSnp $input > $output
+]]>
     </command>
     <inputs>
         <param format="vcf" name="input" type="data" label="Variant input file in VCF format"/>
@@ -37,7 +40,6 @@
             </help>
             </param>
     </inputs>
-    <expand macro="stdio" />
     <outputs>
         <data format="vcf" name="output" />
     </outputs>
@@ -54,7 +56,7 @@
             </output>
         </test>
     </tests>
-    <help>
+    <help><![CDATA[

 This is typically used to annotate IDs from dbSnp.

@@ -95,6 +97,7 @@
 @CITATION_SECTION@


+]]>
     </help>
 </tool>
--- a/snpSift_caseControl.xml	Thu Oct 23 06:06:25 2014 -0500
+++ b/snpSift_caseControl.xml	Wed Dec 09 14:03:26 2015 -0500
@@ -1,13 +1,15 @@
-<tool id="snpSift_caseControl" name="SnpSift CaseControl" version="4.0.0">
+<tool id="snpSift_caseControl" name="SnpSift CaseControl" version="@WRAPPER_VERSION@.0">
     <description>Count samples are in 'case' and 'control' groups.</description>
     <!--
         You can change the amount of memory used, just change the -Xmx parameter (e.g. use -Xmx2G for 2Gb of memory)
     -->
+    <macros>
+        <import>snpSift_macros.xml</import>
+    </macros>
     <expand macro="requirements" />
-    <macros>
-        <import>snpEff_macros.xml</import>
-    </macros>
-    <command>
+    <expand macro="stdio" />
+    <expand macro="version_command" />
+    <command><![CDATA[
     java -Xmx1G -jar \$SNPEFF_JAR_PATH/SnpSift.jar caseControl -q
     #if $name.__str__.strip() != '':
       -name $name
@@ -18,6 +20,7 @@
       -tfam "$ctrl.tfam"
     #end if
     $input > $output
+]]>
     </command>
     <inputs>
         <param format="vcf" name="input" type="data" label="Variant input file in VCF format"/>
@@ -45,7 +48,6 @@
     <outputs>
         <data format="vcf" name="output" />
     </outputs>
-    <expand macro="stdio" />
     <tests>
         <test>
             <param name="input" ftype="vcf" value="test.private.01.vcf"/>
@@ -84,7 +86,7 @@
             </output>
         </test>
     </tests>
-    <help>
+    <help><![CDATA[

 **SnpSift CaseControl**

@@ -118,5 +120,6 @@

 @CITATION_SECTION@

+]]>
   </help>
 </tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/snpSift_extractFields.xml	Wed Dec 09 14:03:26 2015 -0500
@@ -0,0 +1,221 @@
+<tool id="snpSift_extractFields" name="SnpSift Extract Fields" version="@WRAPPER_VERSION@.0">
+    <options sanitize="False" />
+    <description>from a VCF file inot a tabular file</description>
+    <macros>
+        <import>snpSift_macros.xml</import>
+    </macros>
+    <expand macro="requirements" />
+    <expand macro="stdio" />
+    <expand macro="version_command" />
+    <command><![CDATA[
+        cat "$input"
+        #if $one_effect_per_line:
+          | \$SNPEFF_JAR_PATH/scripts/vcfEffOnePerLine.pl
+        #end if
+        | java -Xmx6G -jar \$SNPEFF_JAR_PATH/SnpSift.jar extractFields
+        #if $separator:
+          -s '$separator'
+        #end if
+        #if $empty_text:
+          -e '$empty_text'
+        #end if
+        -
+        #echo ' '.join(['"%s"' % x for x in $extract.split()])
+        > $output
+]]>
+    </command>
+    <inputs>
+        <param format="vcf" name="input" type="data" label="Variant input file in VCF format"/>
+        <param name="extract" type="text" label="Extract" size="160" help="Need help? See below a few examples." />
+        <param name="one_effect_per_line" type="boolean" truevalue="yes" falsevalue="no" checked="false" label="One effect per line" help="When variants have more than one effect, lists one effect per line, while all other parameters in the line are repeated across mutiple lines" />
+        <param name="separator" type="text" value="" optional="true" label="multiple field separator" size="1" help="Separate multiple fields in one column with this character, e.g. a comma, rather than a column for each of the multiple values">
+        </param>
+        <param name="empty_text" type="text" value="" optional="true" label="empty field text" size="10" help="Represent empty fields with this value, rather than leaving them blank" >
+        </param>
+    </inputs>
+    <outputs>
+        <data format="tabular" name="output" />
+    </outputs>
+    <tests>
+        <test>
+            <param name="input" ftype="vcf" value="test_rmInfo.vcf"/>
+            <param name="extract" value="CHROM POS REF ALT EFF[*].EFFECT"/>
+            <output name="output">
+                <assert_contents>
+                <has_text text="INTRAGENIC" />
+                <not_has_text text="DOWNSTREAM,INTRAGENIC,INTRON,UTR_3_PRIME" />
+                </assert_contents>
+            </output>
+        </test>
+
+        <test>
+            <param name="input" ftype="vcf" value="test_rmInfo.vcf"/>
+            <param name="extract" value="CHROM POS REF ALT EFF[*].EFFECT"/>
+            <param name="separator" value=","/>
+            <output name="output">
+                <assert_contents>
+		<has_text text="DOWNSTREAM,INTRAGENIC,INTRON,UTR_3_PRIME" />
+                </assert_contents>
+            </output>
+        </test>
+
+    </tests>
+    <help><![CDATA[
+
+**SnpSift Extract Fields**
+
+Extract fields from a VCF file to a TXT, tab separated format, that you can easily load in R, XLS, etc.
+
+http://snpeff.sourceforge.net/SnpSift.html#Extract
+
+You can also use sub-fields and genotype fields / sub-fields such as:
+
+  ::
+
+    Standard VCF fields:
+        CHROM
+        POS
+        ID
+        REF
+        ALT
+        FILTER
+    INFO fields:
+        AF
+        AC
+        DP
+        MQ
+        etc. (any info field available)
+    SnpEff 'ANN' fields:
+        "ANN[*].ALLELE" (alias GENOTYPE)
+        "ANN[*].EFFECT" (alias ANNOTATION): Effect in Sequence ontology terms (e.g. 'missense_variant', 'synonymous_variant', 'stop_gained', etc.)
+        "ANN[*].IMPACT:" { HIGH, MODERATE, LOW, MODIFIER }
+        "ANN[*].GENE:" Gene name (e.g. 'PSD3')
+        "ANN[*].GENEID:" Gene ID
+        "ANN[*].FEATURE
+        " ANN[*].FEATUREID (alias TRID: Transcript ID)
+        "ANN[*].BIOTYPE:" Biotype, as described by the annotations (e.g. 'protein_coding')
+        "ANN[*].RANK:" Exon or Intron rank (i.e. exon number in a transcript)
+        "ANN[*].HGVS_C" (alias HGVS_DNA, CODON): Variant in HGVS (DNA) notation
+        "ANN[*].HGVS_P" (alias HGVS, HGVS_PROT, AA): Variant in HGVS (protein) notation
+        "ANN[*].CDNA_POS" (alias POS_CDNA)
+        "ANN[*].CDNA_LEN" (alias LEN_CDNA)
+        "ANN[*].CDS_POS" (alias POS_CDS)
+        "ANN[*].CDS_LEN" (alias LEN_CDS)
+        "ANN[*].AA_POS" (alias POS_AA)
+        "ANN[*].AA_LEN" (alias LEN_AA)
+        "ANN[*].DISTANCE"
+        "ANN[*].ERRORS" (alias WARNING, INFOS)
+    SnpEff 'EFF' fields (this is for older SnpEff/SnpSift versions, new version use 'ANN' field):
+        "EFF[*].EFFECT"
+        "EFF[*].IMPACT"
+        "EFF[*].FUNCLASS"
+        "EFF[*].CODON"
+        "EFF[*].AA"
+        "EFF[*].AA_LEN"
+        "EFF[*].GENE"
+        "EFF[*].BIOTYPE"
+        "EFF[*].CODING"
+        "EFF[*].TRID"
+        "EFF[*].RANK"
+    SnpEff 'LOF' fields:
+        "LOF[*].GENE"
+        "LOF[*].GENEID"
+        "LOF[*].NUMTR"
+        "LOF[*].PERC"
+    SnpEff' NMD' fields:
+        "NMD[*].GENE"
+        "NMD[*].GENEID"
+        "NMD[*].NUMTR"
+        "NMD[*].PERC"
+
+
+Some examples:
+
+  - *Extracting chromosome, position, ID and allele frequency from a VCF file:*
+
+    **CHROM POS ID AF**
+
+    The result will look something like:
+
+      ::
+
+        #CHROM        POS        ID            AF
+        1             69134                    0.086
+        1             69496      rs150690004   0.001
+
+
+  - *Extracting genotype fields:*
+
+    **CHROM POS ID THETA GEN[0].GL[1] GEN[1].GL GEN[3].GL[*] GEN[*].GT**
+
+    This means to extract:
+
+      - CHROM POS ID: regular fields (as in the previous example)
+      - THETA : This one is from INFO
+      - GEN[0].GL[1] : Second likelihood from first genotype
+      - GEN[1].GL : The whole GL fiels (all entries without separating them)
+      - GEN[3].GL[*] : All likelihoods form genotype 3 (this time they will be tab separated, as opposed to the previous one).
+      - GEN[*].GT : Genotype subfields (GT) from ALL samples (tab separated).
+
+    The result will look something like:
+
+      ::
+
+        #CHROM  POS     ID              THETA   GEN[0].GL[1]    GEN[1].GL               GEN[3].GL[*]            GEN[*].GT
+        1       10583   rs58108140      0.0046  -0.47           -0.24,-0.44,-1.16       -0.48   -0.48   -0.48   0|0     0|0     0|0     0|1     0|0     0|1     0|0     0|0     0|1
+        1       10611   rs189107123     0.0077  -0.48           -0.24,-0.44,-1.16       -0.48   -0.48   -0.48   0|0     0|1     0|0     0|0     0|0     0|0     0|0     0|0     0|0
+        1       13302   rs180734498     0.0048  -0.58           -2.45,-0.00,-5.00       -0.48   -0.48   -0.48   0|0     0|1     0|0     0|0     0|0     1|0     0|0     0|1     0|0
+
+  - *Extracting fields with multiple values:*
+    (notice that there are multiple effect columns per line because there are mutiple effects per variant)
+
+    **CHROM POS REF ALT ANN[*].EFFECT**
+
+    The result will look something like:
+
+      ::
+
+        #CHROM	POS	REF	ALT	ANN[*].EFFECT
+        22	17071756	T	C	3_prime_UTR_variant	downstream_gene_variant
+        22	17072035	C	T	missense_variant	downstream_gene_variant
+        22	17072258	C	A	missense_variant	downstream_gene_variant
+
+  - *Extracting fields with multiple values using a comma as a multipe field separator:*
+
+    **CHROM POS REF ALT ANN[*].EFFECT ANN[*].HGVS_P**
+
+    The result will look something like:
+
+      ::
+
+        #CHROM	POS	REF	ALT	ANN[*].EFFECT	ANN[*].HGVS_P
+        22	17071756	T	C	3_prime_UTR_variant,downstream_gene_variant	.,.
+        22	17072035	C	T	missense_variant,downstream_gene_variant	p.Gly469Glu,.
+        22	17072258	C	A	missense_variant,downstream_gene_variant	p.Gly395Cys,.
+
+
+  - *Extracting fields with multiple values, one effect per line:*
+
+    **CHROM POS REF ALT ANN[*].EFFECT**
+
+    The result will look something like:
+
+      ::
+
+        #CHROM	POS	REF	ALT	ANN[*].EFFECT
+        22	17071756	T	C	3_prime_UTR_variant
+        22	17071756	T	C	downstream_gene_variant
+        22	17072035	C	T	missense_variant
+        22	17072035	C	T	downstream_gene_variant
+        22	17072258	C	A	missense_variant
+        22	17072258	C	A	downstream_gene_variant
+
+
+@EXTERNAL_DOCUMENTATION@
+	http://snpeff.sourceforge.net/SnpSift.html#Extract
+
+@CITATION_SECTION@
+
+]]>
+    </help>
+</tool>
--- a/snpSift_filter.xml	Thu Oct 23 06:06:25 2014 -0500
+++ b/snpSift_filter.xml	Wed Dec 09 14:03:26 2015 -0500
@@ -1,11 +1,13 @@
-<tool id="snpSift_filter" name="SnpSift Filter" version="4.0.0">
+<tool id="snpSift_filter" name="SnpSift Filter" version="@WRAPPER_VERSION@.0">
     <options sanitize="False" />
     <description>Filter variants using arbitrary expressions</description>
+    <macros>
+        <import>snpSift_macros.xml</import>
+    </macros>
     <expand macro="requirements" />
-    <macros>
-        <import>snpEff_macros.xml</import>
-    </macros>
-    <command>
+    <expand macro="stdio" />
+    <expand macro="version_command" />
+    <command><![CDATA[
         java -Xmx6G -jar \$SNPEFF_JAR_PATH/SnpSift.jar filter -f $input -e $exprFile $inverse
         #if $filtering.mode == 'field':
             #if $filtering.replace.pass:
@@ -22,6 +24,7 @@
             #end if
         #end if
          > $output
+]]>
     </command>
     <inputs>
         <param format="vcf" name="input" type="data" label="Variant input file in VCF format"/>
@@ -57,7 +60,6 @@
     <outputs>
         <data format="vcf" name="output" />
     </outputs>
-    <expand macro="stdio" />
     <tests>
         <test>
         <param name="input" ftype="vcf" value="test01.vcf"/>
@@ -85,7 +87,7 @@

         <test>
         <param name="input" ftype="vcf" value="test01.vcf"/>
-        <param name="expr" value="(POS >= 20175) &amp; (POS &lt;= 35549)"/>
+        <param name="expr" value="(POS >= 20175) & (POS <= 35549)"/>
         <param name="mode" value="entries"/>
         <output name="output">
             <assert_contents>
@@ -111,11 +113,11 @@
         </output>
         </test>
     </tests>
-    <help>
+    <help><![CDATA[

 **SnpSift filter**

-You can filter ia vcf file using arbitrary expressions, for instance "(QUAL > 30) | (exists INDEL) | ( countHet() > 2 )". The actual expressions can be quite complex, so it allows for a lot of flexibility.
+You can filter a VCF file using arbitrary expressions, for instance "(QUAL > 30) | (exists INDEL) | ( countHet() > 2 )". The actual expressions can be quite complex, so it allows for a lot of flexibility.

 Some examples:

@@ -123,7 +125,7 @@

     ::

-    ( CHROM = 'chr1' ) &amp; ( POS &gt; 1000000 )  &amp; ( POS &lt; 2000000 )
+    ( CHROM = 'chr1' ) & ( POS > 1000000 ) & ( POS < 2000000 )

   - *Filter value is either 'PASS' or it is missing*:

@@ -131,11 +133,13 @@

     (FILTER = 'PASS') | ( na FILTER )

-  - *I want to filter lines with an EFF of 'frameshift_variant' ( for vcf files using Sequence Ontology terms )*:
+  - *I want to filter lines with an ANN annotation EFFECT of 'frameshift_variant' ( for vcf files using Sequence Ontology terms )*:

     ::

-    ( EFF[*].EFFECT = 'frameshift_variant' )
+    ( ANN[*].EFFECT has 'frameshift_variant' )
+
+    **Important** According to the specification, there can be more than one EFFECT separated by & (e.g. 'missense_variant&splice_region_variant', thus using has operator is better than using equality operator (=). For instance 'missense_variant&splice_region_variant' = 'missense_variant' is false, whereas 'missense_variant&splice_region_variant' has 'missense_variant' is true.

   - *I want to filter lines with an EFF of 'FRAME_SHIFT' ( for vcf files using Classic Effect names )*:

@@ -147,31 +151,31 @@

     ::

-    ( QUAL &gt; 30 )
+    ( QUAL > 30 )

   - *...but we also want InDels that have quality 20 or more*:

     ::

-    (( exists INDEL ) &amp; (QUAL >= 20)) | (QUAL >= 30 )
+    (( exists INDEL ) & (QUAL >= 20)) | (QUAL >= 30 )

   - *...or any homozygous variant present in more than 3 samples*:

     ::

-    (countHom() > 3) | (( exists INDEL ) &amp; (QUAL >= 20)) | (QUAL >= 30 )
+    (countHom() > 3) | (( exists INDEL ) & (QUAL >= 20)) | (QUAL >= 30 )

   - *...or any heterozygous sample with coverage 25 or more*:

     ::

-    ((countHet() > 0) &amp; (DP >= 25)) | (countHom() > 3) | (( exists INDEL ) &amp; (QUAL >= 20)) | (QUAL >= 30 )
+    ((countHet() > 0) & (DP >= 25)) | (countHom() > 3) | (( exists INDEL ) & (QUAL >= 20)) | (QUAL >= 30 )

   - *I want to keep samples where the genotype for the first sample is homozygous variant and the genotype for the second sample is reference*:

     ::

-    (isHom( GEN[0] ) &amp; isVariant( GEN[0] ) &amp; isRef( GEN[1] ))
+    (isHom( GEN[0] ) & isVariant( GEN[0] ) & isRef( GEN[1] ))


 **For information regarding HGVS and Sequence Ontology terms versus classic names**:
@@ -185,5 +189,6 @@

 @CITATION_SECTION@

+]]>
     </help>
 </tool>
--- a/snpSift_int.xml	Thu Oct 23 06:06:25 2014 -0500
+++ b/snpSift_int.xml	Wed Dec 09 14:03:26 2015 -0500
@@ -1,14 +1,17 @@
-<tool id="snpSift_int" name="SnpSift Intervals" version="4.0.0">
+<tool id="snpSift_int" name="SnpSift Intervals" version="@WRAPPER_VERSION@.0">
     <description>Filter variants using intervals</description>
     <!--
         You can change the amount of memory used, just change the -Xmx parameter (e.g. use -Xmx2G for 2Gb of memory)
     -->
+    <macros>
+        <import>snpSift_macros.xml</import>
+    </macros>
     <expand macro="requirements" />
-    <macros>
-        <import>snpEff_macros.xml</import>
-    </macros>
-    <command>
+    <expand macro="stdio" />
+    <expand macro="version_command" />
+    <command><![CDATA[
         java -Xmx2G -jar \$SNPEFF_JAR_PATH/SnpSift.jar intervals -i $input $exclude $bedFile > $output
+]]>
     </command>
     <inputs>
         <param format="vcf" name="input" type="data" label="Variant input file in VCF format"/>
@@ -19,7 +22,6 @@
     <outputs>
         <data format="vcf" name="output" />
     </outputs>
-    <expand macro="stdio" />
     <tests>
         <test>
             <param name="input" ftype="vcf" value="annotate_5.vcf"/>
@@ -44,14 +46,15 @@
             </output>
         </test>
     </tests>
-    <help>
+    <help><![CDATA[

 You can filter using intervals (BED file).

 @EXTERNAL_DOCUMENTATION@
-	http://snpeff.sourceforge.net/SnpSift.html#intervals
+    http://snpeff.sourceforge.net/SnpSift.html#intervals

 @CITATION_SECTION@

+]]>
     </help>
 </tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/snpSift_macros.xml	Wed Dec 09 14:03:26 2015 -0500
@@ -0,0 +1,39 @@
+<macros>
+    <xml name="requirements">
+        <requirements>
+            <requirement type="package" version="4.1">snpEff</requirement>
+        </requirements>
+    </xml>
+  <xml name="stdio">
+    <stdio>
+        <exit_code range=":-1"  level="fatal" description="Error: Cannot open file" />
+        <exit_code range="1:"  level="fatal" description="Error" />
+    </stdio>
+  </xml>
+  <xml name="version_command">
+    <version_command>java -jar $SNPEFF_JAR_PATH/SnpEff.jar -version</version_command>
+  </xml>
+  <token name="@WRAPPER_VERSION@">4.1</token>
+  <token name="@EXTERNAL_DOCUMENTATION@">
+
+For details about this tool, please go to:
+	http://snpeff.sourceforge.net/SnpEff_manual.html
+
+  </token>
+  <token name="@CITATION_SECTION@">------
+
+**Citation**
+
+For the underlying tool, please cite the following two publications:
+
+SnpSift citation:
+"Using Drosophila melanogaster as a model for genotoxic chemical mutational studies with a new program, SnpSift", Cingolani, P., et. al., Frontiers in Genetics, 3:35, 2012.
+
+  </token>
+  <xml name="citations">
+      <citations>
+        <citation type="doi">10.3389/fgene.2012.00035</citation>
+        <yield />
+      </citations>
+  </xml>
+</macros>
--- a/snpSift_rmInfo.xml	Thu Oct 23 06:06:25 2014 -0500
+++ b/snpSift_rmInfo.xml	Wed Dec 09 14:03:26 2015 -0500
@@ -1,11 +1,14 @@
-<tool id="snpSift_rmInfo" name="SnpSift rmInfo" version="4.0.0">
+<tool id="snpSift_rmInfo" name="SnpSift rmInfo" version="@WRAPPER_VERSION@.0">
     <description>remove INFO field annotations</description>
-    <expand macro="requirements" />
     <macros>
-        <import>snpEff_macros.xml</import>
+        <import>snpSift_macros.xml</import>
     </macros>
-    <command>
+    <expand macro="requirements" />
+    <expand macro="stdio" />
+    <expand macro="version_command" />
+    <command><![CDATA[
       java -Xmx2G -jar \$SNPEFF_JAR_PATH/SnpSift.jar rmInfo $input ' '.join($info_fields.split(',')) > $output
+]]>
     </command>
     <inputs>
         <param format="vcf" name="input" type="data" label="Variant input file in VCF format"/>
@@ -17,7 +20,6 @@
     <outputs>
         <data format="vcf" name="output" />
     </outputs>
-    <expand macro="stdio" />
     <tests>
         <test>
             <param name="input" ftype="vcf" value="test-data/test_rmInfo.vcf"/>
@@ -25,8 +27,8 @@
             <output name="output">
                 <assert_contents>
                     <has_text text="DP=29" />
-		    <not_has_text text="EFF=EXON" />
-		</assert_contents>
+                    <not_has_text text="EFF=EXON" />
+                </assert_contents>
             </output>
         </test>
         <test>
@@ -34,23 +36,24 @@
             <param name="info_fields" value="EFF"/>
             <output name="output">
                 <assert_contents>
-		   <not_has_text text="DP=29;EFF=EXON" />
-		</assert_contents>
+                    <not_has_text text="DP=29;EFF=EXON" />
+                </assert_contents>
             </output>
         </test>
     </tests>
-    <help>
+    <help><![CDATA[
 This command removes INFO fields from a VCF file (i.e. removes annotations)

 Removing INFO fields is usually done because you want to re-annotate the VCF file, thus removing old INFO fields in order to add new ones later.

-SnpEff &amp; SnpSift only add annotations and do not change current ones. So, in order to re-annotate a file, you should first remove the old annotations and then re-annotate.
+SnpEff & SnpSift only add annotations and do not change current ones. So, in order to re-annotate a file, you should first remove the old annotations and then re-annotate.
 The reason for this behavior is simply because replacing annotation values is considered a bad practice. Imagine that you have a VCF entry  in your re-annotated file having the value "AA=1": How do you know if this is from the old annotations or from the new ones? This confusion often leads to problems in downstream steps of your pipelines, so it's better to avoid the problem by first removing all the previous annotations and then adding the new ones.

 @EXTERNAL_DOCUMENTATION@
-	http://snpeff.sourceforge.net/SnpSift.html#rmInfo
+    http://snpeff.sourceforge.net/SnpSift.html#rmInfo

 @CITATION_SECTION@

+]]>
     </help>
 </tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/snpSift_vartype.xml	Wed Dec 09 14:03:26 2015 -0500
@@ -0,0 +1,43 @@
+<tool id="snpsift_vartype" name="SnpSift Variant Type" version="@WRAPPER_VERSION@.0">
+    <description>Annotate with variant type</description>
+    <macros>
+        <import>snpSift_macros.xml</import>
+    </macros>
+    <expand macro="requirements" />
+    <expand macro="stdio" />
+    <expand macro="version_command" />
+    <command><![CDATA[
+        java -jar \$SNPEFF_JAR_PATH/SnpSift.jar varType $input 2> $log > $output
+]]>
+    </command>
+    <inputs>
+        <param format="vcf" name="input" type="data" label="Variant file (VCF)"/>
+    </inputs>
+    <outputs>
+        <data format="vcf" name="output" label="${tool.name} on ${on_string}: VCF" />
+        <data format="txt" name="log" label="${tool.name} on ${on_string}: log" />
+    </outputs>
+    <tests>
+    </tests>
+    <help><![CDATA[
+**What it does**
+
+This tool uses `SnpSift Variant type`_ to add the variant type (SNP/MNP/INS/DEL/MIXED) in the INFO field. It also adds "HOM/HET", but this last one works if there is only one sample (otherwise it doesn't make any sense).
+
+.. _SnpSift Variant type: http://snpeff.sourceforge.net/SnpSift.html#VariantType
+
+------
+
+**License**
+
+This Galaxy tool is Copyright © 2013-2014 `CRS4 Srl.`_ and is released under the `MIT license`_.
+
+.. _CRS4 Srl.: http://www.crs4.it/
+.. _MIT license: http://opensource.org/licenses/MIT
+
+@CITATION_SECTION@
+
+]]>
+    </help>
+    <expand macro="citations" />
+</tool>
--- a/snpSift_vcfCheck.xml	Thu Oct 23 06:06:25 2014 -0500
+++ b/snpSift_vcfCheck.xml	Wed Dec 09 14:03:26 2015 -0500
@@ -1,11 +1,14 @@
-<tool id="snpSift_vcfCheck" name="SnpSift vcfCheck" version="4.0.0">
+<tool id="snpSift_vcfCheck" name="SnpSift vcfCheck" version="@WRAPPER_VERSION@.0">
     <description>basic checks for Vcf specification compliance</description>
-    <expand macro="requirements" />
     <macros>
-        <import>snpEff_macros.xml</import>
+        <import>snpSift_macros.xml</import>
     </macros>
-    <command>
+    <expand macro="requirements" />
+    <expand macro="stdio" />
+    <expand macro="version_command" />
+    <command><![CDATA[
       java -Xmx2G -jar \$SNPEFF_JAR_PATH/SnpSift.jar vcfCheck $input > $output
+]]>
     </command>
     <inputs>
         <param format="vcf" name="input" type="data" label="Variant input file in VCF format to check"/>
@@ -13,7 +16,6 @@
     <outputs>
         <data format="vcf" name="output" />
     </outputs>
-    <expand macro="stdio" />
     <tests>
         <test>
             <param name="input" ftype="vcf" value="test-data/test_bad.vcf"/>
@@ -24,7 +26,7 @@
             </output>
         </test>
     </tests>
-    <help>
+    <help><![CDATA[

 Perform some basic check ups on VCF files to spot common problems.

@@ -35,5 +37,6 @@

 @CITATION_SECTION@

+]]>
     </help>
 </tool>
--- a/tool_dependencies.xml	Thu Oct 23 06:06:25 2014 -0500
+++ b/tool_dependencies.xml	Wed Dec 09 14:03:26 2015 -0500
@@ -1,7 +1,6 @@
 <?xml version="1.0"?>
 <tool_dependency>
-    <package name="snpEff" version="4.0">
-        <repository name="package_snpeff_4_0" owner="jjohnson" changeset_revision="4ac635fc1781" toolshed="http://testtoolshed.g2.bx.psu.edu/" />
+    <package name="snpEff" version="4.1">
+        <repository changeset_revision="02a5e07a4121" name="package_snpeff_4_1" owner="iuc" toolshed="https://testtoolshed.g2.bx.psu.edu" />
     </package>
 </tool_dependency>
-