annotate jaccardBed.xml @ 45:b176b1c7949e draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/bedtools commit 69394918e7a50dad3ae578e932cbac27b96e0d3b
author iuc
date Tue, 24 Jul 2018 11:49:34 -0400
parents d279800f4ff9
children 2f457890d8c8
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
8
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
1 <tool id="bedtools_jaccard" name="JaccardBed" version="@WRAPPER_VERSION@.0">
17
a2d4c30ba2f9 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/bedtools commit 0887009a23d176b21536c9fd8a18c4fecc417d4f
iuc
parents: 8
diff changeset
2 <description>calculate the Jaccard statistic between two files</description>
8
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
3 <macros>
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
4 <import>macros.xml</import>
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
5 </macros>
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
6 <expand macro="requirements" />
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
7 <expand macro="stdio" />
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
8 <command>
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
9 <![CDATA[
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
10 bedtools jaccard
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
11 $strand
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
12 $split
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
13 $reciprocal
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
14 -f $overlap
26
c0fbce5dc84a planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/bedtools commit 19967671ddd4e750f53d71274e5c12325a402811
iuc
parents: 17
diff changeset
15 -a '$inputA'
c0fbce5dc84a planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/bedtools commit 19967671ddd4e750f53d71274e5c12325a402811
iuc
parents: 17
diff changeset
16 -b '$inputB'
c0fbce5dc84a planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/bedtools commit 19967671ddd4e750f53d71274e5c12325a402811
iuc
parents: 17
diff changeset
17 > '$output'
8
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
18 ]]>
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
19 </command>
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
20 <inputs>
42
d279800f4ff9 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/bedtools commit b75b9e79cf3186a22dc2e1e9d27c1a080b891b59
iuc
parents: 26
diff changeset
21 <param format="@STD_BEDTOOLS_INPUTS@" name="inputA" type="data" label="@STD_BEDTOOLS_INPUT_LABEL@ file"/>
d279800f4ff9 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/bedtools commit b75b9e79cf3186a22dc2e1e9d27c1a080b891b59
iuc
parents: 26
diff changeset
22 <param format="@STD_BEDTOOLS_INPUTS@" name="inputB" type="data" label="@STD_BEDTOOLS_INPUT_LABEL@ file"/>
8
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
23 <expand macro="overlap" />
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
24 <expand macro="reciprocal" />
26
c0fbce5dc84a planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/bedtools commit 19967671ddd4e750f53d71274e5c12325a402811
iuc
parents: 17
diff changeset
25 <param name="strand" type="boolean" checked="false" truevalue="-s" falsevalue=""
8
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
26 label="Force strandedness"
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
27 help="That is, only report hits in B that overlap A on the same strand. By default, overlaps are reported without respect to strand. (-s)" />
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
28 <expand macro="strand2" />
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
29 <expand macro="split" />
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
30 </inputs>
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
31 <outputs>
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
32 <data format_source="inputA" name="output" metadata_source="inputA" label="Intersection of ${inputA.name} and ${inputB.name}" />
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
33 </outputs>
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
34 <tests>
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
35 <test>
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
36 <param name="inputA" value="jaccardBed1.bed" ftype="bed" />
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
37 <param name="inputB" value="jaccardBed2.bed" ftype="bed" />
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
38 <output name="output" file="jaccardBed_result1.bed" ftype="bed" />
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
39 </test>
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
40 <test>
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
41 <param name="inputA" value="jaccardBed1.bed" ftype="bed" />
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
42 <param name="inputB" value="jaccardBed2.bed" ftype="bed" />
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
43 <param name="overlap" value="0.1" />
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
44 <output name="output" file="jaccardBed_result2.bed" ftype="bed" />
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
45 </test>
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
46 </tests>
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
47 <help>
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
48
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
49 **What it does**
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
50
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
51 By default, bedtools jaccard reports the length of the intersection, the length of the union (minus the intersection), the final Jaccard statistic reflecting the similarity of the two sets, as well as the number of intersections.
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
52 Whereas the bedtools intersect tool enumerates each and every intersection between two sets of genomic intervals, one often needs a single statistic reflecting the similarity of the two sets based on the intersections between them. The Jaccard statistic is used in set theory to represent the ratio of the intersection of two sets to the union of the two sets. Similarly, Favorov et al. [1] reported the use of the Jaccard statistic for genome intervals: specifically, it measures the ratio of the number of intersecting base pairs between two sets to the number of base pairs in the union of the two sets. The bedtools jaccard tool implements this statistic, yet modifies the statistic such that the length of the intersection is subtracted from the length of the union. As a result, the final statistic ranges from 0.0 to 1.0, where 0.0 represents no overlap and 1.0 represents complete overlap.
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
53
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
54 .. image:: $PATH_TO_IMAGES/jaccard-glyph.png
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
55
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
56 .. class:: warningmark
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
57
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
58 The jaccard tool requires that your data is pre-sorted by chromosome and then by start position (e.g., sort -k1,1 -k2,2n in.bed > in.sorted.bed for BED files).
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
59
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
60 @REFERENCES@
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
61 </help>
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
62 <expand macro="citations" />
0d3aa592ce27 Uploaded
iuc
parents:
diff changeset
63 </tool>