annotate correct_barcodes.xml @ 21:f509cd1d5a78 draft

planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fd1625359a101d8a6b0b8d97028cc8be509398f2\n'-dirty
author nick
date Thu, 04 Jan 2018 23:55:06 -0500
parents e5d1d90c099b
children db602e459536
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
1 <?xml version="1.0"?>
21
f509cd1d5a78 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fd1625359a101d8a6b0b8d97028cc8be509398f2\n'-dirty
nick
parents: 19
diff changeset
2 <tool id="correct_barcodes" name="Du Novo: Correct barcodes" version="2.0.10">
0
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
3 <description>of duplex sequencing reads</description>
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
4 <requirements>
21
f509cd1d5a78 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fd1625359a101d8a6b0b8d97028cc8be509398f2\n'-dirty
nick
parents: 19
diff changeset
5 <requirement type="package" version="1.1.2">bowtie</requirement>
18
075ef42d1ce5 Bugfix in kalign for very diverse read lengths.
nick
parents: 17
diff changeset
6 <requirement type="package" version="1.10">networkx</requirement>
21
f509cd1d5a78 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fd1625359a101d8a6b0b8d97028cc8be509398f2\n'-dirty
nick
parents: 19
diff changeset
7 <requirement type="package" version="2.0.10">dunovo</requirement>
0
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
8 <!-- TODO: require Python 2.7 -->
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
9 </requirements>
17
a34e074e4818 correct.py wrapper fix
nick
parents: 16
diff changeset
10 <version_command>correct.py --version</version_command>
6
1534fb45ab54 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'6d49c0120b09941b250a81cd5118436fe96cdfcf\n'-dirty
nick
parents: 5
diff changeset
11 <command detect_errors="exit_code"><![CDATA[
21
f509cd1d5a78 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fd1625359a101d8a6b0b8d97028cc8be509398f2\n'-dirty
nick
parents: 19
diff changeset
12 baralign.sh -c $advanced.chunkmbs -t \${GALAXY_SLOTS:-1} '$input' refdir correct.sam
f509cd1d5a78 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fd1625359a101d8a6b0b8d97028cc8be509398f2\n'-dirty
nick
parents: 19
diff changeset
13 && correct.py --galaxy $phone --dist $dist --mapq $mapq --pos $pos
f509cd1d5a78 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fd1625359a101d8a6b0b8d97028cc8be509398f2\n'-dirty
nick
parents: 19
diff changeset
14 '$input' refdir/barcodes.fa correct.sam
f509cd1d5a78 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fd1625359a101d8a6b0b8d97028cc8be509398f2\n'-dirty
nick
parents: 19
diff changeset
15 > families.corrected.tsv
17
a34e074e4818 correct.py wrapper fix
nick
parents: 16
diff changeset
16 && sort families.corrected.tsv
21
f509cd1d5a78 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fd1625359a101d8a6b0b8d97028cc8be509398f2\n'-dirty
nick
parents: 19
diff changeset
17 > '$output'
6
1534fb45ab54 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'6d49c0120b09941b250a81cd5118436fe96cdfcf\n'-dirty
nick
parents: 5
diff changeset
18 ]]>
0
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
19 </command>
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
20 <inputs>
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
21 <param name="input" type="data" format="tabular" label="Input reads" help="with barcodes, grouped by family"/>
21
f509cd1d5a78 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fd1625359a101d8a6b0b8d97028cc8be509398f2\n'-dirty
nick
parents: 19
diff changeset
22 <param name="dist" type="integer" value="3" min="1" label="Maximum differences" help="Only use alignments where the barcodes differ by at most this many errors. Note that raising this beyond 3 probably won't have an effect, because of the inherent limit in bowtie's ability to match up distant barcodes."/>
0
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
23 <param name="mapq" type="integer" value="20" min="0" label="Minimum mapping quality" help="Only use alignments whose MAPQ is at least this."/>
21
f509cd1d5a78 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fd1625359a101d8a6b0b8d97028cc8be509398f2\n'-dirty
nick
parents: 19
diff changeset
24 <param name="pos" type="integer" value="2" min="0" label="Maximum start offset" help="Ignore alignments where the start positions differ by more than this."/>
15
e87f8aef4535 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'4ee47753d5af62e584de290ae07ca3547aca2637\n'-dirty
nick
parents: 14
diff changeset
25 <param name="phone" type="boolean" truevalue="--phone-home" falsevalue="" checked="False" label="Send usage data" help="Report helpful usage data to the developer, to better understand the use cases and performance of the tool. The only data which will be recorded is the name and version of the tool, the size of the input data, the time and memory taken to process it, and the IP address of the machine running it. Also, if the tool fails, it will report the name of the exception thrown and the line of code it occurred in. The parameters and input/output dataset names are not sent. All the reporting and recording code is available at https://github.com/NickSto/ET"/>
21
f509cd1d5a78 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fd1625359a101d8a6b0b8d97028cc8be509398f2\n'-dirty
nick
parents: 19
diff changeset
26 <section name="advanced" title="Advanced Options" expanded="false">
f509cd1d5a78 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fd1625359a101d8a6b0b8d97028cc8be509398f2\n'-dirty
nick
parents: 19
diff changeset
27 <param name="chunkmbs" type="integer" value="512" min="16" label="bowtie --chunkmbs" help="This is the number of megabytes to give each bowtie thread for storing path descriptors. If you see warnings about &quot;Exhausted best-first chunk memory&quot; in stderr, you need to increase this."/>
f509cd1d5a78 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fd1625359a101d8a6b0b8d97028cc8be509398f2\n'-dirty
nick
parents: 19
diff changeset
28 </section>
0
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
29 </inputs>
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
30 <outputs>
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
31 <data name="output" format="tabular"/>
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
32 </outputs>
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
33 <help>
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
34
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
35 **What it does**
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
36
21
f509cd1d5a78 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fd1625359a101d8a6b0b8d97028cc8be509398f2\n'-dirty
nick
parents: 19
diff changeset
37 This is for processing duplex sequencing data. This will correct duplex barcodes and create new, larger families. Errors in barcodes normally prevent them from being recognized as the same as the other barcodes in their family. Correcting these errors allows the original, full families to be reconstructed, saving reads which would otherwise be lost. This tool accomplishes this by doing an all vs. all alignment between the barcodes with bowtie. This identifies barcodes which are identical except for a few small differences.
0
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
38
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
39 -----
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
40
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
41 **Input**
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
42
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
43 This expects the output format of the "Make families" tool.
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
44
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
45 -----
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
46
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
47 **Output**
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
48
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
49 The output format is the same as the input format, ready to be consumed by the "Align families" tool.
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
50
15
e87f8aef4535 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'4ee47753d5af62e584de290ae07ca3547aca2637\n'-dirty
nick
parents: 14
diff changeset
51 </help>
e87f8aef4535 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'4ee47753d5af62e584de290ae07ca3547aca2637\n'-dirty
nick
parents: 14
diff changeset
52 <citations>
e87f8aef4535 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'4ee47753d5af62e584de290ae07ca3547aca2637\n'-dirty
nick
parents: 14
diff changeset
53 <citation type="bibtex">@article{Stoler2016,
e87f8aef4535 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'4ee47753d5af62e584de290ae07ca3547aca2637\n'-dirty
nick
parents: 14
diff changeset
54 author = {Stoler, Nicholas and Arbeithuber, Barbara and Guiblet, Wilfried and Makova, Kateryna D and Nekrutenko, Anton},
e87f8aef4535 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'4ee47753d5af62e584de290ae07ca3547aca2637\n'-dirty
nick
parents: 14
diff changeset
55 doi = {10.1186/s13059-016-1039-4},
e87f8aef4535 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'4ee47753d5af62e584de290ae07ca3547aca2637\n'-dirty
nick
parents: 14
diff changeset
56 issn = {1474-760X},
e87f8aef4535 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'4ee47753d5af62e584de290ae07ca3547aca2637\n'-dirty
nick
parents: 14
diff changeset
57 journal = {Genome biology},
e87f8aef4535 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'4ee47753d5af62e584de290ae07ca3547aca2637\n'-dirty
nick
parents: 14
diff changeset
58 number = {1},
e87f8aef4535 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'4ee47753d5af62e584de290ae07ca3547aca2637\n'-dirty
nick
parents: 14
diff changeset
59 pages = {180},
e87f8aef4535 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'4ee47753d5af62e584de290ae07ca3547aca2637\n'-dirty
nick
parents: 14
diff changeset
60 pmid = {27566673},
e87f8aef4535 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'4ee47753d5af62e584de290ae07ca3547aca2637\n'-dirty
nick
parents: 14
diff changeset
61 publisher = {Genome Biology},
e87f8aef4535 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'4ee47753d5af62e584de290ae07ca3547aca2637\n'-dirty
nick
parents: 14
diff changeset
62 title = {{Streamlined analysis of duplex sequencing data with Du Novo.}},
e87f8aef4535 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'4ee47753d5af62e584de290ae07ca3547aca2637\n'-dirty
nick
parents: 14
diff changeset
63 url = {http://www.ncbi.nlm.nih.gov/pubmed/27566673},
e87f8aef4535 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'4ee47753d5af62e584de290ae07ca3547aca2637\n'-dirty
nick
parents: 14
diff changeset
64 volume = {17},
e87f8aef4535 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'4ee47753d5af62e584de290ae07ca3547aca2637\n'-dirty
nick
parents: 14
diff changeset
65 year = {2016}
e87f8aef4535 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'4ee47753d5af62e584de290ae07ca3547aca2637\n'-dirty
nick
parents: 14
diff changeset
66 }</citation>
e87f8aef4535 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'4ee47753d5af62e584de290ae07ca3547aca2637\n'-dirty
nick
parents: 14
diff changeset
67 </citations>
0
548c63893c70 planemo upload for repository https://github.com/galaxyproject/dunovo commit b'fcd6f371638bc29da6dbe22f939f7a5a7f360481\n'-dirty
nick
parents:
diff changeset
68 </tool>