annotate flaimapper.xml @ 37:d4bb1f5dbfc8 draft

Uploaded
author yhoogstrate
date Fri, 31 Jul 2015 05:33:05 -0400
parents 3074e91f9f80
children ee6d8c07205b
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
fec346894871 Uploaded
yhoogstrate
parents:
diff changeset
1 <?xml version="1.0" encoding="UTF-8"?>
35
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
2 <tool id="flaimapper" name="FlaiMapper" version="1.2.1.w2">
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
3 <description>Detect small ncRNA derived fragments using Fragment Location Annotation Identification Mapper.</description>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
4 <requirements>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
5 <requirement type="package" version="1.2.1">flaimapper</requirement>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
6 </requirements>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
7
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
8 <stdio>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
9 <regex match="in parse_gff.*?ValueError: invalid literal for int\(\) with base 10" source="stderr" level="fatal" description="The GTF file is corrupt: double check the columns of your GTF/GFF file.\n" />
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
10 <regex match="\[fai_load\] build FASTA index\." source="stderr" level="log" /><!-- match is a regular expression: brackets and the final dot are escaped so the literal "[fai_load] build FASTA index." notice on stderr is matched and logged -->
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
11 </stdio>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
12
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
13 <version_command>flaimapper --version</version_command>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
14
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
15 <command><![CDATA[
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
16 flaimapper
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
17 -v
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
18 -f $output_format
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
19 -o $output
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
20 -m $mask
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
21 -r $fasta
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
22
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
23 #for $alignment in $alignments
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
24 $alignment
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
25 #end for
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
26 ]]></command>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
27
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
28 <inputs>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
29 <param name="alignments" type="data" format="bam" label="Alignment file(s)" help="Aligned small RNA-Seq reads which may not be fragmented. In case you add multiple BAM files, FlaiMapper will simply concatenate the data and perform one single analysis on the entire set of alignments." multiple="true" />
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
30
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
31 <param name="mask" type="data" format="gtf,gff,gff3" label="small ncRNA Annotation (gtf)" help="" />
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
32
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
33 <param name="fasta" type="data" format="fasta" label="Fasta sequence corresponding to reference genome" help="" />
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
34
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
35 <param name="output_format" type="select" label="Output format">
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
36 <option value="1">Tabular (1 fragment per column)</option>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
37 <option value="2">Tabular (1 precursor per column)</option>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
38 <option value="3">GenBank</option>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
39 <!-- option value="gtf">GTF/GFF</option -->
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
40 </param>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
41 </inputs>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
42
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
43 <outputs>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
44 <data format="tabular" name="output" label="${tool.name} on ${', '.join([ str(a.hid)+': '+a.name for a in $alignments ])}" />
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
45 </outputs>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
46
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
47 <tests>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
48 <test><!-- Testing "ncRNAdb09 alignment"-type analysis -->
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
49 <param name="alignments" value="test1/snord81.bam" ftype="bam" />
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
50 <param name="mask" value="test1/ncrnadb09.v2.gtf" ftype="gtf" />
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
51 <param name="fasta" value="test1/ncrnadb09.fa" ftype="fasta" />
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
52 <param name="output_format" value="1" />
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
53
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
54 <output name="output" file="test1/snord81.flaimapper.txt" />
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
55 </test>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
56 <test><!-- Testing "Full genome alignment"-type analysis -->
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
57 <param name="alignments" value="test2/test_genomic_alignment.bam" ftype="bam" />
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
58 <param name="mask" value="test2/test_genomic_genes.gtf" ftype="gtf" />
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
59 <param name="fasta" value="test2/test_genomic_all_chromosomes.fa" ftype="fasta" />
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
60 <param name="output_format" value="1" />
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
61
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
62 <output name="output" file="test2/test_genomic_flaimapper_output.txt" />
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
63 </test>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
64 </tests>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
65
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
66 <help><![CDATA[
14
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
67 FlaiMapper wrapper for Galaxy
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
68 =============================
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
69
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
70 https://github.com/yhoogstrate/flaimapper
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
71 http://www.ncbi.nlm.nih.gov/pubmed/25338717
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
72 http://dx.doi.org/10.1093/bioinformatics/btu696
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
73
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
74 Fragment Location Annotation Identification Mapper
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
75
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
76 FlaiMapper: computational annotation of small ncRNA-derived fragments using RNA-seq high-throughput data.
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
77
26
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
78
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
79 Input
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
80 -----
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
81
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
82 Alignments
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
83 **********
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
84
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
85 Aligned reads from small RNA-Seq experiments have to be provided in the BAM format.
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
86 In case you add multiple BAM files, FlaiMapper will simply concatenate the data and perform one single analysis on the entire set of alignments.
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
87
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
88 Mask File
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
89 *********
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
90
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
91 There are two strategies to analyze using FlaiMapper:
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
92
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
93 - Relative to mature ncRNA sequences
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
94 - Relative to chromosomes
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
95
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
96 Therefore FlaiMapper requires a list of ncRNA annotations relative to the reference that was used for the alignment files. These ncRNA locations (MASK regions) within the sequences provided in the FASTA file should be provided in the GFF/GTF format:
14
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
97
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
98 - http://genome.ucsc.edu/FAQ/FAQformat.html#format3
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
99 - http://www.ensembl.org/info/website/upload/gff.html
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
100
26
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
101 If you are using an ncRNA database that has no GTF file available, you can use the Galaxy tool **flaimapper-gtf-from-fasta** to create one.
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
102
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
103
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
104 You can access **ncRNAdb09** GTF file at the following URL:
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
105 https://raw.githubusercontent.com/yhoogstrate/flaimapper/master/share/annotations/ncRNA_annotation/ncrnadb09.gtf *(mask file)*
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
106
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
107 Fasta sequence
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
108 **************
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
109
20
ac69be28e786 FlaiMapper: added wrapper for FASTA-&gt;GTF conversion
yhoogstrate
parents: 19
diff changeset
110 The reference sequence should be provided in FASTA format.
14
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
111
26
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
112 You can access **ncRNAdb09** FASTA file at the following URL:
19
ab3ea877607f Uploaded
yhoogstrate
parents: 18
diff changeset
113 https://raw.githubusercontent.com/yhoogstrate/flaimapper/master/share/annotations/ncRNA_annotation/ncrnadb09.fa *(reference file)*
ab3ea877607f Uploaded
yhoogstrate
parents: 18
diff changeset
114
26
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
115 Example- and reference data
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
116 ***************************
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
117
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
118 To align reads to ncRNA you need an aligner-specific indexed version of the reference. We have made
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
119 the following available for ncRNAdb09:
19
ab3ea877607f Uploaded
yhoogstrate
parents: 18
diff changeset
120
ab3ea877607f Uploaded
yhoogstrate
parents: 18
diff changeset
121 - **Tophat1**: https://github.com/yhoogstrate/flaimapper/blob/master/share/annotations/ncRNA_annotation/ncrnadb09.bt2.tar.gz
ab3ea877607f Uploaded
yhoogstrate
parents: 18
diff changeset
122 - **Tophat2**: https://github.com/yhoogstrate/flaimapper/blob/master/share/annotations/ncRNA_annotation/ncrnadb09.bt2.tar.gz
ab3ea877607f Uploaded
yhoogstrate
parents: 18
diff changeset
123
26
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
124 If you want to test FlaiMapper with example data you can obtain several
4e00cc7b97e5 Uploaded
yhoogstrate
parents: 25
diff changeset
125 alignment files from the following directory tree:
19
ab3ea877607f Uploaded
yhoogstrate
parents: 18
diff changeset
126
ab3ea877607f Uploaded
yhoogstrate
parents: 18
diff changeset
127 https://github.com/yhoogstrate/flaimapper/tree/master/share/small_RNA-seq_alignments
ab3ea877607f Uploaded
yhoogstrate
parents: 18
diff changeset
128
14
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
129 Installation
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
130 ------------
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
131
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
132 The wrapper makes use of easy_install to install a python egg. Please
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
133 ensure you have easy_install installed.
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
134
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
135 License
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
136 -------
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
137
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
138 **flaimapper** and **wrapper**:
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
139
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
140 GPL (>=3)
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
141
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
142 **pysam**:
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
143
19
ab3ea877607f Uploaded
yhoogstrate
parents: 18
diff changeset
144 The MIT License
14
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
145
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
146 Contact
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
147 -------
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
148
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
149 The tool wrapper has been written by Youri Hoogstrate from the Erasmus
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
150 Medical Center (Rotterdam, Netherlands).
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
151
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
152
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
153 Development
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
154 -----------
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
155
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
156 * Repository-Maintainer: Youri Hoogstrate
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
157 * Repository-Developers: Youri Hoogstrate
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
158
35
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
159 * Repository-Development: https://github.com/ErasmusMC-Bioinformatics/galaxy-tools
14
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
160
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
161 The tool wrapper has been written by Youri Hoogstrate from the Erasmus
fb1537d04625 Uploaded
yhoogstrate
parents: 13
diff changeset
162 Medical Center (Rotterdam, Netherlands).
35
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
163 ]]></help>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
164
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
165 <citations>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
166 <citation type="doi">10.1093/bioinformatics/btu696</citation>
3074e91f9f80 Uploaded
yhoogstrate
parents: 28
diff changeset
167 </citations>
20
ac69be28e786 FlaiMapper: added wrapper for FASTA-&gt;GTF conversion
yhoogstrate
parents: 19
diff changeset
168 </tool>