comparison transcriptsToOrfs.xml @ 2:5eb99d21ef0d

Add trinityrnaseq_norm and transcriptsToOrfs tools
author Jim Johnson <jj@umn.edu>
date Thu, 05 Sep 2013 08:08:21 -0500
parents
children
comparison
equal deleted inserted replaced
1:a34ce2b18877 2:5eb99d21ef0d
1 <tool id="transcriptsToOrfs" name="transcriptsToOrfs" version="0.0.2">
2 <description>Trinity Transcripts to Candidate Peptides</description>
3 <requirements>
4 <requirement type="package" version="2013_08_14">trinityrnaseq</requirement>
5 <requirement type="package" version="3.0">hmmer</requirement>
6 </requirements>
7 <command>
8 \$TRINITY_HOME/trinity-plugins/transdecoder/transcripts_to_best_scoring_ORFs.pl
9 -t $transcripts
10 #if $min_prot_length:
11 -m $min_prot_length
12 #end if
13 #if $retain_long_orfs:
14 --retain_long_orfs $retain_long_orfs
15 #end if
16 #if $training_count:
17 -T $training_count
18 #end if
19 #if str($strand_specificity) == 'SS':
20 -S
21 #end if
22 #if $genetic_code.__str__ != '':
23 -G $genetic_code
24 #end if
25 #if $search.use_pfam == 'yes':
26 --search_pfam "${ filter( lambda x: str( x[0] ) == str( $search.pfam_db ), $__app__.tool_data_tables[ 'pfam_databases' ].get_fields() )[0][-1] }"
27 --CPU $search.CPU
28 #end if
29 </command>
30 <inputs>
31 <param format="fasta" name="transcripts" type="data" label="Transcripts sequences in fastA format" help="" />
32 <param name="min_prot_length" type="integer" value="" optional="true" label="Minimum peptide length (in amino acids)" help="default: 100">
33 <validator type="in_range" message="Minimum peptide length should be at least 50" min="50" />
34 </param>
35 <param name="retain_long_orfs" type="integer" value="" optional="true" label="Retain all ORFs found that are of minimum length in nucleotides" help="default: 900" >
36 <validator type="in_range" message="ORF length should be at least 50" min="50" />
37 </param>
38 <param name="training_count" type="integer" value="" optional="true" label="Number of top longest ORFs to train Markov Model (hexamer stats)" help="default: 500" >
39 <validator type="in_range" message="ORF count should be at least 50" min="50" />
40 </param>
41 <param name="strand_specificity" type="select" label="Strand specificity type">
42 <option value="DS">NOT strand specific, examine both strands</option>
43 <option value="SS">Strand specific, examine only top strand</option>
44 </param>
45 <param name="genetic_code" type="select" label="Genetic Code">
46 <option value="">use default(universal)</option>
47 <option value="universal">universal</option>
48 <option value="Euplotes">Euplotes</option>
49 <option value="Tetrahymena">Tetrahymena</option>
50 <option value="Candida">Candida</option>
51 <option value="Acetabularia">Acetabularia</option>
52 </param>
53 <conditional name="search">
54 <param name="use_pfam" type="select" label="Search PFAM database">
55 <option value="no">NO</option>
56 <option value="yes">YES</option>
57 </param>
58 <when value="no"/>
59 <when value="yes">
60 <param name="pfam_db" type="select" label="Pfam database">
61 <options from_data_table="pfam_databases" />
62 </param>
63 <param name="CPU" type="integer" value="2" min="1" label="CPU" help="Number of CPUs to use by hmmscan" />
64 </when>
65 </conditional>
66 </inputs>
67 <stdio>
68 <exit_code range="1:" level="fatal" description="Failed" />
69 <regex match="Error"
70 source="stderr"
71 level="fatal"
72 description="Failed" />
73 </stdio>
74 <outputs>
75 <data format="txt" name="trinity_pep_pfam" label="${tool.name} on ${on_string}: Pfam matches to Candidate Peptide Sequences" from_work_dir="longest_orfs.pep.pfam.dat">
76 <filter>search['use_pfam'] == 'yes'</filter>
77 </data>
78 <data format="gff3" name="trinity_pep_gff3" label="${tool.name} on ${on_string} Candidate Peptide Features" from_work_dir="best_candidates.eclipsed_orfs_removed.gff3" />
79 <data format="bed" name="trinity_pep_bed" label="${tool.name} on ${on_string} Candidate Peptide Coordinates" from_work_dir="best_candidates.eclipsed_orfs_removed.bed" />
80 <data format="fasta" name="trinity_pep_cds" label="${tool.name} on ${on_string}: Candidate Peptide CDS Sequences" from_work_dir="best_candidates.eclipsed_orfs_removed.cds"/>
81 <data format="fasta" name="trinity_pep_seqs" label="${tool.name} on ${on_string}: Candidate Peptide Sequences" from_work_dir="best_candidates.eclipsed_orfs_removed.pep"/>
82 </outputs>
83 <tests>
84 <test>
85 <param name="transcripts" ftype="fasta" value="TrinitySingle.fasta"/>
86 <param name="min_prot_length" value="100"/>
87 <param name="use_pfam" value="no"/>
88 <output name="trinity_pep_seqs">
89 <assert_contents>
90 <has_text text="WAAKAWLITARSLYPADF" />
91 </assert_contents>
92 </output>
93 <output name="trinity_pep_cds">
94 <assert_contents>
95 <has_text text="TGGGCAGCCAAGGCATGGCTGATCACGGCCCGCA" />
96 </assert_contents>
97 </output>
98 <output name="trinity_pep_bed">
99 <assert_contents>
100 <has_text text="comp10_c0_seq1" />
101 </assert_contents>
102 </output>
103 <output name="trinity_pep_gff3">
104 <assert_contents>
105 <has_text text="comp10_c0_seq1" />
106 </assert_contents>
107 </output>
108 </test>
109 </tests>
110 <help>
111 ** transcriptsToOrfs **
112 Trinity_ is a de novo transcript assembler that uses RNA-seq data as input.
113 This tool searches for open reading frames in the assembled transcripts.
114
115 .. _Trinity: http://trinityrnaseq.sourceforge.net
116 </help>
117 </tool>