comparison tools/mira4/mira4_de_novo.xml @ 13:7fcabeeca5df draft

Uploaded v0.0.2 preview 5, fixes for MIRA 4.0 (final), more verbose error if $MIRA4 path wrong
author peterjc
date Sun, 16 Feb 2014 16:30:48 -0500
parents 302d13490b23
children 133b863a8a40
comparison
equal deleted inserted replaced
12:a6a56440567c 13:7fcabeeca5df
77 </outputs> 77 </outputs>
78 <configfiles> 78 <configfiles>
79 <configfile name="manifest"> 79 <configfile name="manifest">
80 project = MIRA 80 project = MIRA
81 job = denovo,${job_type},${job_quality} 81 job = denovo,${job_type},${job_quality}
82 parameters = -GE:not=1 -NW:cmrnl -DI:trt=/tmp 82 parameters = -NW:cmrnl=no -DI:trt=/tmp
83 ## -GE:not is short for -GENERAL:number_of_threads and using one (1) 83 ## -GE:not is short for -GENERAL:number_of_threads and using one (1)
84 ## can be useful for repeatability of assemblies and bug hunting. 84 ## can be useful for repeatability of assemblies and bug hunting.
85 ## This is overriden by the command line -t switch which is easier
86 ## to set from within Galaxy.
85 ## 87 ##
86 ## -NW:cmrnl is short for -NAG_AND_WARN:check_maxreadnamelength 88 ## -NW:cmrnl is short for -NAG_AND_WARN:check_maxreadnamelength
87 ## and without this MIRA aborts with read names over 40 characters 89 ## and without this MIRA aborts with read names over 40 characters
88 ## due to limitations of some downstream tools. 90 ## due to limitations of some downstream tools.
89 ## 91 ##
97 99
98 readgroup 100 readgroup
99 technology = ${rg.technology} 101 technology = ${rg.technology}
100 ##Record the segment placement (if any) 102 ##Record the segment placement (if any)
101 #if str($rg.segments.type) == "paired" 103 #if str($rg.segments.type) == "paired"
102 segmentplacement = ${rg.segments.placement} 104 segment_placement = ${rg.segments.placement}
103 segmentnaming = ${rg.segments.naming} 105 segment_naming = ${rg.segments.naming}
104 #if str($rg.segments.min_size) != "" or str($rg.segments.max_size) != "" 106 #if str($rg.segments.min_size) != "" or str($rg.segments.max_size) != ""
105 ##If our min/max validation failed I trust MIRA to give an error message... 107 ##If our min/max validation failed I trust MIRA to give an error message...
106 templatesize = $rg.segments.min_size $rg.segments.max_size 108 template_size = $rg.segments.min_size $rg.segments.max_size
107 #end if 109 #end if
108 #end if 110 #end if
109 #if str($rg.segments.type) == "none" 111 ##if str($rg.segments.type) == "none"
110 segmentplacement = ? 112 ##MIRA4 manual says use segment_placement = unknown or ? for unpaired data
111 #end if 113 ##but this stopped working in MIRA 4.0 RC5 and 4.0 (final). See:
114 ##http://www.freelists.org/post/mira_talk/Unpaired-reads-and-segment-placement--or-unknown
115 ##segment_placement = ?
116 ##end if
112 ##MIRA will accept multiple filenames on one data line, or multiple data lines 117 ##MIRA will accept multiple filenames on one data line, or multiple data lines
113 #for $f in $rg.filenames 118 #for $f in $rg.filenames
114 ##Must now map Galaxy datatypes to MIRA file types... 119 ##Must now map Galaxy datatypes to MIRA file types...
115 #if $f.ext.startswith("fastq") 120 #if $f.ext.startswith("fastq")
116 ##MIRA doesn't like fastqsanger etc, just plain old fastq: 121 ##MIRA doesn't like fastqsanger etc, just plain old fastq:
128 </configfiles> 133 </configfiles>
129 <tests> 134 <tests>
130 <!-- Tiger mitochondria, selected paired end Illumina reads from SRR639755 135 <!-- Tiger mitochondria, selected paired end Illumina reads from SRR639755
131 Note we're using just one repeat group, and only the filenames parameter 136 Note we're using just one repeat group, and only the filenames parameter
132 within it, so this should work with current test framework limitations: 137 within it, so this should work with current test framework limitations:
138 TODO: Revise example and/or -NW:cac=warn and -NW:acv=80 settings
139 MIRA 4.0 complains as coverage is about x93 which is over 80 limit.
140 Also MIRA 4.0 gives three contigs as output.
133 <test> 141 <test>
134 <param name="job_type" value="genome" /> 142 <param name="job_type" value="genome" />
135 <param name="job_quality" value="accurate" /> 143 <param name="job_quality" value="accurate" />
136 <param name="filenames" value="SRR639755_mito_pairs.fastq.gz" ftype="fastqsanger" /> 144 <param name="filenames" value="SRR639755_mito_pairs.fastq.gz" ftype="fastqsanger" />
137 <output name="out_fasta" file="SRR639755_mito_pairs.mira4_de_novo.fasta" ftype="fasta" /> 145 <output name="out_fasta" file="SRR639755_mito_pairs.mira4_de_novo.fasta" ftype="fasta" />
151 </test> 159 </test>
152 --> 160 -->
153 <!-- Simple assembly based on MIRA's minidemo/solexa1 example 161 <!-- Simple assembly based on MIRA's minidemo/solexa1 example
154 Note we're using just one repeat group, 162 Note we're using just one repeat group,
155 but two parameters within the repeat (filename, no pairing) 163 but two parameters within the repeat (filename, no pairing)
164 -->
156 <test> 165 <test>
157 <param name="job_type" value="genome" /> 166 <param name="job_type" value="genome" />
158 <param name="job_quality" value="accurate" /> 167 <param name="job_quality" value="accurate" />
159 <param name="type" value="none" /> 168 <param name="type" value="none" />
160 <param name="filenames" value="ecoli.fastq" ftype="fastqsanger" /> 169 <param name="filenames" value="ecoli.fastq" ftype="fastqsanger" />
161 <output name="out_fasta" file="ecoli.mira4_de_novo.fasta" ftype="fasta" /> 170 <output name="out_fasta" file="ecoli.mira4_de_novo.fasta" ftype="fasta" />
171 <output name="out_bam" file="empty_file.dat" compare="contains" />
172 <output name="out_maf" file="empty_file.dat" compare="contains" />
173 <output name="out_log" file="empty_file.dat" compare="contains" />
162 </test> 174 </test>
163 -->
164 </tests> 175 </tests>
165 <help> 176 <help>
166 177
167 **What it does** 178 **What it does**
168 179