Mercurial > repos > peterjc > mira4_assembler
diff tools/mira4/mira4_de_novo.xml @ 13:7fcabeeca5df draft
Uploaded v0.0.2 preview 5, fixes for MIRA 4.0 (final), more verbose error if $MIRA4 path wrong
author | peterjc |
---|---|
date | Sun, 16 Feb 2014 16:30:48 -0500 |
parents | 302d13490b23 |
children | 133b863a8a40 |
line wrap: on
line diff
--- a/tools/mira4/mira4_de_novo.xml Mon Feb 03 06:25:35 2014 -0500 +++ b/tools/mira4/mira4_de_novo.xml Sun Feb 16 16:30:48 2014 -0500 @@ -79,9 +79,11 @@ <configfile name="manifest"> project = MIRA job = denovo,${job_type},${job_quality} -parameters = -GE:not=1 -NW:cmrnl -DI:trt=/tmp +parameters = -NW:cmrnl=no -DI:trt=/tmp ## -GE:not is short for -GENERAL:number_of_threads and using one (1) ## can be useful for repeatability of assemblies and bug hunting. +## This is overriden by the command line -t switch which is easier +## to set from within Galaxy. ## ## -NW:cmrnl is short for -NAG_AND_WARN:check_maxreadnamelength ## and without this MIRA aborts with read names over 40 characters @@ -99,16 +101,19 @@ technology = ${rg.technology} ##Record the segment placement (if any) #if str($rg.segments.type) == "paired" -segmentplacement = ${rg.segments.placement} -segmentnaming = ${rg.segments.naming} +segment_placement = ${rg.segments.placement} +segment_naming = ${rg.segments.naming} #if str($rg.segments.min_size) != "" or str($rg.segments.max_size) != "" ##If our min/max validation failed I trust MIRA to give an error message... -templatesize = $rg.segments.min_size $rg.segments.max_size +template_size = $rg.segments.min_size $rg.segments.max_size #end if #end if -#if str($rg.segments.type) == "none" -segmentplacement = ? -#end if +##if str($rg.segments.type) == "none" +##MIRA4 manual says use segment_placement = unknown or ? for unpaired data +##but this stopped working in MIRA 4.0 RC5 and 4.0 (final). See: +##http://www.freelists.org/post/mira_talk/Unpaired-reads-and-segment-placement--or-unknown +##segment_placement = ? +##end if ##MIRA will accept multiple filenames on one data line, or multiple data lines #for $f in $rg.filenames ##Must now map Galaxy datatypes to MIRA file types... @@ -130,6 +135,9 @@ <!-- Tiger mitochondria, selected paired end Illumina reads from SRR639755 Note we're using just one repeat group, and only the filenames parameter within it, so this should work with current test framework limitations: + TODO: Revise example and/or -NW:cac=warn and -NW:acv=80 settings + MIRA 4.0 complains as coverage is about x93 which is over 80 limit. + Also MIRA 4.0 gives three contigs as output. <test> <param name="job_type" value="genome" /> <param name="job_quality" value="accurate" /> @@ -153,14 +161,17 @@ <!-- Simple assembly based on MIRA's minidemo/solexa1 example Note we're using just one repeat group, but two parameters within the repeat (filename, no pairing) + --> <test> <param name="job_type" value="genome" /> <param name="job_quality" value="accurate" /> <param name="type" value="none" /> <param name="filenames" value="ecoli.fastq" ftype="fastqsanger" /> <output name="out_fasta" file="ecoli.mira4_de_novo.fasta" ftype="fasta" /> + <output name="out_bam" file="empty_file.dat" compare="contains" /> + <output name="out_maf" file="empty_file.dat" compare="contains" /> + <output name="out_log" file="empty_file.dat" compare="contains" /> </test> - --> </tests> <help>