view fermikit_run_calling.xml @ 0:38838353adb4 draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fermikit commit 47795b03c956d0f239aede8e27d2aa4e3c4c1d27
author mvdbeek
date Fri, 30 Dec 2016 10:26:16 -0500
parents
children b66e81e4ffc7
line wrap: on
line source

<tool id="fermikit_variants" name="fermikit-variants" version="0.14.dev1">
    <description>call variants from genome-aligned contigs</description>
    <requirements>
        <requirement type="package" version="0.14.dev1">fermikit</requirement>
        <requirement type="package" version="0.6.5">sambamba</requirement>
    </requirements>
    <command detect_errors="aggressive"><![CDATA[
        #import re
        #set escaped_element_identifier = re.sub('[^\w\-\s]', '_', str($bam.element_identifier))
        #set ref = $reference_genome.fasta_item.fields.path if $reference_genome.reference_genome_source == "reference" else $reference_genome.history_item
        export ROOT=\$(dirname \$(type -P k8)) &&
        ln -f -s '$bam' '$escaped_element_identifier' &&
        htsbox pileup -cuf '$ref' '$escaped_element_identifier'  | gzip -1 > raw.vcf.gz &&
        k8 "\$ROOT"/hapdip.js deovlp raw.vcf.gz | k8 "\$ROOT"/hapdip.js anno | gzip -1 > tmp.vcf.gz 2> flt.vcf.log &&
        k8 "\$ROOT"/hapdip.js filter -q3 tmp.vcf.gz > flt.vcf 2>> flt.vcf.log &&
        htsbox abreak -bcuf '$ref' <(sambamba sort -n -o /dev/stdout '$escaped_element_identifier') > sv.vcf
     ]]></command>
     <inputs>
         <param name="bam" type="data" label="aligned contigs" help="To generate aligned contigs align fermi2 contigs with BWA mem options -B9 -O16 -L5" format="bam"/>
         <conditional name="reference_genome" label="Reference genome to call variants against">
             <param name="reference_genome_source" type="select">
                 <option value="reference">Use a built-in genome to call variants</option>
                 <option value="history">Use a genome from history to call variants</option>
             </param>
             <when value="history">
                <param format="fasta" label="Select a reference genome" name="history_item" type="data" />
            </when>
            <when value="reference">
                <param label="Select a reference genome" name="fasta_item" type="select">
                    <options from_data_table="fasta_indexes">
                        <filter column="2" type="sort_by"/>
                    </options>
                </param>
            </when>
         </conditional>
    </inputs>
    <outputs>
        <data name="structural_variants" format="vcf" label="fermikit SV on ${on_string}" from_work_dir="sv.vcf"/>
        <data name="snps_indels" format="vcf" label="fermikit SNPs and short INDELs on ${on_string}" from_work_dir="flt.vcf"/>
    </outputs>
    <tests>
        <test>
            <param name="reference_genome_source" value="history"/>
            <param name="history_item" value="small.fa"/>
            <param name="bam" value="aligned_contigs.bam"/>
            <output name="structural_variants" file="sv.vcf" lines_diff="2"/>
            <output name="snps_indels" file="flt.vcf" lines_diff="2"/>
        </test>
    </tests>
    <help><![CDATA[

FermiKit is a de novo assembly based variant calling pipeline for deep Illumina
resequencing data. This galaxy wrapper can be used to call variants from contigs
generated by fermi2 that have subsequently been aligned to a reference genome
using bwa (options -B9 -O16 -L5 or -x intractg).

]]></help> <citations> <citation
type="doi">10.1093/bioinformatics/btv440</citation> </citations> </tool>