Mercurial > repos > greg > multigps
diff multigps.xml @ 0:269f8d00045c draft
Uploaded
author | greg |
---|---|
date | Wed, 23 Dec 2015 10:08:24 -0500 |
parents | |
children | 7779952f00dd |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/multigps.xml Wed Dec 23 10:08:24 2015 -0500 @@ -0,0 +1,141 @@ +<tool id="multigps" name="MultiGPS" version="0.5.0.0"> + <description>analyzes collections of multi-condition ChIP-seq data</description> + <requirements> + <requirement type="package" version="4.11.0">meme</requirement> + <requirement type="package" version="3.11.0">edger</requirement> + <requirement type="package" version="2.14">biocbasics</requirement> + </requirements> + <command> + <![CDATA[ + ## when I don't run on my mac... + ## java -Xmx20G -jar $__tool_directory__/multigps_v0.5.jar + mkdir multigps_out && + java -jar $__tool_directory__/multigps_v0.5.jar + --threads="\${GALAXY_SLOTS:-4}" + --verbose + --geninfo ${chromInfo} + #if str($use_motif_cond.use_motif) == "yes": + #set seq_dir = python "$get_seq_dir" + --seq "${seq_dir}" + --mememinw $use_motif_cond.min_motif_width + --mememaxw $use_motif_cond.max_motif_width + --design $design_file + #if str($gauss_model_smoothing_cond.gauss_model_smoothing) == "yes": + --gaussmodelsmoothing + --gausssmoothparam $gauss_model_smoothing_cond.gauss_model_smoothing.gauss_smooth + #end if + --out multigps_out + ]]> + </command> + <configfiles> + <configfile name="design_file"> + <![CDATA[ + #for input in $input_files: + #set filename = "{$input['input'].filename}" + #set signal_control = $input['signal_control'] + #set format = $input['input'].ext + #set condition_name = $input['condition_name'] + #set replicate_name = $input['replicate_name'] + #set line = '\t'.join($filename, $signal_control, $format, $condition_name, $replicate_name]) + ${line} + #end for + ]]> + </configfile> + <configfile name="get_seq_dir"> +<![CDATA[ +#!/usr/bin/env python +import os +import tempfile + +# All inputs must have the same dbkey, and MultiGPS requires a directory, not the reference file. +if $use_motif_cond.reference_genome_cond.reference_genome_source == "cached": + return os.path.split($use_motif_cond.reference_genome_cond.reference_genome.fields.path)[0] +else: + seq_dir = tempfile.mkdtemp(prefix="tmp-multigps-") + # Populate the directory with the history dataset + tmp_filename = "%s.fa" % $use_motif_cond.reference_genome_cond.reference_genome.dbkey + ln -f -s $use_motif_cond.reference_genome_cond.reference_genome.filename os.path.join(seq_dir, tmp_filename) + return seq_dir +]]> + </configfile> + </configfiles> + <inputs> + <repeat name="input_files" title="Input Files" min="1"> + <param name="input" type="data" format="bam,bed,scidx" label="Add file"> + <validator type="unspecified_build" /> + </param> + <param name="signal_control" type="select" label="Signal or control" display="checkboxes" > + <option value="signal" selected="True">Signal</option> + <option value="control">Control</option> + </param> + <param label="Condition name" name="condition_name" type="text" /> + <param label="Replicate name" name="replicate_name" type="text" /> + + <conditional name="use_motif_cond"> + <param name="use_motif" type="select" label="Perform motif-finding or use a motif-prior?"> + <option value="yes" selected="True">Yes</option> + <option value="no">No</option> + </param> + <when value="yes"> + <conditional name="reference_genome_cond"> + <param name="reference_genome_source" type="select" label="Choose the source for the reference genome"> + <option value="cached">Locally Cached</option> + <option value="history">From History</option> + </param> + <when value="cached"> + <param name="reference_genome" type="select" label="Using reference genome"> + <options from_data_table="fasta_indexes"/> + <validator type="no_options" message="A built-in reference genome is not available for the build associated with the selected input file"/> + </param> + </when> + <when value="history"> + <param name="reference_genome" type="data" format="fasta" label="Using reference genome"/> + </when> + </conditional> + <param name="min_motif_width" type="integer" min="0" value="6" label="Minimum motif width for MEME"> + <param name="max_motif_width" type="integer" min="0" value="16" label="Maximum motif width for MEME"> + </when> + <when value="no"> + </conditional> + + + </repeat> + + <param name="genome_info_file" type="data" format="tabular" label="Genome information dataset" help="What's this? See the help section below."/> + <conditional name="gauss_model_smoothing_cond"> + <param name="gauss_model_smoothing" type="select" label="Turn on Gaussian model smoothing?" help="Smoothing is done with a cubic spline."> + <option value="yes" selected="True">Yes</option> + <option value="no">No</option> + </param> + <when value="yes"> + <param name="gauss_smooth" type="integer" value="3" min="0" label="Smoothing factor" help="Gaussian smoothing standard deviation." /> + </when> + <when value="no" /> + </conditional> + </inputs> + <outputs> + <data name="output_report" format="txt" label="MultiGPS-Report"/> + <data name="output_gff" format="gff" label="MultiGPS-GFF" /> + <data name="output_gz" format="gz" label="MultiGPS-GZ" /> + </outputs> + <help> + +**What it does** + +MultiGPS is a framework for analyzing collections of multi-condition ChIP-seq datasets and characterizing +differential binding events between conditions. MultiGPS encourages consistency in the reported binding +event locations across conditions and provides accurate estimation of ChIP enrichment levels at each event. +MultiGPS loads all data to memory, so you will need a lot of available memory if you are running analysis +over many conditions or large datasets. + +----- + +**Options** + +* **Input Files** + + </help> + <citations> + <citation type="doi">10.1371/journal.pcbi.1003501</citation> + </citations> +</tool>