comparison spotyping.xml @ 6:20c20bcdec36 draft

planemo upload
author jowong
date Tue, 13 Nov 2018 02:50:56 -0500
parents f1b3a263dd3a
children 1bf76073c034
comparison
equal deleted inserted replaced
5:f1b3a263dd3a 6:20c20bcdec36
1 <tool id="spotyping" name="Spoligotype Prediction" version="0.1.4"> 1 <tool id="spotyping" name="Spoligotype Prediction" version="0.1.5">
2 <description>fast and accurate in silico Mycobacterium spoligotyping from sequence reads</description>
2 <requirements> 3 <requirements>
3 <requirement type="package" version="2.1">spotyping</requirement> 4 <requirement type="package" version="2.1">spotyping</requirement>
4 </requirements> 5 </requirements>
5 <command detect_errors="aggressive"><![CDATA[ 6 <command detect_errors="aggressive"><![CDATA[
6 SpoTyping.py 7 SpoTyping.py
8 $advanced.seq
9 $advanced.swift
10 --min=$advanced.min
11 --rmin=$advanced.min_relax
7 #if str( $data_input.data_selector ) == "paired" 12 #if str( $data_input.data_selector ) == "paired"
8 $data_input.input1.forward $data_input.input1.reverse 13 $data_input.input1.forward $data_input.input1.reverse
9 #end if 14 #end if
10 #if str( $data_input.data_selector ) == "single" 15 #if str( $data_input.data_selector ) == "single"
11 $data_input.input2.element_identifier 16 $data_input.input2
12 #end if 17 #end if
13 && cp SITVIT_ONLINE.*.xls spotyping.xls 18 && cp SITVIT_ONLINE.*.xls spotyping.xls
14 ]]> 19 ]]>
15 </command> 20 </command>
16 <inputs> 21 <inputs>
17 <conditional name="data_input"> 22 <conditional name="data_input">
18 <param name="data_selector" type="select" label="Single or Paired-end Data" help="Select between paired and single end data to add name to dataset"> 23 <param name="data_selector" type="select" label="Single or Paired-end Data" help="Select between paired and single end data to add name to dataset">
19 <option value="paired">Paired</option> 24 <option value="paired">Paired</option>
20 <option value="single">Single</option> 25 <option value="single">Single</option>
21 </param> 26 </param>
22 <when value="paired"> 27 <when value="paired">
23 <param name="input1" format="data" type="data_collection" collection_type="paired" label="Select a paired collection" help="a paired data"/> 28 <param name="input1" format="data" type="data_collection" collection_type="paired" label="Select a paired collection" help="a paired data"/>
24 </when> 29 </when>
25 <when value="single"> 30 <when value="single">
26 <param name="input2" format="data" type="data" label="input" help="Specify dataset with single reads"/> 31 <param name="input2" format="data" type="data" label="input" help="Specify dataset with single reads"/>
27 </when> 32 </when>
28 </conditional> 33 </conditional>
34 <section name="advanced" title="Advanced options" expanded="false">
35 <param type="boolean" argument="--seq" label="Input is assembled sequence" help="Input is either a complete genomic sequence or assembled contigs from an isolate" truevalue="--seq" falsevalue="" checked="false" />
36 <param type="boolean" argument="--swift" label="Swift mode" checked="true" truevalue="--swift=on" falsevalue="--swift=off" />
37 <param name="min" type="integer" value="5" label="MIN" help="minimum number of error-free hits to support presence of a spacer" />
38 <param name="min_relax" type="integer" value="6" label="MIN RELAX" help="minimum number of 1-error-tolerant hits to support presence of a spacer " />
39 </section>
29 </inputs> 40 </inputs>
30 <outputs> 41 <outputs>
31 <data name="output1" label="spoligotyping results" format="txt" from_work_dir="SpoTyping"/> 42 <data name="output1" label="spoligotyping results" format="txt" from_work_dir="SpoTyping"/>
32 <data name="output2" label="spoligotyping log" format="txt" from_work_dir="SpoTyping.log"/> 43 <data name="output2" label="spoligotyping log" format="txt" from_work_dir="SpoTyping.log"/>
33 <data name="output3" label="query" format="excel.xls" from_work_dir="spotyping.xls"/> 44 <data name="output3" label="query" format="excel.xls" from_work_dir="spotyping.xls"/>
34 </outputs> 45 </outputs>
35 <help><![CDATA[ 46 <help><![CDATA[
36 Usage: python SpoTyping.py [options] FASTQ_1/FASTA FASTQ_2(optional) 47 This is a modified version of IUC's wrapper of spotyping without the concatenation and renaming or input files. The wrapper also runs properly when supplied with paired-end reads
48
49 SpoTyping_ is a software for predicting spoligotype_ from sequencing reads, complete genomic sequences and assembled contigs.
50
51 **Input:**
52
53 - Fastq file - if paired end data is used, you may choose to concatenate paired reads into a single input (e.g. using the cat tool)
54 - Fasta file of a complete genomic sequence or assembled contigs of an isolate (with --seq option)
55
56 *Note on input size*: In swift mode the sampling threshold is reached in approximately 30x coverage when using
57 paired end sequencing of a *M. tuberculosis* genome.
58
59 **Output:**
60
61 Count of hits from BLAST result for each spacer sequence and predicted spoligotype in the format of binary code and octal code.
62
63 **Options:**
64
65 \--noQuery
66 Avoid querying the SITVIT_ online service to describe the prevalance of the reported spoligotype.
67
68 \--seq
69 Set this if input is a fasta file that contains only complete genomic sequence or assembled contigs from an isolate. [Default is off]
70
71 \-s SWIFT, --swift=SWIFT
72 Swift mode, either "on" or "off" [Default: on] - swift mode samples 250 million bases to use for spoligotyping
73
74 \--sorted
75 Set if input reads are sorted relative to positions on a reference genome. If reads are sorted and swift mode is used, swift mode's sampling is adjusted
76 to sample reads across positions in the genome evenly.
77
78 \--filter
79 Filter reads such that:
80
81 1. Leading and trailing 'N's would be removed.
82 2. Any read with more than 3 'N's in the middle would be removed.
83 3. Any read with more than 7 consecutive bases identical would be trimmed/filtered out given
84 the length of the flanking regions.
85
86 **Got weird spoligotype prediction?**
87
88 Sequencing throughput is very low (<40Mbp, for example): SpoTyping may not be able to give accurate prediction due to the relatively low read depth.
89
90 **Interpreting the spoligotype**
91
92 The binary or octal spoligotype can be used to look up lineage information using a service
93 like `TB Lineage`_.
94
95 **SITVIT reports**
96
97 Optionally a report on the detected spoligotype can be retrieved from the SITVIT_ database. If such a report is requested it can also be
98 illustrated as a (PDF format) plot.
99
100 .. _SpoTyping: https://github.com/xiaeryu/SpoTyping
101 .. _spoligotype: https://www.ncbi.nlm.nih.gov/pubmed/19521871
102 .. _TB Lineage: http://tbinsight.cs.rpi.edu/run_tb_lineage.html
103 .. _SITVIT: http://www.pasteur-guadeloupe.fr:8081/SITVIT_ONLINE/
37 ]]></help> 104 ]]></help>
38 <citations> 105 <citations>
39 <citation type="bibtex"> 106 <citation type="bibtex">
40 @misc{githubSpoTyping, 107 @misc{githubSpoTyping,
41 author = {Xia, Eryu}, 108 author = {Xia, Eryu},
43 title = {SpoTyping}, 110 title = {SpoTyping},
44 publisher = {GitHub}, 111 publisher = {GitHub},
45 journal = {GitHub repository}, 112 journal = {GitHub repository},
46 url = {https://github.com/xiaeryu/SpoTyping}, 113 url = {https://github.com/xiaeryu/SpoTyping},
47 }</citation> 114 }</citation>
115 <citation type="doi">10.1186/s13073-016-0270-7</citation>
48 </citations> 116 </citations>
49 </tool> 117 </tool>