annotate grinder-fa1fa683bcf1/grinder.xml @ 0:a41241d67693 default tip

Uploaded
author greg
date Wed, 18 Jan 2012 11:45:20 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
a41241d67693 Uploaded
greg
parents:
diff changeset
1 <tool id="grinder" name="Grinder" version="0.4.3">
a41241d67693 Uploaded
greg
parents:
diff changeset
2
a41241d67693 Uploaded
greg
parents:
diff changeset
3 <description>versatile omic shotgun and amplicon read simulator</description>
a41241d67693 Uploaded
greg
parents:
diff changeset
4
a41241d67693 Uploaded
greg
parents:
diff changeset
5 <requirements>
a41241d67693 Uploaded
greg
parents:
diff changeset
6 <requirement type="binary">grinder</requirement>
a41241d67693 Uploaded
greg
parents:
diff changeset
7 </requirements>
a41241d67693 Uploaded
greg
parents:
diff changeset
8
a41241d67693 Uploaded
greg
parents:
diff changeset
9 <version_string>grinder --version</version_string>
a41241d67693 Uploaded
greg
parents:
diff changeset
10
a41241d67693 Uploaded
greg
parents:
diff changeset
11 <command interpreter="python">
a41241d67693 Uploaded
greg
parents:
diff changeset
12 stderr_wrapper.py
a41241d67693 Uploaded
greg
parents:
diff changeset
13 grinder
a41241d67693 Uploaded
greg
parents:
diff changeset
14 #if $reference_file.specify == "builtin":
a41241d67693 Uploaded
greg
parents:
diff changeset
15 -reference_file ${ filter( lambda x: str( x[0] ) == str( $reference_file.value ), $__app__.tool_data_tables[ 'all_fasta' ].get_fields() )[0][-1] }
a41241d67693 Uploaded
greg
parents:
diff changeset
16 #else if $reference_file.specify == "uploaded":
a41241d67693 Uploaded
greg
parents:
diff changeset
17 -reference_file $reference_file.value
a41241d67693 Uploaded
greg
parents:
diff changeset
18 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
19 #if str($coverage_fold):
a41241d67693 Uploaded
greg
parents:
diff changeset
20 -coverage_fold $coverage_fold
a41241d67693 Uploaded
greg
parents:
diff changeset
21 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
22 #if str($total_reads):
a41241d67693 Uploaded
greg
parents:
diff changeset
23 -total_reads $total_reads
a41241d67693 Uploaded
greg
parents:
diff changeset
24 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
25 #if str($read_dist):
a41241d67693 Uploaded
greg
parents:
diff changeset
26 -read_dist $read_dist
a41241d67693 Uploaded
greg
parents:
diff changeset
27 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
28 #if str($insert_dist):
a41241d67693 Uploaded
greg
parents:
diff changeset
29 -insert_dist $insert_dist
a41241d67693 Uploaded
greg
parents:
diff changeset
30 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
31 #if str($mate_orientation):
a41241d67693 Uploaded
greg
parents:
diff changeset
32 -mate_orientation $mate_orientation
a41241d67693 Uploaded
greg
parents:
diff changeset
33 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
34 #if str($exclude_chars):
a41241d67693 Uploaded
greg
parents:
diff changeset
35 -exclude_chars $exclude_chars
a41241d67693 Uploaded
greg
parents:
diff changeset
36 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
37 #if str($delete_chars):
a41241d67693 Uploaded
greg
parents:
diff changeset
38 -delete_chars $delete_chars
a41241d67693 Uploaded
greg
parents:
diff changeset
39 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
40 #if str($forward_reverse) != "None":
a41241d67693 Uploaded
greg
parents:
diff changeset
41 -forward_reverse $forward_reverse
a41241d67693 Uploaded
greg
parents:
diff changeset
42 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
43 #if str($unidirectional):
a41241d67693 Uploaded
greg
parents:
diff changeset
44 -unidirectional $unidirectional
a41241d67693 Uploaded
greg
parents:
diff changeset
45 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
46 #if str($length_bias):
a41241d67693 Uploaded
greg
parents:
diff changeset
47 -length_bias $length_bias
a41241d67693 Uploaded
greg
parents:
diff changeset
48 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
49 #if str($copy_bias):
a41241d67693 Uploaded
greg
parents:
diff changeset
50 -copy_bias $copy_bias
a41241d67693 Uploaded
greg
parents:
diff changeset
51 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
52 #if str($mutation_dist):
a41241d67693 Uploaded
greg
parents:
diff changeset
53 -mutation_dist $mutation_dist
a41241d67693 Uploaded
greg
parents:
diff changeset
54 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
55 #if str($mutation_ratio):
a41241d67693 Uploaded
greg
parents:
diff changeset
56 -mutation_ratio $mutation_ratio
a41241d67693 Uploaded
greg
parents:
diff changeset
57 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
58 #if str($homopolymer_dist):
a41241d67693 Uploaded
greg
parents:
diff changeset
59 -homopolymer_dist $homopolymer_dist
a41241d67693 Uploaded
greg
parents:
diff changeset
60 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
61 #if str($chimera_perc):
a41241d67693 Uploaded
greg
parents:
diff changeset
62 -chimera_perc $chimera_perc
a41241d67693 Uploaded
greg
parents:
diff changeset
63 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
64 #if str($chimera_dist):
a41241d67693 Uploaded
greg
parents:
diff changeset
65 -chimera_dist $chimera_dist
a41241d67693 Uploaded
greg
parents:
diff changeset
66 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
67 #if str($chimera_kmer):
a41241d67693 Uploaded
greg
parents:
diff changeset
68 -chimera_kmer $chimera_kmer
a41241d67693 Uploaded
greg
parents:
diff changeset
69 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
70 #if str($abundance_file) != "None":
a41241d67693 Uploaded
greg
parents:
diff changeset
71 -abundance_file $abundance_file
a41241d67693 Uploaded
greg
parents:
diff changeset
72 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
73 #if str($abundance_model):
a41241d67693 Uploaded
greg
parents:
diff changeset
74 -abundance_model $abundance_model
a41241d67693 Uploaded
greg
parents:
diff changeset
75 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
76 #if str($num_libraries):
a41241d67693 Uploaded
greg
parents:
diff changeset
77 -num_libraries $num_libraries
a41241d67693 Uploaded
greg
parents:
diff changeset
78 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
79 #if str($multiplex_ids) != "None":
a41241d67693 Uploaded
greg
parents:
diff changeset
80 -multiplex_ids $multiplex_ids
a41241d67693 Uploaded
greg
parents:
diff changeset
81 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
82 #if str($diversity):
a41241d67693 Uploaded
greg
parents:
diff changeset
83 -diversity $diversity
a41241d67693 Uploaded
greg
parents:
diff changeset
84 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
85 #if str($shared_perc):
a41241d67693 Uploaded
greg
parents:
diff changeset
86 -shared_perc $shared_perc
a41241d67693 Uploaded
greg
parents:
diff changeset
87 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
88 #if str($permuted_perc):
a41241d67693 Uploaded
greg
parents:
diff changeset
89 -permuted_perc $permuted_perc
a41241d67693 Uploaded
greg
parents:
diff changeset
90 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
91 #if str($random_seed):
a41241d67693 Uploaded
greg
parents:
diff changeset
92 -random_seed $random_seed
a41241d67693 Uploaded
greg
parents:
diff changeset
93 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
94 #if str($permuted_perc):
a41241d67693 Uploaded
greg
parents:
diff changeset
95 -desc_track $desc_track
a41241d67693 Uploaded
greg
parents:
diff changeset
96 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
97 #if str($qual_levels):
a41241d67693 Uploaded
greg
parents:
diff changeset
98 -qual_levels $qual_levels
a41241d67693 Uploaded
greg
parents:
diff changeset
99 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
100 #if str($fastq_output) == '1':
a41241d67693 Uploaded
greg
parents:
diff changeset
101 -fastq_output $fastq_output
a41241d67693 Uploaded
greg
parents:
diff changeset
102 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
103 #if str($profile_file) != "None":
a41241d67693 Uploaded
greg
parents:
diff changeset
104 -profile_file $profile_file.value
a41241d67693 Uploaded
greg
parents:
diff changeset
105 #end if
a41241d67693 Uploaded
greg
parents:
diff changeset
106 <!-- When Galaxy bug #661 is resolved, then we can use the same method to check for all optional argument -->
a41241d67693 Uploaded
greg
parents:
diff changeset
107 <!-- i.e. either if str($param) != "None": or if str($param): -->
a41241d67693 Uploaded
greg
parents:
diff changeset
108 <!-- URL: https://bitbucket.org/galaxy/galaxy-central/issue/661/optional-arguments-problems#comment-655611 -->
a41241d67693 Uploaded
greg
parents:
diff changeset
109 </command>
a41241d67693 Uploaded
greg
parents:
diff changeset
110
a41241d67693 Uploaded
greg
parents:
diff changeset
111 <inputs>
a41241d67693 Uploaded
greg
parents:
diff changeset
112
a41241d67693 Uploaded
greg
parents:
diff changeset
113 <conditional name="reference_file">
a41241d67693 Uploaded
greg
parents:
diff changeset
114 <param name="specify" type="select" label="Specify">
a41241d67693 Uploaded
greg
parents:
diff changeset
115 <option value="builtin">Built-in file</option>
a41241d67693 Uploaded
greg
parents:
diff changeset
116 <option value="uploaded">Uploaded file</option>
a41241d67693 Uploaded
greg
parents:
diff changeset
117 </param>
a41241d67693 Uploaded
greg
parents:
diff changeset
118 <when value="builtin">
a41241d67693 Uploaded
greg
parents:
diff changeset
119 <param name="value" type="select" label="Reference sequences (genomes, genes, transcripts, proteins)" help="Galaxy built-in FASTA file">
a41241d67693 Uploaded
greg
parents:
diff changeset
120 <options from_data_table="all_fasta" />
a41241d67693 Uploaded
greg
parents:
diff changeset
121 </param>
a41241d67693 Uploaded
greg
parents:
diff changeset
122 </when>
a41241d67693 Uploaded
greg
parents:
diff changeset
123 <when value="uploaded">
a41241d67693 Uploaded
greg
parents:
diff changeset
124 <param name="value" type="data" format="fasta" label="Reference sequences" help="FASTA file that contains the input reference sequences" />
a41241d67693 Uploaded
greg
parents:
diff changeset
125 </when>
a41241d67693 Uploaded
greg
parents:
diff changeset
126 </conditional>
a41241d67693 Uploaded
greg
parents:
diff changeset
127
a41241d67693 Uploaded
greg
parents:
diff changeset
128 <param name="total_reads" type="text" value="100" optional="true" label="Number of reads" help="Number of shotgun or amplicon reads to generate for each library. Do not specify this if you specify the fold coverage." />
a41241d67693 Uploaded
greg
parents:
diff changeset
129
a41241d67693 Uploaded
greg
parents:
diff changeset
130 <param name="coverage_fold" type="text" optional="true" label="Coverage fold" help="Desired fold coverage of the input reference sequences (the output FASTA length divided by the input FASTA length). Do not specify this if you specify the number of reads directly." />
a41241d67693 Uploaded
greg
parents:
diff changeset
131
a41241d67693 Uploaded
greg
parents:
diff changeset
132 <param name="read_dist" type="text" value="100" optional="true" label="Sequence length distribution" help="Desired sequence length distribution specified as:
a41241d67693 Uploaded
greg
parents:
diff changeset
133 average length, distribution ('uniform' or 'normal') and standard deviation
a41241d67693 Uploaded
greg
parents:
diff changeset
134 Only the first element is required.
a41241d67693 Uploaded
greg
parents:
diff changeset
135 Examples:
a41241d67693 Uploaded
greg
parents:
diff changeset
136 1/ All reads exactly 101 bp long (Illumina GA 2x): 101
a41241d67693 Uploaded
greg
parents:
diff changeset
137 2/ Uniform read distribution around 100+-10 bp: 100 uniform 10
a41241d67693 Uploaded
greg
parents:
diff changeset
138 3/ Reads normally distributed with an average of 800 and a standard deviation
a41241d67693 Uploaded
greg
parents:
diff changeset
139 of 100 bp (Sanger reads): 800 normal 100
a41241d67693 Uploaded
greg
parents:
diff changeset
140 4/ Reads normally distributed with an average of 450 and a standard deviation
a41241d67693 Uploaded
greg
parents:
diff changeset
141 of 50 bp (454 GS-FLX Ti): 450 normal 50
a41241d67693 Uploaded
greg
parents:
diff changeset
142 Reference sequences smaller than the specified read length are not used." />
a41241d67693 Uploaded
greg
parents:
diff changeset
143
a41241d67693 Uploaded
greg
parents:
diff changeset
144 <param name="insert_dist" type="text" value="0" optional="true" label="Insert size distribution" help="Create paired-end or mate-pair reads spanning the given insert length. Important: the insert is defined in the biological sense, i.e. its length includes the length of both reads and of the stretch of DNA between them:
a41241d67693 Uploaded
greg
parents:
diff changeset
145 0 : off,
a41241d67693 Uploaded
greg
parents:
diff changeset
146 or: insert size distribution in bp, in the same format as the read length
a41241d67693 Uploaded
greg
parents:
diff changeset
147 distribution (a typical value is 2,500 bp)
a41241d67693 Uploaded
greg
parents:
diff changeset
148 Two distinct reads are generated whether or not the mate pair overlaps." />
a41241d67693 Uploaded
greg
parents:
diff changeset
149
a41241d67693 Uploaded
greg
parents:
diff changeset
150 <param name="mate_orientation" type="text" value="FR" optional="true" label="Mate orientation" help="When generating paired-end or mate-pair reads (see the insert distribution parameter), specify the orientation of the reads (F: forward, R: reverse): FR for Sanger or Illumina paired-end, FF for 454, RF for Illumina mate-pairs, or RR" />
a41241d67693 Uploaded
greg
parents:
diff changeset
151
a41241d67693 Uploaded
greg
parents:
diff changeset
152 <param name="exclude_chars" type="text" optional="true" label="Characters to exclude" help="Do not create reads containing any of the specified characters (case insensitive), e.g. 'N-' to prevent reads with gaps (-) or ambiguities (N)." />
a41241d67693 Uploaded
greg
parents:
diff changeset
153
a41241d67693 Uploaded
greg
parents:
diff changeset
154 <param name="delete_chars" type="text" optional="true" label="Characters to delete" help="Remove the specified characters from the reference sequences (case insensitive), e.g. 'N-' to remove gaps (-) and ambiguities (N)." />
a41241d67693 Uploaded
greg
parents:
diff changeset
155
a41241d67693 Uploaded
greg
parents:
diff changeset
156 <param name="forward_reverse" type="data" format="fasta" optional="true" label="Amplicon primers" help="Use DNA amplicon sequencing using a forward and reverse PCR primer sequence provided in a FASTA file. The primer sequences should use the IUPAC convention for degenerate residues and the reference sequences that that do not match the specified primers are excluded. If your reference sequences are full genomes, it is recommended to turn the copy number bias option on and the length bias option off reads. To sequence from the forward strand, set the sequencing direction option to 1 and put the forward primer first and reverse primer second in the FASTA file. To sequence from the reverse strand, invert the primers in the FASTA file and use -1 for the sequencing direction option. The second primer sequence in the FASTA file is always optional. Example: AAACTYAAAKGAATTGRCGG and ACGGGCGGTGTGTRC for the 926F and 1392R primers that target the V6 to V9 region of the 16S rRNA gene." />
a41241d67693 Uploaded
greg
parents:
diff changeset
157
a41241d67693 Uploaded
greg
parents:
diff changeset
158 <param name="unidirectional" type="select" display="radio" value="0" label="Sequencing direction" help="Instead of producing reads bidirectionally, from the reference strand and its reverse complement, proceed unidirectionally, from one strand only (forward or reverse). Values: 0 (off, i.e. bidirectional), 1 (forward), -1 (reverse). Use the value 1 for strand specific transcriptomic or proteomic datasets.">
a41241d67693 Uploaded
greg
parents:
diff changeset
159 <option value="0">both strands</option>
a41241d67693 Uploaded
greg
parents:
diff changeset
160 <option value="1">forward strand only</option>
a41241d67693 Uploaded
greg
parents:
diff changeset
161 <option value="-1">reverse strand only</option>
a41241d67693 Uploaded
greg
parents:
diff changeset
162 </param>
a41241d67693 Uploaded
greg
parents:
diff changeset
163
a41241d67693 Uploaded
greg
parents:
diff changeset
164 <param name="length_bias" type="boolean" truevalue="1" falsevalue="0" checked="true" label="Length bias" help="In shotgun libraries, sample reference sequences proportionally to their length. For example, in simulated microbial datasets, this means that at the same relative abundance, larger genomes contribute more reads than smaller genomes. 0 = no, 1 = yes." />
a41241d67693 Uploaded
greg
parents:
diff changeset
165
a41241d67693 Uploaded
greg
parents:
diff changeset
166 <param name="copy_bias" type="boolean" truevalue="1" falsevalue="0" checked="true" label="Copy number bias" help="In amplicon libraries where full genomes are used as input, sample species proportionally to the number of copies of the target gene: at equal relative abundance, genomes that have multiple copies of the target gene contribute more amplicon reads than genomes that have a single copy. 0 = no, 1 = yes." />
a41241d67693 Uploaded
greg
parents:
diff changeset
167
a41241d67693 Uploaded
greg
parents:
diff changeset
168 <param name="mutation_dist" type="text" value="0" optional="true" label="Mutation distribution" help="Introduce sequencing errors in the reads, under the form of mutations (substitutions, insertions and deletions) at positions that follow a specified distribution (with replacement): model (uniform, linear, poly4), model parameters. For example, for a uniform 0.1% error rate, use: uniform 0.1. To simulate Sanger errors, use a linear model where the errror rate is 1% at the 5' end of reads and 2% at the 3' end: linear 1 2. To model Illumina errors using the 4th degree polynome 3e-3 + 3.3e-8 * i^4 (Korbel et al 2009), use: poly4 3e-3 3.3e-8. Use the mutation ratio option to alter how many of these mutations are substitutions
a41241d67693 Uploaded
greg
parents:
diff changeset
169 or indels." />
a41241d67693 Uploaded
greg
parents:
diff changeset
170
a41241d67693 Uploaded
greg
parents:
diff changeset
171 <param name="mutation_ratio" type="text" value="80 20" optional="true" label="Mutation ratio" help="Indicate the percentage of substitutions and the number of indels (insertions and deletions). For example, use '80 20' (4 substitutions for each indel) for Sanger reads. Note that this parameter has no effect unless you specify the mutation distribution option." />
a41241d67693 Uploaded
greg
parents:
diff changeset
172
a41241d67693 Uploaded
greg
parents:
diff changeset
173 <param name="homopolymer_dist" type="text" value="0" optional="true" label="Homopolymer distribution" help="Introduce sequencing errors in the reads under the form of homopolymeric stretches (e.g. AAA, CCCCC) using a specified model where the homopolymer length
a41241d67693 Uploaded
greg
parents:
diff changeset
174 follows a normal distribution N(mean, standard deviation) that is function of
a41241d67693 Uploaded
greg
parents:
diff changeset
175 the homopolymer length n.
a41241d67693 Uploaded
greg
parents:
diff changeset
176 Margulies: N(n, 0.15 * n), Margulies et al. 2005.
a41241d67693 Uploaded
greg
parents:
diff changeset
177 Richter: N(n, 0.15 * sqrt(n)), Richter et al. 2008.
a41241d67693 Uploaded
greg
parents:
diff changeset
178 Balzer: N(n, 0.03494 + n * 0.06856), Balzer et al. 2010." />
a41241d67693 Uploaded
greg
parents:
diff changeset
179
a41241d67693 Uploaded
greg
parents:
diff changeset
180 <param name="chimera_perc" type="text" value="0" optional="true" label="Percentage of chimeras" help="Specify the percent of reads in amplicon libraries that should be chimeric sequences. The 'reference' field in the description of chimeric reads will
a41241d67693 Uploaded
greg
parents:
diff changeset
181 contain the ID of all the reference sequences forming the chimeric template. A typical value is 10%." />
a41241d67693 Uploaded
greg
parents:
diff changeset
182
a41241d67693 Uploaded
greg
parents:
diff changeset
183 <param name="chimera_dist" type="text" value="314 38 1" optional="true" label="Multimera distribution" help="Specify the distribution of chimeras: bimeras, trimeras, quadrameras and multimeras of higher order. The default is the average values from Quince et al. 2011: '314 38 1', which corresponds to 89% of bimeras, 11% of trimeras and 0.3% of quadrameras. Note that this option only takes effect when you request the generation of chimeras with the chimera percentage option." />
a41241d67693 Uploaded
greg
parents:
diff changeset
184
a41241d67693 Uploaded
greg
parents:
diff changeset
185 <param name="chimera_kmer" type="text" value="10" optional="true" label="k-mer based chimeras" help="Activate a method to form chimeras by picking breakpoints at places where k-mers are shared between sequences. The value to provide to this option represents k, the length of the k-mers (in bp). The longer the kmer, the more similar the sequences have to be to be eligible to form chimeras. The more frequent a k-mer is in the pool of reference sequences (taking into account their relative abundance), the more often this k-mer will be chosen. For example, CHSIM (Edgar et al. 2011) uses a k-mer length of 10 bp. If you do not want to use k-mer information to form chimeras, use 0, which will result in the reference sequences and breakpoints to be taken randomly. Note that this option only takes effect when you request the generation of chimeras with the chimera percentage option." />
a41241d67693 Uploaded
greg
parents:
diff changeset
186
a41241d67693 Uploaded
greg
parents:
diff changeset
187 <param name="abundance_file" type="data" format="tabular" optional="true" label="Abundance file" help="Specify the relative abundance of the reference sequencse manually in an input file. Each line of the file should contain a sequence name and its relative abundance (%), e.g. 'seqABC 82.1' or 'seqABC 82.1 10.2' if you are specifying two different libraries." />
a41241d67693 Uploaded
greg
parents:
diff changeset
188
a41241d67693 Uploaded
greg
parents:
diff changeset
189 <param name="abundance_model" type="text" value="uniform 1" optional="true" label="Rank abundance model" help="Relative abundance model for the input reference sequences: uniform, linear, powerlaw, logarithmic or exponential. The uniform and linear models do not require a parameter, but the other models take a parameter in the range [0, infinity). If this parameter is not specified, then it is randomly chosen. Examples:
a41241d67693 Uploaded
greg
parents:
diff changeset
190
a41241d67693 Uploaded
greg
parents:
diff changeset
191 uniform distribution: uniform
a41241d67693 Uploaded
greg
parents:
diff changeset
192 powerlaw distribution with parameter 0.1: powerlaw 0.1
a41241d67693 Uploaded
greg
parents:
diff changeset
193 exponential distribution with automatically chosen parameter: exponential" />
a41241d67693 Uploaded
greg
parents:
diff changeset
194
a41241d67693 Uploaded
greg
parents:
diff changeset
195 <param name="num_libraries" type="text" value="1" optional="true" label="Number of libraries" help="Number of independent libraries to create. Specify how diverse and similar they should be using the diversity, shared percent and permuted percent options. Assign them different MID tags with the multiplex mids option. Note that in Galaxy, the maximum number of libraries is 10." />
a41241d67693 Uploaded
greg
parents:
diff changeset
196
a41241d67693 Uploaded
greg
parents:
diff changeset
197 <param name="multiplex_ids" type="data" format="fasta" optional="true" label="Specify MID tags file" help="Specify an optional FASTA file that contains sequence identifiers (a.k.a MIDs or barcodes) to add to the sequences (one sequence per library)."/>
a41241d67693 Uploaded
greg
parents:
diff changeset
198
a41241d67693 Uploaded
greg
parents:
diff changeset
199 <!-- When Galaxy bug #661 is resolved, then we can really have optional parameters of type "integer" or "float" -->
a41241d67693 Uploaded
greg
parents:
diff changeset
200 <!-- URL: https://bitbucket.org/galaxy/galaxy-central/issue/661/optional-arguments-problems#comment-655611 -->
a41241d67693 Uploaded
greg
parents:
diff changeset
201 <!-- Affected params: diversity (int), shared_perc (float), permuted_perc (float), random_seed (int), num_libraries (int), chimera_perc (float) -->
a41241d67693 Uploaded
greg
parents:
diff changeset
202 <param name="diversity" type="text" optional="true" label="Diversity (richness)" help="Richness, or number of reference sequences to include in the shotgun libraries. Use 0 for the maximum diversity possible (based on the number of reference sequences
a41241d67693 Uploaded
greg
parents:
diff changeset
203 available). Provide one value to make all libraries have the same diversity, or one diversity value per library otherwise." />
a41241d67693 Uploaded
greg
parents:
diff changeset
204
a41241d67693 Uploaded
greg
parents:
diff changeset
205 <param name="shared_perc" type="text" value="0" optional="true" label="Percent shared" help="For multiple libraries, percent of reference sequences they should have in common (relative to the diversity of the least diverse library)." />
a41241d67693 Uploaded
greg
parents:
diff changeset
206
a41241d67693 Uploaded
greg
parents:
diff changeset
207 <param name="permuted_perc" type="text" value="0" optional="true" label="Percent permuted" help="For multiple libraries, percent of the most-abundant reference sequences to permute in rank-abundance." />
a41241d67693 Uploaded
greg
parents:
diff changeset
208
a41241d67693 Uploaded
greg
parents:
diff changeset
209 <param name="random_seed" type="text" optional="true" label="Random seed" help="Seed number to use for the pseudo-random number generator." />
a41241d67693 Uploaded
greg
parents:
diff changeset
210
a41241d67693 Uploaded
greg
parents:
diff changeset
211 <param name="desc_track" type="boolean" truevalue="1" falsevalue="0" checked="true" label="Read tracking" help="Track read information (reference sequence, position, errors, ...) by writing it in the FASTA read description." />
a41241d67693 Uploaded
greg
parents:
diff changeset
212
a41241d67693 Uploaded
greg
parents:
diff changeset
213 <param name="qual_levels" type="text" optional="true" label="Quality score levels" help="Generate basic quality scores for the simulated reads. Good residues are given a specified good score (e.g. 30) and residues that are the result of an insertion or substitution are given a specified bad score (e.g. 10). Specify first the good score and then the bad score, e.g. '30 10'" />
a41241d67693 Uploaded
greg
parents:
diff changeset
214
a41241d67693 Uploaded
greg
parents:
diff changeset
215 <param name="fastq_output" type="boolean" truevalue="1" falsevalue="0" checked="false" label="FASTQ output" help="
a41241d67693 Uploaded
greg
parents:
diff changeset
216 Write the generated reads in FASTQ format (Sanger variant) instead of FASTA and
a41241d67693 Uploaded
greg
parents:
diff changeset
217 QUAL. Quality score levels need to be specified for this option to be effective." />
a41241d67693 Uploaded
greg
parents:
diff changeset
218
a41241d67693 Uploaded
greg
parents:
diff changeset
219 <param name="profile_file" type="data" format="txt" optional="true" label="Profile file" help="A file that contains Grinder arguments. This is useful if you use many options or often use the same options. Lines with comments (#) are ignored. Consider the profile file, 'simple_profile.txt':
a41241d67693 Uploaded
greg
parents:
diff changeset
220
a41241d67693 Uploaded
greg
parents:
diff changeset
221 # A simple Grinder profile
a41241d67693 Uploaded
greg
parents:
diff changeset
222 -read_dist 105 normal 12
a41241d67693 Uploaded
greg
parents:
diff changeset
223 -total_reads 1000
a41241d67693 Uploaded
greg
parents:
diff changeset
224
a41241d67693 Uploaded
greg
parents:
diff changeset
225 Running: grinder -reference_file viral_genomes.fa -profile_file simple_profile.txt
a41241d67693 Uploaded
greg
parents:
diff changeset
226
a41241d67693 Uploaded
greg
parents:
diff changeset
227 Translates into: grinder -reference_file viral_genomes.fa -read_dist 105 normal 12 -total_reads 1000
a41241d67693 Uploaded
greg
parents:
diff changeset
228
a41241d67693 Uploaded
greg
parents:
diff changeset
229 Note that the arguments specified in the profile should not be specified again on the command line." />
a41241d67693 Uploaded
greg
parents:
diff changeset
230
a41241d67693 Uploaded
greg
parents:
diff changeset
231 </inputs>
a41241d67693 Uploaded
greg
parents:
diff changeset
232
a41241d67693 Uploaded
greg
parents:
diff changeset
233
a41241d67693 Uploaded
greg
parents:
diff changeset
234 <outputs>
a41241d67693 Uploaded
greg
parents:
diff changeset
235
a41241d67693 Uploaded
greg
parents:
diff changeset
236 <!-- single library output -->
a41241d67693 Uploaded
greg
parents:
diff changeset
237 <data format="tabular" name="ranks" from_work_dir="grinder-ranks.txt" label="${tool.name} ranks from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
238 <filter>int(str(num_libraries)) == 1</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
239 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
240 <data format="fasta" name="fasta" from_work_dir="grinder-reads.fa" label="${tool.name} reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
241 <filter>int(str(num_libraries)) == 1 and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
242 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
243 <data format="qual" name="qual" from_work_dir="grinder-reads.qual" label="${tool.name} quals from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
244 <filter>int(str(num_libraries)) == 1 and str(qual_levels) and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
245 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
246 <data format="fastqsanger" name="fastq" from_work_dir="grinder-reads.fastq" label="${tool.name} reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
247 <filter>int(str(num_libraries)) == 1 and fastq_output == 1</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
248 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
249
a41241d67693 Uploaded
greg
parents:
diff changeset
250 <!-- When Galaxy bug #670 is resolved, then we won't have to harcode the number of output datasets -->
a41241d67693 Uploaded
greg
parents:
diff changeset
251 <!-- URL: https://bitbucket.org/galaxy/galaxy-central/issue/670/better-support-for-multiple-outputs -->
a41241d67693 Uploaded
greg
parents:
diff changeset
252
a41241d67693 Uploaded
greg
parents:
diff changeset
253 <!-- multiple libraries: library 1 -->
a41241d67693 Uploaded
greg
parents:
diff changeset
254 <data format="tabular" name="ranks1" from_work_dir="grinder-1-ranks.txt" label="${tool.name} lib 1 ranks from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
255 <filter>int(str(num_libraries)) >= 2</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
256 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
257 <data format="fasta" name="fasta1" from_work_dir="grinder-1-reads.fa" label="${tool.name} lib 1 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
258 <filter>int(str(num_libraries)) >= 2 and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
259 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
260 <data format="qual" name="qual1" from_work_dir="grinder-1-reads.qual" label="${tool.name} lib 1 quals from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
261 <filter>int(str(num_libraries)) >= 2 and str(qual_levels) and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
262 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
263 <data format="fastqsanger" name="fastq1" from_work_dir="grinder-1-reads.fastq" label="${tool.name} lib 1 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
264 <filter>int(str(num_libraries)) >= 2 and fastq_output == 1</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
265 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
266
a41241d67693 Uploaded
greg
parents:
diff changeset
267 <!-- multiple libraries: library 2 -->
a41241d67693 Uploaded
greg
parents:
diff changeset
268 <data format="tabular" name="ranks2" from_work_dir="grinder-2-ranks.txt" label="${tool.name} lib 2 ranks from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
269 <filter>int(str(num_libraries)) >= 2</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
270 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
271 <data format="fasta" name="fasta2" from_work_dir="grinder-2-reads.fa" label="${tool.name} lib 2 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
272 <filter>int(str(num_libraries)) >= 2 and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
273 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
274 <data format="qual" name="qual2" from_work_dir="grinder-2-reads.qual" label="${tool.name} lib 2 quals from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
275 <filter>int(str(num_libraries)) >= 2 and str(qual_levels) and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
276 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
277 <data format="fastqsanger" name="fastq2" from_work_dir="grinder-2-reads.fastq" label="${tool.name} lib 2 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
278 <filter>int(str(num_libraries)) >= 2 and fastq_output == 1</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
279 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
280
a41241d67693 Uploaded
greg
parents:
diff changeset
281 <!-- multiple libraries: library 3 -->
a41241d67693 Uploaded
greg
parents:
diff changeset
282 <data format="tabular" name="ranks3" from_work_dir="grinder-3-ranks.txt" label="${tool.name} lib 3 ranks from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
283 <filter>int(str(num_libraries)) >= 3</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
284 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
285 <data format="fasta" name="fasta3" from_work_dir="grinder-3-reads.fa" label="${tool.name} lib 3 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
286 <filter>int(str(num_libraries)) >= 3 and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
287 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
288 <data format="qual" name="qual3" from_work_dir="grinder-3-reads.qual" label="${tool.name} lib 3 quals from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
289 <filter>int(str(num_libraries)) >= 3 and str(qual_levels) and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
290 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
291 <data format="fastqsanger" name="fastq3" from_work_dir="grinder-3-reads.fastq" label="${tool.name} lib 3 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
292 <filter>int(str(num_libraries)) >= 3 and fastq_output == 1</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
293 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
294
a41241d67693 Uploaded
greg
parents:
diff changeset
295 <!-- multiple libraries: library 4 -->
a41241d67693 Uploaded
greg
parents:
diff changeset
296 <data format="tabular" name="ranks4" from_work_dir="grinder-4-ranks.txt" label="${tool.name} lib 4 ranks from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
297 <filter>int(str(num_libraries)) >= 4</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
298 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
299 <data format="fasta" name="fasta4" from_work_dir="grinder-4-reads.fa" label="${tool.name} lib 4 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
300 <filter>int(str(num_libraries)) >= 4 and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
301 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
302 <data format="qual" name="qual4" from_work_dir="grinder-4-reads.qual" label="${tool.name} lib 4 quals from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
303 <filter>int(str(num_libraries)) >= 4 and str(qual_levels) and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
304 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
305 <data format="fastqsanger" name="fastq4" from_work_dir="grinder-4-reads.fastq" label="${tool.name} lib 4 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
306 <filter>int(str(num_libraries)) >= 4 and fastq_output == 1</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
307 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
308
a41241d67693 Uploaded
greg
parents:
diff changeset
309 <!-- multiple libraries: library 5 -->
a41241d67693 Uploaded
greg
parents:
diff changeset
310 <data format="tabular" name="ranks5" from_work_dir="grinder-5-ranks.txt" label="${tool.name} lib 5 ranks from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
311 <filter>int(str(num_libraries)) >= 5</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
312 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
313 <data format="fasta" name="fasta5" from_work_dir="grinder-5-reads.fa" label="${tool.name} lib 5 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
314 <filter>int(str(num_libraries)) >= 5 and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
315 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
316 <data format="qual" name="qual5" from_work_dir="grinder-5-reads.qual" label="${tool.name} lib 5 quals from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
317 <filter>int(str(num_libraries)) >= 5 and str(qual_levels) and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
318 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
319 <data format="fastqsanger" name="fastq5" from_work_dir="grinder-5-reads.fastq" label="${tool.name} lib 5 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
320 <filter>int(str(num_libraries)) >= 5 and fastq_output == 1</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
321 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
322
a41241d67693 Uploaded
greg
parents:
diff changeset
323 <!-- multiple libraries: library 6 -->
a41241d67693 Uploaded
greg
parents:
diff changeset
324 <data format="tabular" name="ranks6" from_work_dir="grinder-6-ranks.txt" label="${tool.name} lib 6 ranks from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
325 <filter>int(str(num_libraries)) >= 6</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
326 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
327 <data format="fasta" name="fasta6" from_work_dir="grinder-6-reads.fa" label="${tool.name} lib 6 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
328 <filter>int(str(num_libraries)) >= 6 and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
329 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
330 <data format="qual" name="qual6" from_work_dir="grinder-6-reads.qual" label="${tool.name} lib 6 quals from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
331 <filter>int(str(num_libraries)) >= 6 and str(qual_levels) and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
332 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
333 <data format="fastqsanger" name="fastq6" from_work_dir="grinder-6-reads.fastq" label="${tool.name} lib 6 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
334 <filter>int(str(num_libraries)) >= 6 and fastq_output == 1</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
335 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
336
a41241d67693 Uploaded
greg
parents:
diff changeset
337 <!-- multiple libraries: library 7 -->
a41241d67693 Uploaded
greg
parents:
diff changeset
338 <data format="tabular" name="ranks7" from_work_dir="grinder-7-ranks.txt" label="${tool.name} lib 7 ranks from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
339 <filter>int(str(num_libraries)) >= 7</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
340 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
341 <data format="fasta" name="fasta7" from_work_dir="grinder-7-reads.fa" label="${tool.name} lib 7 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
342 <filter>int(str(num_libraries)) >= 7 and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
343 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
344 <data format="qual" name="qual7" from_work_dir="grinder-7-reads.qual" label="${tool.name} lib 7 quals from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
345 <filter>int(str(num_libraries)) >= 7 and str(qual_levels) and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
346 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
347 <data format="fastqsanger" name="fastq7" from_work_dir="grinder-7-reads.fastq" label="${tool.name} lib 7 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
348 <filter>int(str(num_libraries)) >= 7 and fastq_output == 1</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
349 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
350
a41241d67693 Uploaded
greg
parents:
diff changeset
351 <!-- multiple libraries: library 8 -->
a41241d67693 Uploaded
greg
parents:
diff changeset
352 <data format="tabular" name="ranks8" from_work_dir="grinder-8-ranks.txt" label="${tool.name} lib 8 ranks from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
353 <filter>int(str(num_libraries)) >= 8</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
354 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
355 <data format="fasta" name="fasta8" from_work_dir="grinder-8-reads.fa" label="${tool.name} lib 8 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
356 <filter>int(str(num_libraries)) >= 8 and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
357 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
358 <data format="qual" name="qual8" from_work_dir="grinder-8-reads.qual" label="${tool.name} lib 8 quals from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
359 <filter>int(str(num_libraries)) >= 8 and str(qual_levels) and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
360 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
361 <data format="fastqsanger" name="fastq8" from_work_dir="grinder-8-reads.fastq" label="${tool.name} lib 8 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
362 <filter>int(str(num_libraries)) >= 8 and fastq_output == 1</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
363 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
364
a41241d67693 Uploaded
greg
parents:
diff changeset
365 <!-- multiple libraries: library 9 -->
a41241d67693 Uploaded
greg
parents:
diff changeset
366 <data format="tabular" name="ranks9" from_work_dir="grinder-9-ranks.txt" label="${tool.name} lib 9 ranks from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
367 <filter>int(str(num_libraries)) >= 9</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
368 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
369 <data format="fasta" name="fasta9" from_work_dir="grinder-9-reads.fa" label="${tool.name} lib 9 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
370 <filter>int(str(num_libraries)) >= 9 and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
371 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
372 <data format="qual" name="qual9" from_work_dir="grinder-9-reads.qual" label="${tool.name} lib 9 quals from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
373 <filter>int(str(num_libraries)) >= 9 and str(qual_levels) and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
374 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
375 <data format="fastqsanger" name="fastq9" from_work_dir="grinder-9-reads.fastq" label="${tool.name} lib 9 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
376 <filter>int(str(num_libraries)) >= 9 and fastq_output == 1</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
377 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
378
a41241d67693 Uploaded
greg
parents:
diff changeset
379 <!-- multiple libraries: library 10 -->
a41241d67693 Uploaded
greg
parents:
diff changeset
380 <data format="tabular" name="ranks10" from_work_dir="grinder-10-ranks.txt" label="${tool.name} lib 10 ranks from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
381 <filter>int(str(num_libraries)) >= 10</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
382 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
383 <data format="fasta" name="fasta10" from_work_dir="grinder-10-reads.fa" label="${tool.name} lib 10 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
384 <filter>int(str(num_libraries)) >= 10 and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
385 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
386 <data format="qual" name="qual10" from_work_dir="grinder-10-reads.qual" label="${tool.name} lib 10 quals from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
387 <filter>int(str(num_libraries)) >= 10 and str(qual_levels) and fastq_output == 0</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
388 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
389 <data format="fastqsanger" name="fastq10" from_work_dir="grinder-10-reads.fastq" label="${tool.name} lib 10 reads from ${on_string}">
a41241d67693 Uploaded
greg
parents:
diff changeset
390 <filter>int(str(num_libraries)) >= 10 and fastq_output == 1</filter>
a41241d67693 Uploaded
greg
parents:
diff changeset
391 </data>
a41241d67693 Uploaded
greg
parents:
diff changeset
392
a41241d67693 Uploaded
greg
parents:
diff changeset
393 </outputs>
a41241d67693 Uploaded
greg
parents:
diff changeset
394
a41241d67693 Uploaded
greg
parents:
diff changeset
395 <tests>
a41241d67693 Uploaded
greg
parents:
diff changeset
396 <!-- no tests since they would not not always return the same results -->
a41241d67693 Uploaded
greg
parents:
diff changeset
397 <!--
a41241d67693 Uploaded
greg
parents:
diff changeset
398 <test>
a41241d67693 Uploaded
greg
parents:
diff changeset
399 <param name="specify" value="uploaded" />
a41241d67693 Uploaded
greg
parents:
diff changeset
400 <param name="value" value="ngs_simulation_in1.fasta" ftype="fasta" />
a41241d67693 Uploaded
greg
parents:
diff changeset
401 <output name="ranks" file="" />
a41241d67693 Uploaded
greg
parents:
diff changeset
402 <output name="fasta" file="" />
a41241d67693 Uploaded
greg
parents:
diff changeset
403 <output name="qual" file="" />
a41241d67693 Uploaded
greg
parents:
diff changeset
404 </test>
a41241d67693 Uploaded
greg
parents:
diff changeset
405
a41241d67693 Uploaded
greg
parents:
diff changeset
406 <test>
a41241d67693 Uploaded
greg
parents:
diff changeset
407 <param name="specify" value="builtin" />
a41241d67693 Uploaded
greg
parents:
diff changeset
408 <param name="builtin" value="pUC18" />
a41241d67693 Uploaded
greg
parents:
diff changeset
409 <output name="ranks" file="" />
a41241d67693 Uploaded
greg
parents:
diff changeset
410 <output name="fasta" file="" />
a41241d67693 Uploaded
greg
parents:
diff changeset
411 <output name="qual" file="" />
a41241d67693 Uploaded
greg
parents:
diff changeset
412 </test>
a41241d67693 Uploaded
greg
parents:
diff changeset
413 -->
a41241d67693 Uploaded
greg
parents:
diff changeset
414 </tests>
a41241d67693 Uploaded
greg
parents:
diff changeset
415
a41241d67693 Uploaded
greg
parents:
diff changeset
416 <help>
a41241d67693 Uploaded
greg
parents:
diff changeset
417
a41241d67693 Uploaded
greg
parents:
diff changeset
418 **What it does**
a41241d67693 Uploaded
greg
parents:
diff changeset
419
a41241d67693 Uploaded
greg
parents:
diff changeset
420 Grinder is a program to create random shotgun and amplicon sequence libraries
a41241d67693 Uploaded
greg
parents:
diff changeset
421 based on reference sequences in a FASTA file. Features include:
a41241d67693 Uploaded
greg
parents:
diff changeset
422
a41241d67693 Uploaded
greg
parents:
diff changeset
423 * omic support: genomic, metagenomic, transcriptomic, metatranscriptomic,
a41241d67693 Uploaded
greg
parents:
diff changeset
424 proteomic and metaproteomic
a41241d67693 Uploaded
greg
parents:
diff changeset
425 * shotgun library or amplicon library
a41241d67693 Uploaded
greg
parents:
diff changeset
426 * arbitrary read length distribution and number of reads
a41241d67693 Uploaded
greg
parents:
diff changeset
427 * simulation of PCR and sequencing errors (chimeras, point mutations, homopolymers)
a41241d67693 Uploaded
greg
parents:
diff changeset
428 * support for creating paired-end (mate pair) datasets
a41241d67693 Uploaded
greg
parents:
diff changeset
429 * specific rank-abundance settings or manually given abundance for each genome
a41241d67693 Uploaded
greg
parents:
diff changeset
430 * creation of datasets with a given richness (alpha diversity)
a41241d67693 Uploaded
greg
parents:
diff changeset
431 * independent datasets can share a variable number of genomes (beta diversity)
a41241d67693 Uploaded
greg
parents:
diff changeset
432 * modeling of the bias created by varying genome lengths or gene copy number
a41241d67693 Uploaded
greg
parents:
diff changeset
433 * profile mechanism to store preferred options
a41241d67693 Uploaded
greg
parents:
diff changeset
434 * API to automate the creation of a large number of simulated datasets
a41241d67693 Uploaded
greg
parents:
diff changeset
435
a41241d67693 Uploaded
greg
parents:
diff changeset
436
a41241d67693 Uploaded
greg
parents:
diff changeset
437 **Input**
a41241d67693 Uploaded
greg
parents:
diff changeset
438
a41241d67693 Uploaded
greg
parents:
diff changeset
439 A variety of FASTA databases containing genes or genomes can be used as input
a41241d67693 Uploaded
greg
parents:
diff changeset
440 for Grinder, such as the NCBI RefSeq collection (ftp://ftp.ncbi.nih.gov/refseq/release/microbial/),
a41241d67693 Uploaded
greg
parents:
diff changeset
441 the GreenGenes 16S rRNA database (http://greengenes.lbl.gov/Download/Sequence_Data/Fasta_data_files/Isolated_named_strains_16S_aligned.fasta), the human genome and transcriptome (ftp://ftp.ncbi.nih.gov/refseq/H_sapiens/RefSeqGene/, ftp://ftp.ncbi.nih.gov/refseq/H_sapiens/mRNA_Prot/human.rna.fna.gz), ...
a41241d67693 Uploaded
greg
parents:
diff changeset
442
a41241d67693 Uploaded
greg
parents:
diff changeset
443 These input files can either be provided as a Galaxy dataset, or can be uploaded
a41241d67693 Uploaded
greg
parents:
diff changeset
444 by Galaxy users in their history.
a41241d67693 Uploaded
greg
parents:
diff changeset
445
a41241d67693 Uploaded
greg
parents:
diff changeset
446
a41241d67693 Uploaded
greg
parents:
diff changeset
447 **Output**
a41241d67693 Uploaded
greg
parents:
diff changeset
448
a41241d67693 Uploaded
greg
parents:
diff changeset
449 For each library requested, a first file contains the abundance of the species
a41241d67693 Uploaded
greg
parents:
diff changeset
450 in the simulated community created, e.g.::
a41241d67693 Uploaded
greg
parents:
diff changeset
451
a41241d67693 Uploaded
greg
parents:
diff changeset
452 # rank seqID rel. abundance
a41241d67693 Uploaded
greg
parents:
diff changeset
453 1 86715_Lachnospiraceae 0.367936925098555
a41241d67693 Uploaded
greg
parents:
diff changeset
454 2 6439_Neisseria_polysaccharea 0.183968462549277
a41241d67693 Uploaded
greg
parents:
diff changeset
455 3 103712_Fusobacterium_nucleatum 0.122645641699518
a41241d67693 Uploaded
greg
parents:
diff changeset
456 4 103024_Frigoribacterium 0.0919842312746386
a41241d67693 Uploaded
greg
parents:
diff changeset
457 5 129066_Streptococcus_pyogenes 0.0735873850197109
a41241d67693 Uploaded
greg
parents:
diff changeset
458 6 106485_Pseudomonas_aeruginosa 0.0613228208497591
a41241d67693 Uploaded
greg
parents:
diff changeset
459 7 13824_Veillonella_criceti 0.0525624178712221
a41241d67693 Uploaded
greg
parents:
diff changeset
460 8 28044_Lactosphaera 0.0459921156373193
a41241d67693 Uploaded
greg
parents:
diff changeset
461
a41241d67693 Uploaded
greg
parents:
diff changeset
462 The second file is a FASTA file containing shotgun or amplicon reads, e.g.::
a41241d67693 Uploaded
greg
parents:
diff changeset
463
a41241d67693 Uploaded
greg
parents:
diff changeset
464 >1 reference=13824_Veillonella_criceti position=89-1088 strand=+
a41241d67693 Uploaded
greg
parents:
diff changeset
465 ACCAACCTGCCCTTCAGAGGGGGATAACAACGGGAAACCGTTGCTAATACCGCGTACGAA
a41241d67693 Uploaded
greg
parents:
diff changeset
466 TGGACTTCGGCATCGGAGTTCATTGAAAGGTGGCCTCTATTTATAAGCTATCGCTGAAGG
a41241d67693 Uploaded
greg
parents:
diff changeset
467 AGGGGGTTGCGTCTGATTAGCTAGTTGGAGGGGTAATGGCCCACCAAGGCAA
a41241d67693 Uploaded
greg
parents:
diff changeset
468
a41241d67693 Uploaded
greg
parents:
diff changeset
469 >2 reference=103712_Fusobacterium_nucleatum position=2-1001 strand=+
a41241d67693 Uploaded
greg
parents:
diff changeset
470 TGAACGAAGAGTTTGATCCTGGCTCAGGATGAACGCTGACAGAATGCTTAACACATGCAA
a41241d67693 Uploaded
greg
parents:
diff changeset
471 GTCAACTTGAATTTGGGTTTTTAACTTAGGTTTGGG
a41241d67693 Uploaded
greg
parents:
diff changeset
472
a41241d67693 Uploaded
greg
parents:
diff changeset
473 If you specify the quality score levels option, a third file representing the
a41241d67693 Uploaded
greg
parents:
diff changeset
474 quality scores of the reads is created::
a41241d67693 Uploaded
greg
parents:
diff changeset
475
a41241d67693 Uploaded
greg
parents:
diff changeset
476 >1 reference=103712_Fusobacterium_nucleatum position=2-1001 strand=+
a41241d67693 Uploaded
greg
parents:
diff changeset
477 30 30 30 10 30 30 ...
a41241d67693 Uploaded
greg
parents:
diff changeset
478
a41241d67693 Uploaded
greg
parents:
diff changeset
479
a41241d67693 Uploaded
greg
parents:
diff changeset
480 </help>
a41241d67693 Uploaded
greg
parents:
diff changeset
481
a41241d67693 Uploaded
greg
parents:
diff changeset
482 </tool>
a41241d67693 Uploaded
greg
parents:
diff changeset
483