Mercurial > repos > computational-metabolomics > dimspy_align_samples
comparison align_samples.xml @ 0:49d20b18fc6a draft default tip
"planemo upload for repository https://github.com/computational-metabolomics/dimspy-galaxy commit 80069808371b58f45da0c8133c27d67ac1a5b448"
author | computational-metabolomics |
---|---|
date | Wed, 17 Feb 2021 10:51:22 +0000 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:49d20b18fc6a |
---|---|
1 <tool id="dimspy_align_samples" name="Align Samples" version="@TOOL_VERSION@+galaxy1"> | |
2 <description> - Align peaks across Peaklists</description> | |
3 <macros> | |
4 <import>macros.xml</import> | |
5 </macros> | |
6 <expand macro="requirements" /> | |
7 <command detect_errors="exit_code"> | |
8 <![CDATA[ | |
9 dimspy align-samples | |
10 --input '$hdf5_file_in' | |
11 --output '$hdf5_file_out' | |
12 #if $filelist | |
13 --filelist '$filelist' | |
14 #end if | |
15 --ppm $ppm | |
16 --ncpu \${GALAXY_SLOTS:-1} | |
17 --block-size $adv.block_size | |
18 #if $hdf5_to_txt.standard | |
19 && | |
20 @HDF5_PM_TO_TXT@ | |
21 #end if | |
22 #if $hdf5_to_txt.comprehensive | |
23 && | |
24 @HDF5_PM_TO_TXT_COMPREHENSIVE@ | |
25 #end if | |
26 ]]> | |
27 </command> | |
28 <inputs> | |
29 <param name="hdf5_file_in" argument="--input" type="data" format="h5" label="Peaklists (HDF5 file)" help="" /> | |
30 <param name="filelist" argument="--filelist" type="data" format="tsv,tabular" optional="true" label="Filelist / Samplelist" help="Only provide a filelist if you like to exclude Peaklists, update the metadata (e.g. classLabel), or if you have not provided a filelist for Process Scans or Replicate Filter." /> | |
31 <param name="ppm" argument="--ppm" type="float" value="2.0" label="Ppm error tolerance" help="Maximum tolerated m/z deviation across samples in parts per million (ppm)." /> | |
32 <param name="delimiter" argument="--delimiter" type="hidden" value="tab" /> | |
33 <expand macro="hdf5_pm_to_txt" /> | |
34 <section name="adv" title="Advanced options" expanded="False"> | |
35 <param name="block_size" argument="--block-size" type="integer" value="5000" label="Block size" help="The size of each block of peaks to perform clustering on." /> | |
36 </section> | |
37 </inputs> | |
38 <outputs> | |
39 <expand macro="outputs_peak_intensity_matrix" /> | |
40 </outputs> | |
41 <tests> | |
42 <test> | |
43 <param name="hdf5_file_in" value="pls_rf.h5" ftype="h5"/> | |
44 <param name="ppm" value="2.0"/> | |
45 <param name="delimiter" value="tab"/> | |
46 <conditional name="hdf5_to_txt" > | |
47 <param name="standard" value="True"/> | |
48 <param name="comprehensive" value="False"/> | |
49 <param name="samples_representations" value="rows"/> | |
50 <param name="matrix_attr" value="intensity"/> | |
51 </conditional> | |
52 <output name="hdf5_file_out" file="pm_as.h5" ftype="h5" compare="sim_size"/> | |
53 <output name="matrix_file_out" file="peak_matrix_as.txt" ftype="tsv"/> | |
54 </test> | |
55 <test> | |
56 <param name="hdf5_file_in" value="pls_rf.h5" ftype="h5"/> | |
57 <param name="ppm" value="2.0"/> | |
58 <param name="delimiter" value="tab"/> | |
59 <conditional name="hdf5_to_txt" > | |
60 <param name="standard" value="True"/> | |
61 <param name="comprehensive" value="False"/> | |
62 <param name="samples_representations" value="rows"/> | |
63 <param name="matrix_attr" value="intensity"/> | |
64 </conditional> | |
65 <section name="adv"> | |
66 <param name="block_size" value="10000"/> | |
67 </section> | |
68 <output name="hdf5_file_out" file="pm_as.h5" ftype="h5" compare="sim_size"/> | |
69 <output name="matrix_file_out" file="peak_matrix_as.txt" ftype="tsv"/> | |
70 </test> | |
71 <test> | |
72 <param name="hdf5_file_in" value="pls_rf.h5" ftype="h5"/> | |
73 <param name="ppm" value="2.0"/> | |
74 <param name="delimiter" value="tab"/> | |
75 <conditional name="hdf5_to_txt"> | |
76 <param name="standard" value="True"/> | |
77 <param name="comprehensive" value="False"/> | |
78 <param name="representation_samples" value="columns"/> | |
79 <param name="matrix_attr" value="intensity"/> | |
80 </conditional> | |
81 <output name="hdf5_file_out" file="pm_as.h5" ftype="h5" compare="sim_size"/> | |
82 <output name="matrix_file_out" file="peak_matrix_as_t.txt" ftype="tsv"/> | |
83 </test> | |
84 <test> | |
85 <param name="hdf5_file_in" value="pls_rf.h5" ftype="h5"/> | |
86 <param name="ppm" value="2.0"/> | |
87 <param name="delimiter" value="tab"/> | |
88 <conditional name="hdf5_to_txt"> | |
89 <param name="standard" value="True"/> | |
90 <param name="comprehensive" value="True"/> | |
91 <param name="samples_representations" value="rows"/> | |
92 <param name="matrix_attr" value="mz"/> | |
93 </conditional> | |
94 <output name="hdf5_file_out" file="pm_as.h5" ftype="h5" compare="sim_size"/> | |
95 <output name="matrix_file_out" file="peak_matrix_as_mz.txt" ftype="tsv"/> | |
96 <output name="matrix_comprehensive_file_out" file="peak_matrix_as_mz_compr.txt" ftype="tsv"/> | |
97 </test> | |
98 </tests> | |
99 <help> | |
100 ------------- | |
101 Align Samples | |
102 ------------- | |
103 | |
104 .. | |
105 | |
106 ------------------------------- | |
107 | |
108 Description | |
109 ----------- | |
110 | |
111 Standard DIMS processing workflow: Process Scans -> [Replicate Filter] -> **Align Samples** -> Blank Filter -> Sample Filter -> [Missing values sample filter] -> Pre-processing -> Statistics | |
112 | |
113 | | |
114 | |
115 This tool takes the peaklists for all study samples and merges them in to single aligned peak matrix. The peak matrix comprises a table, with samples along one axis and the mass-to-charge ratios of detected mass spectral peaks along the opposite axis. At the intersection of sample and mass-to-charge ratio, the intensity is given for a specific peak in a specific sample (if no intensity recorded, then ‘0’ is inserted). | |
116 | |
117 ------------------------------- | |
118 | |
119 Parameters | |
120 ---------- | |
121 | |
122 **Peaklists (HDF5 file)** (REQUIRED) - a HDF5 file containing all peaklists to undergo alignment. | |
123 | |
124 | | |
125 | |
126 **Filelist / Samplelist** (REQUIRED) - a file of type ‘tabular’ with the following required columns (additional metadata columns may also be included, e.g. “collectionTime”, etc.): | |
127 | |
128 - **filename** - the name of the .raw or .mzML files from which peaklists were extracted using the “Process Scans” tool | |
129 | |
130 - **batch** - a numeric value indicating the analysis batches samples were analysed in (if a single large analytica run then the default = 1) | |
131 | |
132 - **classLabel** - a string indicating the experiment classes the samples belong to (e.g. control, QC, blank/placebo, exposed/treatment) | |
133 | |
134 - **injectionOrder** - a numeric value indicating the order in which samples were analysed. | |
135 | |
136 | | |
137 | |
138 **ppm error tolerance** (REQUIRED; default = 2.0) - a numeric value equal-to or greater-than 0. | |
139 | |
140 This parameter will influence the alignment of peaks from input peaklists. Peaks from distinct peaklists (corresponding to individual study samples) are aligned if the difference between their mass-to-charge ratios, when divided by the average of their mass-to-charge ratios and multiplied by 1 × 10\ :sup:`6` \, is equal-to or less-than than this parameter value (i.e. the difference between the mass-to-charge ratios, measured on the ppm scale, is less than the user-defined “ppm error tolerance”). | |
141 | |
142 | | |
143 | |
144 @help_options_addtional_output@ | |
145 | |
146 | | |
147 | |
148 ------------------------------ | |
149 | |
150 Output file(s) | |
151 -------------- | |
152 | |
153 @help_outputs_matrix@ | |
154 | |
155 ------------------------------------------------------------- | |
156 | |
157 @github_developers_contributors@ | |
158 @license@ | |
159 </help> | |
160 <expand macro="citations" /> | |
161 </tool> |