<tool id="feature_alignment" name="Feature Alignment" version="0.1">
    <!--
        Galaxy wrapper around feature_alignment.py.
        The command section below builds the command line from the parameters declared in
        the inputs section; each parameter's help text names the command line flag it feeds.
    -->
    <description>of peakgroups below a FDR</description>
    <stdio>
        <!-- Any non-zero exit code marks the job as failed. -->
        <exit_code level="fatal" range="1:"/>
    </stdio>
    <version_command>feature_alignment.py --version</version_command>
    <command interpreter="python">
<![CDATA[
        feature_alignment.py
        ## One quoted path per selected dataset, so paths containing spaces stay intact.
        --in
        #for $input_file in $inputs
            '$input_file'
        #end for
        --file_format '$oformat'
        ## The filtered peakgroup file is only produced for OpenSWATH input; this guard
        ## must test the same parameter as the <filter> on the "out" dataset.
        #if str($oformat) == "openswath":
            --out '$out'
        #end if
        ## The matrix is written to a fixed *.tsv name in the job directory and moved
        ## to the Galaxy dataset path after the script finished.
        --out_matrix out_matrix.tsv
        --out_ids '$out_ids'
        --fdr_cutoff $fdr_cutoff
        ## Free-text field (single value or a range); omitted entirely when left blank.
        #if str($max_fdr_quality).strip():
            --max_fdr_quality "$max_fdr_quality"
        #end if
        --max_rt_diff $max_rt_diff
        --iso_max_rt_diff '$iso_max_rt_diff'
        --frac_selected $frac_selected
        --method '$method'
        --matrix_output_method '$matrix_output_method'
        --realign_method '$realign_method'

        &&
        mv out_matrix.tsv '$out_matrix'
]]>
    </command>
    <inputs>

        <param name="inputs" type="data" multiple="true"
               label="A list of mProphet output files containing all peakgroups" help="(--in)"/>
        <param name="oformat" type="select" label="Which input file format is used" help="(--file_format)">
            <option value="openswath">OpenSwath</option>
            <option value="peakview" selected="true">Peakview</option>
        </param>

        <param name="fdr_cutoff" type="float" value="0.01" label="Seeding score cutoff" help="(--fdr_cutoff)"/>
        <!-- Galaxy reads the initial value of a parameter from "value"; a "default" attribute is ignored. -->
        <param name="max_fdr_quality" type="text" value="-1.0"
               label="Extension score cutoff"
               help="During the extension phase of the algorithm, peakgroups of this quality will still be considered for alignment (in FDR) - it is possible to give a range in the format lower,higher+stepsize,stepsize - e.g. 0,0.31,0.01 (-1 will set it to fdr_cutoff) (--max_fdr_quality)"/>
        <param name="max_rt_diff" type="integer" value="30"
               label="Maximal difference in RT for two aligned features" help="(--max_rt_diff)"/>
        <param name="iso_max_rt_diff" type="text" value="10"
               label="Maximal difference in RT for two isotopic channels in the same run" help="(--iso_max_rt_diff)"/>
        <param name="frac_selected" type="float" value="0.0" min="0" max="1"
               label="Do not write peakgroup if selected in less than this fraction of runs" help="(--frac_selected)"/>
        <param name="method" type="select"
               label="Which method to use for the clustering"
               help="Note that the MST options will perform a local, MST guided alignment while the other options will use a reference-guided alignment. The global option will also move peaks which are below the selected FDR threshold. (--method)">
            <option value="best_overall" selected="true">best_overall</option>
            <option value="best_cluster_score">best_cluster_score</option>
            <option value="global_best_cluster_score">global_best_cluster_score</option>
            <option value="global_best_overall">global_best_overall</option>
            <option value="LocalMST">LocalMST</option>
            <option value="LocalMSTAllCluster">LocalMSTAllCluster</option>
        </param>

        <param name="matrix_output_method" type="select"
               label="Which columns are written besides Intensity" help="(--matrix_output_method)">
            <option value="none" selected="true">None</option>
            <option value="RT">RT</option>
            <option value="score">Score</option>
            <option value="source">Source</option>
            <option value="full">Full</option>
        </param>
        <param name="realign_method" type="select" label="How to re-align runs in retention time" help="(--realign_method)">
            <option value="diRT" selected="true">Use only deltaiRT from the input file</option>
            <option value="linear">Perform a linear regression using best peakgroups</option>
            <!--option value='splineR'>Perform a spline fit using R</option-->
            <!--option value='splineR_external'>Perform a spline fit using R</option-->
            <option value="splinePy">Use Python native spline from scikits.datasmooth (slow!)</option>
            <option value="lowess">Use Robust locally weighted regression (lowess smoother)</option>
            <option value="CVSpline">Splines with cross-validation</option>
            <option value="nonCVSpline">Splines without cross-validation</option>
            <option value="earth">Use Multivariate Adaptive Regression Splines using py-earth</option>
        </param>
    </inputs>
    <outputs>
        <!-- Matrix containing one peak group per row -->
        <data format="tabular" name="out_matrix" label="${tool.name} on ${on_string}: matrix"/>
        <!-- Id file only containing the ids -->
        <data format="tabular" name="out_ids" label="${tool.name} on ${on_string}: ids"/>
        <!-- Output file with filtered peakgroups for quantification (only works for OpenSWATH) -->
        <data format="txt" name="out" label="${tool.name} on ${on_string}: filtered peakgroups">
            <filter>oformat == 'openswath'</filter>
        </data>
    </outputs>
    <help>
<![CDATA[

**What it does**

This program will select all peakgroups below the FDR cutoff in all files and try to align them to each other.
If only one file is given, it will act as peakgroup selector (best by m_score)
and will apply the provided FDR cutoff.
]]>
    </help>
    <citations>
        <!-- TODO: add the DOI of the publication describing this tool. The previous entry was an
             empty DOI citation, which cannot be resolved, so it was removed. -->
    </citations>
</tool>