|
0
|
1 <tool id="msfragger" name="MSFragger" version="1.0.0">
|
|
|
2 <description>search for peptide identifications in mass spectrometry proteomics</description>
|
|
|
3 <command>
|
|
|
4 <![CDATA[
|
|
|
5 #import re
|
|
|
6 ## Is file naming going to be a problem? May need to have a name param
|
|
|
7 #set $param_file = 'fragger.params'
|
|
|
8 cat $fragger_params > '$param_file'
|
|
|
9 ##
|
|
|
10 && echo " " >> '$param_file'
|
|
|
11 && echo "num_threads = \$GALAXY_SLOTS" >> '$param_file'
|
|
|
12 && cat $param_file > '$output_params'
|
|
|
13 #if $input.extension == 'mzml':
|
|
|
14 #set $file_ext = 'mzML'
|
|
|
15 #elif $input.extension == 'mzxml':
|
|
|
16 #set $file_ext = 'mzXML'
|
|
|
17 #elif $input.extension == 'mgf':
|
|
|
18 #set $file_ext = 'mgf'
|
|
|
19 #end if
|
|
|
20 #if $input_prefix and len($input_prefix.strip()) > 0:
|
|
|
21 #set $input_path = $input_prefix.__str__ + "_rep" + str($i + 1) + "." + $file_ext
|
|
|
22 #else:
|
|
|
23 #set $input_path = $re.sub('\.[mM]\w+$','',$re.sub('[^-a-zA-Z0-9_.]','_',$input.name)) + "." + $file_ext
|
|
|
24 #end if
|
|
|
25 && ln -s '${input}' '$input_path'
|
|
1
|
26 && java -Xmx30G -jar $__tool_directory__/MSFragger.jar fragger.params '$input_path'
|
|
0
|
27 ## && cat *.log
|
|
|
28 >> "$logfile"
|
|
|
29 #if $output_format == 'pepXML':
|
|
|
30 && cat *.pep.xml > $output_pepxml
|
|
|
31 #else
|
|
|
32 && cat *.tsv > $output_tsv
|
|
|
33 #end if
|
|
|
34 ]]>
|
|
|
35 </command>
|
|
|
36 <configfiles>
|
|
|
37 <configfile name="fragger_params"><![CDATA[#slurp
|
|
|
38 #import re
|
|
|
39 database_name = $database ## Uniprot.20151009.Hs.revDecoys.fa
|
|
|
40 ## num_threads = 0 ## 0=poll CPU to set num threads; else specify num threads directly (max 64)
|
|
|
41
|
|
|
42 ## Search Tolerances
|
|
|
43
|
|
|
44 precursor_mass_tolerance = #if str( $search_tolerances.mass.precursor_mass_tolerance ) then $search_tolerances.mass.precursor_mass_tolerance else 500.00#
|
|
|
45 precursor_mass_units = #if $search_tolerances.mass.units == 'Da' then 0 else 1# ## 0=Daltons, 1=ppm
|
|
|
46 precursor_true_tolerance = #if str( $search_tolerances.mass.precursor_true_tolerance ) then $search_tolerances.mass.precursor_true_tolerance else 20.00#
|
|
|
47 precursor_true_units = #if $search_tolerances.mass.units == 'Da' then 0 else 1# ## 0=Daltons, 1=ppm
|
|
|
48 fragment_mass_tolerance = #if str( $search_tolerances.mass.fragment_mass_tolerance ) then $search_tolerances.mass.fragment_mass_tolerance else 20.00#
|
|
|
49 fragment_mass_units = #if $search_tolerances.mass.units == 'Da' then 0 else 1# ## 0=Daltons, 1=ppm
|
|
|
50 isotope_error = $search_tolerances.isotope_error ## 0=off, 0/1/2 (standard C13 error)
|
|
|
51
|
|
|
52 ## digest parameters
|
|
|
53
|
|
|
54 search_enzyme_name = #if $digestion.search_enzyme_name then $digestion.search_enzyme_name else 'Trypsin'# ## Trypsin
|
|
|
55 search_enzyme_cutafter = #if $digestion.search_enzyme_cutafter then $digestion.search_enzyme_cutafter else 'KR'# ##KR
|
|
|
56 search_enzyme_butnotafter = #if $digestion.search_enzyme_butnotafter then $digestion.search_enzyme_butnotafter else 'P'# ##P
|
|
|
57
|
|
|
58 num_enzyme_termini = $digestion.num_enzyme_termini ## 2 for enzymatic, 1 for semi-enzymatic, 0 for nonspecific digestion
|
|
|
59 allowed_missed_cleavage = #if $digestion.allowed_missed_cleavage then $digestion.allowed_missed_cleavage else 1# ## maximum value is 5
|
|
|
60
|
|
|
61 digest_min_length = #if $digestion.digest_min_length then $digestion.digest_min_length else 7#
|
|
|
62 digest_max_length = #if $digestion.digest_max_length then $digestion.digest_max_length else 50#
|
|
|
63 digest_mass_range = #if str( $digestion.digest_mass_range_min ) then $digestion.digest_mass_range_min else 500.0# #if $digestion.digest_mass_range_max is not None then $digestion.digest_mass_range_max else 5000.0# ## MH+ peptide mass range to analyze
|
|
|
64
|
|
|
65
|
|
|
66 ## Variable Modification Parameters
|
|
|
67
|
|
|
68 clip_nTerm_M = $variable_modification.clip_nTerm_M
|
|
|
69
|
|
|
70 ##maximum of 7 mods - amino acid codes, * for any amino acid, [ and ] specifies protein termini, n and c specifies peptide termini
|
|
|
71 ##variable_mod_01 = 15.9949 M
|
|
|
72 ##variable_mod_02 = 42.0106 [*
|
|
|
73 ##variable_mod_03 = 79.96633 STY
|
|
|
74 ##variable_mod_03 = -17.0265 nQnC
|
|
|
75 ##variable_mod_04 = -18.0106 nE
|
|
|
76
|
|
|
77 allow_multiple_variable_mods_on_residue = $variable_modification.allow_multiple_variable_mods_on_residue ## static mods are not considered
|
|
|
78 max_variable_mods_per_mod = #if str( $variable_modification.max_variable_mods_per_mod ) then $variable_modification.max_variable_mods_per_mod else 3# ## maximum of 5
|
|
|
79 max_variable_mods_combinations = #if str( $variable_modification.max_variable_mods_combinations ) then $variable_modification.max_variable_mods_combinations else 1000# ## maximum of 65534, limits number of modified peptides generated from sequence
|
|
|
80
|
|
|
81 #set $vmods = $re.findall('([+-]?\d+[.]\d+\s\S+)',str($variable_modification.variable_mods))
|
|
|
82 #for i,vmod in enumerate($vmods):
|
|
|
83 variable_mod_0${int(i)+1} = $vmod
|
|
|
84 #end for
|
|
|
85
|
|
|
86 ##open search parameters
|
|
|
87 track_zero_topN = #if str( $open_search.track_zero_topN ) then $open_search.track_zero_topN else 0# ## in addition to topN results, keep track of top results in zero bin
|
|
|
88 zero_bin_accept_expect = #if str( $open_search.zero_bin_accept_expect ) then $open_search.zero_bin_accept_expect else 0# ## boost top zero bin entry to top if it has expect under 0.01 - set to 0 to disable
|
|
|
89 zero_bin_mult_expect = #if str( $open_search.zero_bin_mult_expect ) then $open_search.zero_bin_mult_expect else 1# ## disabled if above passes - multiply expect of zero bin for ordering purposes (does not affect reported expect)
|
|
|
90 add_topN_complementary = #if str( $open_search.add_topN_complementary ) then $open_search.add_topN_complementary else 0#
|
|
|
91
|
|
|
92 ## spectral processing
|
|
|
93
|
|
|
94 minimum_peaks = #if str( $spectrum_processing.minimum_peaks ) then $spectrum_processing.minimum_peaks else 15# ## required minimum number of peaks in spectrum to search (default 10)
|
|
|
95 use_topN_peaks = #if str( $spectrum_processing.use_topN_peaks ) then $spectrum_processing.use_topN_peaks else 100#
|
|
|
96
|
|
|
97
|
|
|
98 minimum_ratio = #if str($spectrum_processing.minimum_ratio) then $spectrum_processing.minimum_ratio else 0.01# ## filter peaks below this fraction of strongest peak
|
|
|
99
|
|
|
100 override_charge = $spectrum_processing.precursor.override_charge
|
|
|
101 #if $spectrum_processing.precursor.override_charge == 1
|
|
|
102 precursor_charge = $spectrum_processing.precursor.precursor_charge_min $spectrum_processing.precursor.precursor_charge_max ## precursor charge range to analyze; does not override any existing charge; 0 as 1st entry ignores parameter
|
|
|
103 #end if
|
|
|
104 max_fragment_charge = #if str( $spectrum_processing.max_fragment_charge ) then $spectrum_processing.max_fragment_charge else 2# ## set maximum fragment charge state to analyze (allowed max 5)
|
|
|
105 #if str( $spectrum_processing.clear.clear_mz_range_min ) or str( $spectrum_processing.clear.clear_mz_range_max )
|
|
|
106 clear_mz_range = #if str( $spectrum_processing.clear.clear_mz_range_min ) then $spectrum_processing.clear.clear_mz_range_min else 0.0# #if str( $spectrum_processing.clear.clear_mz_range_max ) then $spectrum_processing.clear.clear_mz_range_max else 0.0#
|
|
|
107 #else
|
|
|
108 clear_mz_range = 0.0 0.0 ## for iTRAQ/TMT type data; will clear out all peaks in the specified m/z range
|
|
|
109 #end if
|
|
|
110
|
|
|
111
|
|
|
112 min_fragments_modelling = #if str( $modeling_output.min_fragments_modelling ) then $modeling_output.min_fragments_modelling else 3#
|
|
|
113 min_matched_fragments = #if str( $modeling_output.min_matched_fragments ) then $modeling_output.min_matched_fragments else 6#
|
|
|
114 output_report_topN = #if $modeling_output.output_report_topN is not None then $modeling_output.output_report_topN else 1#
|
|
|
115 output_max_expect = #if str( $modeling_output.output_max_expect ) then $modeling_output.output_max_expect else 50.0#
|
|
|
116
|
|
|
117 output_file_extension = #if $output_format == 'pepXML' then 'pep.xml' else 'tsv'# ##pepXML
|
|
|
118 output_format = $output_format ##pepXML or tsv
|
|
|
119
|
|
|
120 ## additional modifications
|
|
|
121 static_modification
|
|
|
122
|
|
|
123 add_Cterm_peptide = #if str( $static_modification.add_Cterm_peptide ) then $static_modification.add_Cterm_peptide else 0.0#
|
|
|
124 add_Nterm_peptide = #if str( $static_modification.add_Nterm_peptide ) then $static_modification.add_Nterm_peptide else 0.0#
|
|
|
125 add_Cterm_protein = #if str( $static_modification.add_Cterm_protein ) then $static_modification.add_Cterm_protein else 0.0#
|
|
|
126 add_Nterm_protein = #if str( $static_modification.add_Nterm_protein ) then $static_modification.add_Nterm_protein else 0.0#
|
|
|
127 add_G_glycine = #if str( $static_modification.add_G_glycine ) then $static_modification.add_G_glycine else 0.0000# ## added to G - avg. 57.0513, mono. 57.02146
|
|
|
128 add_A_alanine = #if str( $static_modification.add_A_alanine ) then $static_modification.add_A_alanine else 0.0000# ## added to A - avg. 71.0779, mono. 71.03711
|
|
|
129 add_S_serine = #if str( $static_modification.add_S_serine ) then $static_modification.add_S_serine else 0.0000# ## added to S - avg. 87.0773, mono. 87.03203
|
|
|
130 add_P_proline = #if str( $static_modification.add_P_proline ) then $static_modification.add_P_proline else 0.0000# ## added to P - avg. 97.1152, mono. 97.05276
|
|
|
131 add_V_valine = #if str( $static_modification.add_V_valine ) then $static_modification.add_V_valine else 0.0000# ## added to V - avg. 99.1311, mono. 99.06841
|
|
|
132 add_T_threonine = #if str( $static_modification.add_T_threonine ) then $static_modification.add_T_threonine else 0.0000# ## added to T - avg. 101.1038, mono. 101.04768
|
|
|
133 add_C_cysteine = #if str( $static_modification.add_C_cysteine ) then $static_modification.add_C_cysteine else 0.0000# ## added to C - avg. 103.1429, mono. 103.00918
|
|
|
134 add_L_leucine = #if str( $static_modification.add_L_leucine ) then $static_modification.add_L_leucine else 0.0000# ## added to L - avg. 113.1576, mono. 113.08406
|
|
|
135 add_I_isoleucine = #if str( $static_modification.add_I_isoleucine ) then $static_modification.add_I_isoleucine else 0.0000# ## added to I - avg. 113.1576, mono. 113.08406
|
|
|
136 add_N_asparagine = #if str( $static_modification.add_N_asparagine ) then $static_modification.add_N_asparagine else 0.0000# ## added to N - avg. 114.1026, mono. 114.04293
|
|
|
137 add_D_aspartic_acid = #if str( $static_modification.add_D_aspartic_acid ) then $static_modification.add_D_aspartic_acid else 0.0000# ## added to D - avg. 115.0874, mono. 115.02694
|
|
|
138 add_Q_glutamine = #if str( $static_modification.add_Q_glutamine ) then $static_modification.add_Q_glutamine else 0.0000# ## added to Q - avg. 128.1292, mono. 128.05858
|
|
|
139 add_K_lysine = #if str( $static_modification.add_K_lysine ) then $static_modification.add_K_lysine else 0.0000# ## added to K - avg. 128.1723, mono. 128.09496
|
|
|
140 add_E_glutamic_acid = #if str( $static_modification.add_E_glutamic_acid ) then $static_modification.add_E_glutamic_acid else 0.0000# ## added to E - avg. 129.1140, mono. 129.04259
|
|
|
141 add_M_methionine = #if str( $static_modification.add_M_methionine ) then $static_modification.add_M_methionine else 0.0000# ## added to M - avg. 131.1961, mono. 131.04048
|
|
|
142 add_H_histidine = #if str( $static_modification.add_H_histidine ) then $static_modification.add_H_histidine else 0.0000# ## added to H - avg. 137.1393, mono. 137.05891
|
|
|
143 add_F_phenylalanine = #if str( $static_modification.add_F_phenylalanine ) then $static_modification.add_F_phenylalanine else 0.0000# ## added to F - avg. 147.1739, mono. 147.06841
|
|
|
144 add_R_arginine = #if str( $static_modification.add_R_arginine ) then $static_modification.add_R_arginine else 0.0000# ## added to R - avg. 156.1857, mono. 156.10111
|
|
|
145 add_Y_tyrosine = #if str( $static_modification.add_Y_tyrosine ) then $static_modification.add_Y_tyrosine else 0.0000# ## added to Y - avg. 163.0633, mono. 163.06333
|
|
|
146 add_W_tryptophan = #if str( $static_modification.add_W_tryptophan ) then $static_modification.add_W_tryptophan else 0.0000# ## added to W - avg. 186.0793, mono. 186.07931
|
|
|
147 #*
|
|
|
148 add_B_user_amino_acid = #if str( $static_modification.add_B_user_amino_acid ) then $static_modification.add_B_user_amino_acid else 0.0000# ## added to B - avg. 0.0000, mono. 0.00000
|
|
|
149 add_J_user_amino_acid = #if str( $static_modification.add_J_user_amino_acid ) then $static_modification.add_J_user_amino_acid else 0.0000# ## added to J - avg. 0.0000, mono. 0.00000
|
|
|
150 add_O_user_amino_acid = #if str( $static_modification.add_O_user_amino_acid ) then $static_modification.add_O_user_amino_acid else 0.0000# ## added to O - avg. 0.0000, mono 0.00000
|
|
|
151 add_U_user_amino_acid = #if str( $static_modification.add_U_user_amino_acid ) then $static_modification.add_U_user_amino_acid else 0.0000# ## added to U - avg. 0.0000, mono. 0.00000
|
|
|
152 add_X_user_amino_acid = #if str( $static_modification.add_X_user_amino_acid ) then $static_modification.add_X_user_amino_acid else 0.0000# ## added to X - avg. 0.0000, mono. 0.00000
|
|
|
153 add_Z_user_amino_acid = #if str( $static_modification.add_Z_user_amino_acid ) then $static_modification.add_Z_user_amino_acid else 0.0000# ## added to Z - avg. 0.0000, mono. 0.00000
|
|
|
154 *#
|
|
|
155 #slurp]]>
|
|
|
156 </configfile>
|
|
|
157 </configfiles>
|
|
|
158
|
|
|
159 <inputs>
|
|
|
160 <param name="input" type="data" format="mzml,mzxml" label="Proteomics Spectrum files in mzML or mzXML format"/>
|
|
|
161 <param name="input_prefix" type="text" value="" optional="true" label="File name prefix" help="Names inputs: prefix_rep#.mzXML Leave blank to use History names of inputs">
|
|
|
162 <validator type="regex" message="">[a-zA-Z][a-zA-Z0-9_-]*</validator>
|
|
|
163 </param>
|
|
|
164 <param name="database" type="data" format="fasta" label="Proteomics Search Database in FASTA format"/>
|
|
|
165 <section name="search_tolerances" expanded="false" title="Search Tolerances">
|
|
|
166 <conditional name="mass">
|
|
|
167 <param name="units" type="select" label="Set Mass tolerances" help="Sets default parameters">
|
|
|
168 <option value="Da">Daltons</option>
|
|
|
169 <option value="ppm">ppm</option>
|
|
|
170 </param>
|
|
|
171 <when value="Da">
|
|
|
172 <!-- Need to get correct defaults for Daltions -->
|
|
|
173 <param name="precursor_mass_tolerance" type="float" value="20" min="1" max="100" optional="true" label="Precursor mass tolerance"
|
|
|
174 help="Precursor mass tolerance (window is +/- this value) Default: 20"/>
|
|
|
175 <param name="precursor_true_tolerance" type="float" value="0" min="1" max="100" optional="true" label="Precursor true tolerance"
|
|
|
176 help="True precursor mass tolerance (window is +/- this value). Used for tie breaker of results (in spectrally ambiguous cases) and zero bin boosting in open searches (0 disables these features). This option is STRONGLY recommended for open searches. Default: 0"/>
|
|
|
177 <param name="fragment_mass_tolerance" type="float" value="20" min="1" max="100" optional="true" label="Fragment mass tolerance"
|
|
|
178 help="Fragment mass tolerance (window is +/- this value) Default: 20"/>
|
|
|
179 </when>
|
|
|
180 <when value="ppm">
|
|
|
181 <!-- Should these be integer for ppm? -->
|
|
|
182 <param name="precursor_mass_tolerance" type="float" value="20" min="1" max="100" optional="true" label="Precursor mass tolerance"
|
|
|
183 help="Precursor mass tolerance (window is +/- this value) Default: 20"/>
|
|
|
184 <param name="precursor_true_tolerance" type="float" value="0.0" min="0.0" max="100" optional="true" label="Precursor true tolerance"
|
|
|
185 help="True precursor mass tolerance (window is +/- this value). Used for tie breaker of results (in spectrally ambiguous cases) and zero bin boosting in open searches (0 disables these features). This option is STRONGLY recommended for open searches. Default: 0"/>
|
|
|
186 <param name="fragment_mass_tolerance" type="float" value="20" min="1" max="100" optional="true" label="Fragment mass tolerance"
|
|
|
187 help="Fragment mass tolerance (window is +/- this value) Default: 20"/>
|
|
|
188 </when>
|
|
|
189 </conditional>
|
|
|
190 <param name="isotope_error" type="select" label="isotope_error">
|
|
|
191 <help>
|
|
|
192 Isotope correction for MS/MS events triggered on isotopic peaks. Should be set to 0 (disabled) for open search or 0/1/2 for correction of narrow window searches. Shifts the precursor mass window to multiples of this value multiplied by the mass of C13-C12.
|
|
|
193 </help>
|
|
|
194 <option value="0">0 - Disabled (for open search)</option>
|
|
|
195 <option value="0/1/2">0/1/2 - (Correction for narrow window searches)</option>
|
|
|
196 </param>
|
|
|
197 </section>
|
|
|
198
|
|
|
199 <section name="digestion" expanded="false" title="In-silico Digestion Parameters">
|
|
|
200 <param name="search_enzyme_name" type="text" value="Trypsin" optional="true"
|
|
|
201 label="Digestion Enzyme" help="Name of enzyme to be written to the pepXML file."/>
|
|
|
202 <param name="search_enzyme_cutafter" type="text" value="" optional="true"
|
|
|
203 label="Residues after which the enzyme cuts" help="search_enzyme_cutafter Residues after which the enzyme cuts Default: KR"/>
|
|
|
204 <param name="search_enzyme_butnotafter" type="text" value="" optional="true"
|
|
|
205 label="Residues that the enzyme will not cut before" help="search_enzyme_butnotafter - (misnomer: should really be called butnotbefore) Default: P"/>
|
|
|
206 <param name="num_enzyme_termini" type="select" label="Number of enzyme termini">
|
|
|
207 <option value="0">0 - non-enzymatic</option>
|
|
|
208 <option value="1">1 - semi-enzymatic</option>
|
|
|
209 <option value="2">2 - fully-enzymatic</option>
|
|
|
210 </param>
|
|
|
211
|
|
|
212 <param name="allowed_missed_cleavage" type="integer" value="2" min="0" max="5" optional="true"
|
|
|
213 label="Allowed number of missed cleavages"/>
|
|
|
214 <param name="digest_min_length" type="integer" value="7" min="1" max="30" optional="true"
|
|
|
215 label="Minimum length of peptides to be generated during in-silico digestion"/>
|
|
|
216 <param name="digest_max_length" type="integer" value="64" min="10" max="100" optional="true"
|
|
|
217 label="Maximum length of peptides to be generated during in-silico digestion"/>
|
|
|
218 <param name="digest_mass_range_min" type="float" value="500.0" min="0.0" optional="true"
|
|
|
219 label="Minimum Mass of peptides to be generated during in-silico digestion in Daltons" />
|
|
|
220 <param name="digest_mass_range_max" type="float" value="5000.0" min="0.0" optional="true"
|
|
|
221 label="Maximum Mass of peptides to be generated during in-silico digestion in Daltons" />
|
|
|
222
|
|
|
223 </section>
|
|
|
224
|
|
|
225 <section name="variable_modification" expanded="false" title="Variable Modifications">
|
|
|
226 <param name="variable_mods" type="text" area="True" size="120x7" value="" optional="true"
|
|
|
227 label="">
|
|
|
228 <help><![CDATA[
|
|
|
229 Sets variable modifications. (variable_mod_01 to variable_mod_07). Space separated values with 1st value being the modification mass and the second being the residues (specified consecutively as a string) it modifies.
|
|
|
230 * is used to represent any amino acid [ is a modifier for protein N-terminal
|
|
|
231 ] is a modifier for protein C-terminal
|
|
|
232 n is a modifier for peptide N-terminal c is a modifier for peptide C-terminal
|
|
|
233 Syntax Examples:
|
|
|
234 15.9949 M (for oxidation on methionine)
|
|
|
235 79.66331 STY (for phosphorylation)
|
|
|
236 -17.0265 nQnC (for pyro-Glu or loss of ammonia at peptide N-terminal)
|
|
|
237 Example (M oxidation and N-terminal acetylation):
|
|
|
238 variable_mod_01 = 15.9949 M variable_mod_02 = 42.0106 [*
|
|
|
239 ]]></help>
|
|
|
240 <!-- regex working in python, but not webform -->
|
|
|
241 <validator type="regex">^(?ms)(([+-]?\d+[.]\d+\s\S+)(\s+[+-]?\d+[.]\d+\s\S+)*)?$</validator>
|
|
|
242 <sanitizer sanitize="False"/>
|
|
|
243 </param>
|
|
|
244 <param name="clip_nTerm_M" type="boolean" truevalue="1" falsevalue="0" checked="false"
|
|
|
245 label="Trim protein N-terminal methionine as a variable modification"/>
|
|
|
246 <param name="allow_multiple_variable_mods_on_residue" type="boolean" truevalue="1" falsevalue="0" checked="true"
|
|
|
247 label="Allow each amino acid to be modified by multiple variable modifications"/>
|
|
|
248 <param name="max_variable_mods_per_mod" type="integer" value="2" min="0" max="5" optional="true"
|
|
|
249 label="Maximum number of residues that can be occupied by each variable modification"/>
|
|
|
250 <param name="max_variable_mods_combinations" type="integer" value="5000" min="0" max="65534" optional="true"
|
|
|
251 label="Maximum allowed number of modified variably modified peptides from each peptide sequence"
|
|
|
252 help="If a greater number than the maximum is generated, only the unmodified peptide is considered."/>
|
|
|
253 </section>
|
|
|
254 <section name="static_modification" expanded="false" title="Static Modifications">
|
|
|
255 <param name="add_Cterm_peptide" type="float" value="" optional="true"
|
|
|
256 label="Statically add mass in Da to C-terminal of peptide Default: 0.0" />
|
|
|
257 <param name="add_Nterm_peptide" type="float" value="" optional="true"
|
|
|
258 label="Statically add mass in Da to N-terminal of peptide Default: 0.0" />
|
|
|
259 <param name="add_Cterm_protein" type="float" value="" optional="true"
|
|
|
260 label="Statically add mass in Da to C-terminal of protein Default: 0.0" />
|
|
|
261 <param name="add_Nterm_protein" type="float" value="" optional="true"
|
|
|
262 label="Statically add mass in Da to N-terminal of protein Default: 0.0" />
|
|
|
263 <param name="add_A_alanine" type="float" value="" optional="true"
|
|
|
264 label="Statically add mass in Da to A (alanine) Default: 0.0" />
|
|
|
265 <param name="add_R_arginine" type="float" value="" optional="true"
|
|
|
266 label="Statically add mass in Da to R (arginine) Default: 0.0" />
|
|
|
267 <param name="add_N_asparagine" type="float" value="" optional="true"
|
|
|
268 label="Statically add mass in Da to N (asparagine) Default: 0.0" />
|
|
|
269 <param name="add_D_aspartic_acid" type="float" value="" optional="true"
|
|
|
270 label="Statically add mass in Da to D (aspartic_acid) Default: 0.0" />
|
|
|
271 <param name="add_C_cysteine" type="float" value="" optional="true"
|
|
|
272 label="Statically add mass in Da to C (cysteine) Default: 0.0" />
|
|
|
273 <param name="add_E_glutamic_acid" type="float" value="" optional="true"
|
|
|
274 label="Statically add mass in Da to E (glutamic_acid) Default: 0.0" />
|
|
|
275 <param name="add_Q_glutamine" type="float" value="" optional="true"
|
|
|
276 label="Statically add mass in Da to Q (glutamine) Default: 0.0" />
|
|
|
277 <param name="add_G_glycine" type="float" value="" optional="true"
|
|
|
278 label="Statically add mass in Da to G (glycine) Default: 0.0" />
|
|
|
279 <param name="add_H_histidine" type="float" value="" optional="true"
|
|
|
280 label="Statically add mass in Da to H (histidine) Default: 0.0" />
|
|
|
281 <param name="add_I_isoleucine" type="float" value="" optional="true"
|
|
|
282 label="Statically add mass in Da to I (isoleucine) Default: 0.0" />
|
|
|
283 <param name="add_L_leucine" type="float" value="" optional="true"
|
|
|
284 label="Statically add mass in Da to L (leucine) Default: 0.0" />
|
|
|
285 <param name="add_K_lysine" type="float" value="" optional="true"
|
|
|
286 label="Statically add mass in Da to K (lysine) Default: 0.0" />
|
|
|
287 <param name="add_M_methionine" type="float" value="" optional="true"
|
|
|
288 label="Statically add mass in Da to M (methionine) Default: 0.0" />
|
|
|
289 <param name="add_F_phenylalanine" type="float" value="" optional="true"
|
|
|
290 label="Statically add mass in Da to F (phenylalanine) Default: 0.0" />
|
|
|
291 <param name="add_P_proline" type="float" value="" optional="true"
|
|
|
292 label="Statically add mass in Da to P (proline) Default: 0.0" />
|
|
|
293 <param name="add_S_serine" type="float" value="" optional="true"
|
|
|
294 label="Statically add mass in Da to S (serine) Default: 0.0" />
|
|
|
295 <param name="add_T_threonine" type="float" value="" optional="true"
|
|
|
296 label="Statically add mass in Da to T (threonine) Default: 0.0" />
|
|
|
297 <param name="add_W_tryptophan" type="float" value="" optional="true"
|
|
|
298 label="Statically add mass in Da to W (tryptophan) Default: 0.0" />
|
|
|
299 <param name="add_Y_tyrosine" type="float" value="" optional="true"
|
|
|
300 label="Statically add mass in Da to Y (tyrosine) Default: 0.0" />
|
|
|
301 <param name="add_V_valine" type="float" value="" optional="true"
|
|
|
302 label="Statically add mass in Da to V (valine) Default: 0.0" />
|
|
|
303 </section>
|
|
|
304 <section name="spectrum_processing" expanded="false" title="Spectrum Processing">
|
|
|
305 <param name="minimum_peaks" type="integer" value="10" min="0" optional="true"
|
|
|
306 label="Minimum number of peaks in experimental spectrum for matching" />
|
|
|
307 <param name="use_topN_peaks" type="integer" value="50" min="0" optional="true"
|
|
|
308 label="Pre-process experimental spectrum to only use top N peaks" />
|
|
|
309 <param name="minimum_ratio" type="float" value="" min="0.0" optional="true"
|
|
|
310 label="Filter peaks by minimum_ratio of base peak"
|
|
|
311 help="Filters out all peaks in experimental spectrum less intense than this multiple of the base peak intensit Default: 0.0" />
|
|
|
312
|
|
|
313 <param name="max_fragment_charge" type="integer" value="2" min="1" max="4" optional="true"
|
|
|
314 label="Maximum charge state for theoretical fragments to match (1-4)" />
|
|
|
315
|
|
|
316 <conditional name="precursor">
|
|
|
317 <param name="override_charge" type="select" label="Precursor Charge">
|
|
|
318 <option value="0">Use precursor charge</option>
|
|
|
319 <option value="1">Ignore precursor charge and set range</option>
|
|
|
320 </param>
|
|
|
321 <when value="0"/>
|
|
|
322 <when value="1">
|
|
|
323 <param name="precursor_charge_min" type="integer" value="1" min="0" max="6"
|
|
|
324 label="Minimum Potential Precursor Charge" />
|
|
|
325 <param name="precursor_charge_max" type="integer" value="4" min="0" max="8"
|
|
|
326 label="Maximum Potential Precursor Charge" />
|
|
|
327 </when>
|
|
|
328 </conditional>
|
|
|
329 <section name="clear" expanded="false" title="Clear mz range for iTRAQ/TMT experiments">
|
|
|
330 <param name="clear_mz_range_min" type="float" value="0.0" min="0.0" optional="true" label="Minimum of m/z range to remove" />
|
|
|
331 <param name="clear_mz_range_max" type="float" value="0.0" min="0.0" optional="true" label="Maximum of m/z range to remove" />
|
|
|
332 </section>
|
|
|
333 </section>
|
|
|
334 <section name="open_search" expanded="false" title="Open Search">
|
|
|
335 <param name="track_zero_topN" type="integer" value="" min="0" optional="true"
|
|
|
336 label="Track top N unmodified peptide results" >
|
|
|
337 <help>
|
|
|
338 Track top N unmodified peptide results separately from main results internally for boosting features.
|
|
|
339 Should be set to a number greater than output_report_topN if zero bin boosting is desired.
|
|
|
340 Default: 0
|
|
|
341 </help>
|
|
|
342 </param>
|
|
|
343 <param name="zero_bin_accept_expect" type="float" value="" min="0.0" optional="true"
|
|
|
344 label="Ranks a zero-bin hit above all non-zero-bin hit if it has expectation less than this value."
|
|
|
345 help="Default: 0.0" />
|
|
|
346 <param name="zero_bin_mult_expect" type="float" value="" min="0.0" optional="true"
|
|
|
347 label="Multiplies expect value of PSMs in the zero-bin during results ordering"
|
|
|
348 help="(set to less than 1 for boosting) Default: 1.0" />
|
|
|
349 <param name="add_topN_complementary" type="integer" value="" min="0" optional="true"
|
|
|
350 label="Insert complementary ions corresponding to the top N most intense fragments in each experimental spectra." >
|
|
|
351 <help>
|
|
|
352 Useful for recovery of modified peptides near C-terminal in open search.
|
|
|
353 Should be set to 0 (disabled) otherwise.
|
|
|
354 Default: 0
|
|
|
355 </help>
|
|
|
356 </param>
|
|
|
357
|
|
|
358 </section>
|
|
|
359 <section name="modeling_output" expanded="false" title="Modeling and Output">
|
|
|
360 <param name="min_fragments_modelling" type="integer" value="3" min="1" optional="true"
|
|
|
361 label="Minimum number of matched peaks in PSM for inclusion in statistical modeling Default:3" />
|
|
|
362 <param name="min_matched_fragments" type="integer" value="4" min="1" optional="true"
|
|
|
363 label="Minimum number of matched peaks for PSM to be reported Default:3"
|
|
|
364 help="recommend a minimum of 4 for narrow window searching and 6 for open searches"/>
|
|
|
365 <param name="output_report_topN" type="integer" value="1" min="1" optional="true"
|
|
|
366 label="Reports top N PSMs per input spectrum Default:1" />
|
|
|
367 <param name="output_max_expect" type="float" value="50.0" min="0.0" optional="true"
|
|
|
368 label="Suppresses reporting of PSM if top hit has expectation greater than this threshold" />
|
|
|
369 </section>
|
|
|
370 <param name="output_format" type="select" label="output format">
|
|
|
371 <option value="pepXML">pepXML</option>
|
|
|
372 <option value="tsv">Tabular</option>
|
|
|
373 </param>
|
|
|
374 </inputs>
|
|
|
375
|
|
|
376 <outputs>
|
|
|
377 <data format="txt" name="output_params" label="${tool.name}.params"/>
|
|
|
378 <data format="txt" name="logfile" label="${tool.name} log"/>
|
|
|
379 <data format="tsv" name="output_tsv" label="${tool.name}.tsv ${on_string}" >
|
|
|
380 <filter>output_format == 'tsv'</filter>
|
|
|
381 </data>
|
|
|
382 <data format="pepxml" name="output_pepxml" label="${tool.name}.pep.xml ${on_string}" >
|
|
|
383 <filter>output_format == 'pepXML'</filter>
|
|
|
384 </data>
|
|
|
385 </outputs>
|
|
|
386 <tests>
|
|
|
387 <test>
|
|
|
388 </test>
|
|
|
389 </tests>
|
|
|
390 <help>
|
|
|
391 <![CDATA[
|
|
|
392 =============
|
|
|
393 **MSFragger**
|
|
|
394 =============
|
|
|
395
|
|
|
396 MSFragger is an ultrafast database search tool for peptide identifications in mass spectrometry-based proteomics. It differs from conventional search engines by computing similarity scores in a fragment-centric fashion using a theoretical fragment index of candidate peptides. The speed of MSFragger makes it particularly suitable for `open' database searches, where the precursor mass tolerance is set to hundreds of Daltons, for the identification of modified peptides. MSFragger is implemented in the cross-platform Java programming language and is compatible with standard proteomics file formats such as MGF/mzXML/mzML/pepXML.
|
|
|
397
|
|
|
398
|
|
|
399 **Common Static Modifications**
|
|
|
400
|
|
|
401 ::
|
|
|
402
|
|
|
403 - methylation of K : 14.015650
|
|
|
404 - oxidation of M : 15.994915
|
|
|
405 - carboxymethyl C : 58.005479
|
|
|
406 - carbamidomethyl C : 57.021464
|
|
|
407 - deamidation of N and Q : 0.984016
|
|
|
408 - propionamide C : 71.037114
|
|
|
409 - phosphorylation of S : 79.966331
|
|
|
410 - phosphorylation of T : 79.966331
|
|
|
411 - phosphorylation of Y : 79.966331
|
|
|
412 - M cleavage from protein n-term : -131.040485
|
|
|
413 - acetylation of protein n-term : 42.010565
|
|
|
414 - methylation of protein n-term : 14.015650
|
|
|
415 - tri-methylation of protein n-term : 42.046950
|
|
|
416 - beta methythiolation of D : 45.987721
|
|
|
417 - methylation of Q : 14.015650
|
|
|
418 - tri-methylation of K : 42.046950
|
|
|
419 - methylation of D : 14.015650
|
|
|
420 - methylation of E : 14.015650
|
|
|
421 - methylation of peptide c-term : 14.015650
|
|
|
422 - tri-deuteromethylation of D : 17.034480
|
|
|
423 - tri-deuteromethylation of E : 17.034480
|
|
|
424 - tri-deuteromethylation of peptide c-term : 17.034480
|
|
|
425 - n-formyl met addition : 159.035399
|
|
|
426 - 2-amino-3-oxo-butanoic acid T : -2.015650
|
|
|
427 - acetylation of K : 42.010565
|
|
|
428 - amidation of peptide c-term : -0.984016
|
|
|
429 - beta-methylthiolation of D (duplicate of 13) : 45.987721
|
|
|
430 - carboxyamidomethylation of K : 57.021464
|
|
|
431 - carboxyamidomethylation of H : 57.021464
|
|
|
432 - carboxyamidomethylation of D : 57.021464
|
|
|
433 - carboxyamidomethylation of E : 57.021464
|
|
|
434 - carbamylation of K : 43.005814
|
|
|
435 - carbamylation of n-term peptide : 43.005814
|
|
|
436 - citrullination of R : 0.984016
|
|
|
437 - oxidation of C to cysteic acid : 47.984744
|
|
|
438 - di-iodination of Y : 251.793296
|
|
|
439 - di-methylation of K : 28.031300
|
|
|
440 - di-methylation of R : 28.031300
|
|
|
441 - di-methylation of peptide n-term : 28.031300
|
|
|
442 - oxidation of F to dihydroxyphenylalanine : 31.989829
|
|
|
443 - gammathiopropionylation of K : 87.998285
|
|
|
444 - gammathiopropionylation of peptide n-term : 87.998285
|
|
|
445 - farnesylation of C : 204.187801
|
|
|
446 - formylation of K : 27.994915
|
|
|
447 - formylation of peptide n-term : 27.994915
|
|
|
448 - oxidation of W to formylkynurenin : 31.989829
|
|
|
449 - fluorophenylalanine : 17.990578
|
|
|
450 - beta-carboxylation of D : 43.989829
|
|
|
451 - gamma-carboxylation of E : 43.989829
|
|
|
452 - geranyl-geranyl : 272.250401
|
|
|
453 - glucuronylation of protein n-term : 176.032088
|
|
|
454 - glutathione disulfide : 305.068156
|
|
|
455 - ubiquitinylation residue : 114.042927
|
|
|
456 - guanidination of K : 42.021798
|
|
|
457 - oxidation of H to N : -23.015984
|
|
|
458 - oxidation of H to D : -22.031969
|
|
|
459 - homoserine : -29.992806
|
|
|
460 - homoserine lactone : -48.003371
|
|
|
461 - oxidation of W to hydroxykynurenin : 19.989829
|
|
|
462 - hydroxylation of D : 15.994915
|
|
|
463 - hydroxylation of K : 15.994915
|
|
|
464 - hydroxylation of N : 15.994915
|
|
|
465 - hydroxylation of P : 15.994915
|
|
|
466 - hydroxylation of F : 15.994915
|
|
|
467 - hydroxylation of Y : 15.994915
|
|
|
468 - iodination of Y : 125.896648
|
|
|
469 - oxidation of W to kynurenin : 3.994915
|
|
|
470 - lipoyl K : 188.032956
|
|
|
471 - methyl ester of peptide c-term (duplicate of 18) : 14.015650
|
|
|
472 - methyl ester of D : 14.015650
|
|
|
473 - methyl ester of E (duplicate of 17) : 14.015650
|
|
|
474 - methyl ester of S : 14.015650
|
|
|
475 - methyl ester of Y : 14.015650
|
|
|
476 - methyl C : 14.015650
|
|
|
477 - methyl H : 14.015650
|
|
|
478 - methyl N : 14.015650
|
|
|
479 - methylation of peptide n-term : 14.015650
|
|
|
480 - methyl R : 14.015650
|
|
|
481 - myristoleylation of G : 208.182715
|
|
|
482 - myristoyl-4H of G : 206.167065
|
|
|
483 - myristoylation of peptide n-term G : 210.198366
|
|
|
484 - myristoylation of K : 210.198366
|
|
|
485 - formylation of protein n-term : 27.994915
|
|
|
486 - NEM C : 125.047679
|
|
|
487 - NIPCAM : 99.068414
|
|
|
488 - oxidation of W to nitro : 44.985078
|
|
|
489 - oxidation of Y to nitro : 44.985078
|
|
|
490 - O18 on peptide n-term : 2.004246
|
|
|
491 - di-O18 on peptide n-term : 4.008490
|
|
|
492 - oxidation of H : 15.994915
|
|
|
493 - oxidation of W : 15.994915
|
|
|
494 - phosphopantetheine S : 340.085794
|
|
|
495 - palmitoylation of C : 238.229666
|
|
|
496 - palmitoylation of K : 238.229666
|
|
|
497 - palmitoylation of S : 238.229666
|
|
|
498 - palmitoylation of T : 238.229666
|
|
|
499 - phosphorylation of S with prompt loss : -18.010565
|
|
|
500 - phosphorylation of T with prompt loss : -18.010565
|
|
|
501 - phosphorylation with prompt loss on Y : -18.010565
|
|
|
502 - phosphorylation with neutral loss on C : 79.966331
|
|
|
503 - phosphorylation with neutral loss on D : 79.966331
|
|
|
504 - phosphorylation with neutral loss on H : 79.966331
|
|
|
505 - propionyl light K : 56.026215
|
|
|
506 - propionyl light on peptide n-term : 56.026215
|
|
|
507 - propionyl heavy K : 59.036279
|
|
|
508 - propionyl heavy peptide n-term : 59.036279
|
|
|
509 - pyridyl K : 119.037114
|
|
|
510 - pyridyl peptide n-term : 119.037114
|
|
|
511 - pyro-cmC : -17.026549
|
|
|
512 - pyro-glu from n-term E : -18.010565
|
|
|
513 - pyro-glu from n-term Q : -17.026549
|
|
|
514 - oxidation of P to pyroglutamic acid : 13.979265
|
|
|
515 - s-pyridylethylation of C : 105.057849
|
|
|
516 - SeMet : 47.944449
|
|
|
517 - sulfation of Y : 79.956815
|
|
|
518 - sulphone of M : 31.989829
|
|
|
519 - tri-iodination of Y : 377.689944
|
|
|
520 - tri-methylation of R : 42.046950
|
|
|
521 - n-acyl diglyceride cysteine : 788.725777
|
|
|
522 - ICAT light : 227.126991
|
|
|
523 - ICAT heavy : 236.157185
|
|
|
524 - CAMthiopropanoyl K : 145.019749
|
|
|
525 - phosphorylation with neutral loss on S : 79.966331
|
|
|
526 - phosphorylation with neutral loss on T : 79.966331
|
|
|
527 - phosphorylation of S with ETD loss : 79.966331
|
|
|
528 - phosphorylation of T with ETD loss : 79.966331
|
|
|
529 - heavy arginine-13C6 : 6.020129
|
|
|
530 - heavy arginine-13C6-15N4 : 10.008269
|
|
|
531 - heavy lysine-13C6 : 6.020129
|
|
|
532 - PNGasF in O18 water : 2.988261
|
|
|
533 - beta elimination of S : -18.010565
|
|
|
534 - beta elimination of T : -18.010565
|
|
|
535 - oxidation of C to sulfinic acid : 31.989829
|
|
|
536 - arginine to ornithine : -42.021798
|
|
|
537 - dehydro of S and T : -18.010565
|
|
|
538 - carboxykynurenin of W : 47.984744
|
|
|
539 - sumoylation of K : 484.228200
|
|
|
540 - iTRAQ114 on nterm : 144.105918
|
|
|
541 - iTRAQ114 on K : 144.105918
|
|
|
542 - iTRAQ114 on Y : 144.105918
|
|
|
543 - iTRAQ115 on nterm : 144.099599
|
|
|
544 - iTRAQ115 on K : 144.099599
|
|
|
545 - iTRAQ115 on Y : 144.099599
|
|
|
546 - iTRAQ116 on nterm : 144.102063
|
|
|
547 - iTRAQ116 on K : 144.102063
|
|
|
548 - iTRAQ116 on Y : 144.102063
|
|
|
549 - iTRAQ117 on nterm : 144.102063
|
|
|
550 - iTRAQ117 on K : 144.102063
|
|
|
551 - iTRAQ117 on Y : 144.102063
|
|
|
552 - MMTS on C : 45.987721
|
|
|
553 - heavy lysine - 2H4 : 4.025107
|
|
|
554 - heavy lysine - 13C6 15N2 : 8.014199
|
|
|
555 - Asparagine HexNAc : 203.079373
|
|
|
556 - Asparagine dHexHexNAc : 349.137281
|
|
|
557 - Serine HexNAc : 203.079373
|
|
|
558 - Threonine HexNAc : 203.079373
|
|
|
559 - palmitoleyl of S : 236.214016
|
|
|
560 - palmitoleyl of C : 236.214016
|
|
|
561 - palmitoleyl of T : 236.214016
|
|
|
562 - CHD2-di-methylation of K : 32.056407
|
|
|
563 - CHD2-di-methylation of peptide n-term : 32.056407
|
|
|
564 - Maleimide-PEO2-Biotin of C : 525.225719
|
|
|
565 - phosphorylation of H : 79.966331
|
|
|
566 - oxidation of C : 15.994915
|
|
|
567 - oxidation of Y (duplicate of 64) : 15.994915
|
|
|
568 - Uniblue A on K : 484.039891
|
|
|
569 - deamidation of N : 0.984016
|
|
|
570 - trideuteration of L (SILAC) : 3.018830
|
|
|
571 - TMT duplex on K : 225.155833
|
|
|
572 - TMT duplex on n-term peptide : 225.155833
|
|
|
573 - TMT 6-plex on K : 229.162932
|
|
|
574 - TMT 6-plex on n-term peptide : 229.162932
|
|
|
575 - iTRAQ8plex:13C(7)15N(1) on nterm : 304.205360
|
|
|
576 - iTRAQ8plex:13C(7)15N(1) on K : 304.205360
|
|
|
577 - iTRAQ8plex:13C(7)15N(1) on Y : 304.205360
|
|
|
578 - iTRAQ8plex:13C(6)15N(2) on nterm : 304.199040
|
|
|
579 - iTRAQ8plex:13C(6)15N(2) on K : 304.199040
|
|
|
580 - iTRAQ8plex:13C(6)15N(2) on Y : 304.199040
|
|
|
581 - selenocysteine : 47.944449
|
|
|
582 - carboxymethylated selenocysteine : 105.949928
|
|
|
583
|
|
|
584 ]]>
|
|
|
585 </help>
|
|
1
|
586 <citations>
|
|
|
587 <citation type="doi">doi:10.1038/nmeth.4256</citation>
|
|
|
588 </citations>
|
|
0
|
589 </tool>
|