Mercurial > repos > iuc > rrmscorer
comparison RRMScorer.xml @ 0:2e9c4504af91 draft default tip
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/main/tools/rrmscorer commit 1ed15985d486840a247b2803613c584c074e4744
| author | iuc |
|---|---|
| date | Wed, 17 Sep 2025 14:53:19 +0000 |
| parents | |
| children |
comparison
equal
deleted
inserted
replaced
| -1:000000000000 | 0:2e9c4504af91 |
|---|---|
| 1 <tool id="rrmscorer" name="RRM-Scorer" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@"> | |
| 2 <description>Predicts RNA Recognition Motif (RRM) scores</description> | |
| 3 <macros> | |
| 4 <import>macros.xml</import> | |
| 5 </macros> | |
| 6 <xrefs> | |
| 7 <xref type="bio.tools">RRMScorer</xref> | |
| 8 </xrefs> | |
| 9 <expand macro="requirements"/> | |
| 10 <command detect_errors="exit_code"><![CDATA[ | |
| 11 mkdir -p json tabular aligned plots && | |
| 12 rrmscorer | |
| 13 --json 'json' | |
| 14 --csv 'tabular' | |
| 15 --window_size $tool_parameters.window_size | |
| 16 #if str($input_sequence.input_type_cond.input_type) == 'fasta' | |
| 17 --fasta '$input_sequence.input_type_cond.fasta_input' | |
| 18 #elif str($input_sequence.input_type_cond.input_type) == 'uniprot' | |
| 19 --uniprot '$input_sequence.input_type_cond.uniprot_id' | |
| 20 #end if | |
| 21 | |
| 22 #if $output_options.generate_plots | |
| 23 --plot 'plots' | |
| 24 #end if | |
| 25 | |
| 26 #if $output_options.generate_fasta | |
| 27 --aligned 'aligned' | |
| 28 #end if | |
| 29 | |
| 30 #if $tool_parameters.target and not $output_options.top_scoring_rna | |
| 31 --rna '$tool_parameters.target' | |
| 32 #else | |
| 33 --top | |
| 34 #end if | |
| 35 ]]></command> | |
| 36 <inputs> | |
| 37 <section name="input_sequence" title="Input sequence" expanded="true"> | |
| 38 <conditional name="input_type_cond"> | |
| 39 <param name="input_type" type="select" label="Select the type of sequence input" optional="false"> | |
| 40 <option value="fasta" selected="true">FASTA file containing the protein sequence(s)</option> | |
| 41 <option value="uniprot">Protein identifier from UniProt</option> | |
| 42 </param> | |
| 43 <when value="fasta"> | |
| 44 <param name="fasta_input" type="data" format="fasta" optional="false" multiple="false" label="Protein sequence(s) in FASTA format" help="Provide a FASTA file containing the protein sequences."> | |
| 45 <validator type="dataset_ok_validator"/> | |
| 46 </param> | |
| 47 </when> | |
| 48 <when value="uniprot"> | |
| 49 <param name="uniprot_id" type="text" value="" optional="false" label="Protein identifier from UniProt" help="Provide a UniProt ID (e.g. P19339)."> | |
| 50 <validator type="empty_field" message="Missing UniProt ID"/> | |
| 51 </param> | |
| 52 </when> | |
| 53 </conditional> | |
| 54 </section> | |
| 55 <section name="tool_parameters" title="Tool parameters" help="Configure this section to select the predictions to be executed"> | |
| 56 <param name="target" type="text" optional="true" label="Target RNA sequence (min. 5 nucleotides)" help="Provide a valid target RNA sequence. Leave blank if not specifying a target RNA so that the predictor will use the top-scoring RNA by default."> | |
| 57 <validator type="regex" message="The sequence must consist only of RNA nucleotides (A, U, G, C) or be left blank.">^([AUGCaugc]+)?$</validator> | |
| 58 </param> | |
| 59 <param name="window_size" type="select" label="The window size to test"> | |
| 60 <option value="5" selected="true">5</option> | |
| 61 <option value="3">3</option> | |
| 62 </param> | |
| 63 </section> | |
| 64 <section name="output_options" title="Output parameters" help="Configure this section to define the tool output files"> | |
| 65 <param name="generate_plots" type="boolean" label="Generate score plots for all the RNA possible windows" help="Enable to generate score plots."/> | |
| 66 <param name="top_scoring_rna" type="boolean" label="Find the top-scoring RNA for the specified RRM(s)" help="Enable to find and plot the top-scoring RNA. Attention: This option overrides the target RNA if present."/> | |
| 67 <param name="generate_fasta" type="boolean" label="Generate a FASTA file for each input sequence aligned to the HMM" help="Enable to generate a FASTA file with aligned sequences."/> | |
| 68 </section> | |
| 69 </inputs> | |
| 70 <outputs> | |
| 71 <collection name="split_csv" type="list" label="Tabular predictions by sequence"> | |
| 72 <discover_datasets pattern="__designation_and_ext__" directory="tabular" visible="true"/> | |
| 73 </collection> | |
| 74 <collection name="split_json" type="list" label="Json predictions by sequence"> | |
| 75 <discover_datasets pattern="__designation_and_ext__" directory="json" visible="true"/> | |
| 76 </collection> | |
| 77 <collection name="split_aligned" type="list" label="Alignment in FASTA format by sequence"> | |
| 78 <discover_datasets pattern="__designation_and_ext__" directory="aligned" visible="true"/> | |
| 79 </collection> | |
| 80 <collection name="split_plots" type="list" label="Plots by sequence"> | |
| 81 <discover_datasets pattern="__designation_and_ext__" directory="plots" visible="true"/> | |
| 82 </collection> | |
| 83 </outputs> | |
| 84 <tests> | |
| 85 <!-- Test 1: UniProt ID P19339, Window Size 5, RNA AUGGCU --> | |
| 86 <test expect_num_outputs="4"> | |
| 87 <section name="input_sequence"> | |
| 88 <conditional name="input_type_cond"> | |
| 89 <param name="input_type" value="uniprot"/> | |
| 90 <param name="uniprot_id" value="P19339"/> | |
| 91 </conditional> | |
| 92 </section> | |
| 93 <section name="tool_parameters"> | |
| 94 <param name="target" value="AUGGCU"/> | |
| 95 <param name="window_size" value="5"/> | |
| 96 </section> | |
| 97 <assert_command> | |
| 98 <has_text text="--uniprot 'P19339'"/> | |
| 99 <has_text text="--rna 'AUGGCU'"/> | |
| 100 <has_text text="--window_size 5"/> | |
| 101 <has_text text="--json 'json'"/> | |
| 102 <has_text text="--csv 'tabular'"/> | |
| 103 </assert_command> | |
| 104 <output_collection name="split_json" count="2"/> | |
| 105 <output_collection name="split_csv" count="2"/> | |
| 106 <output_collection name="split_aligned" count="0"/> | |
| 107 <output_collection name="split_plots" count="0"/> | |
| 108 </test> | |
| 109 <!-- Test 2: UniProt ID P19339, Window Size 3, RNA AUGGCU --> | |
| 110 <test expect_num_outputs="4"> | |
| 111 <section name="input_sequence"> | |
| 112 <conditional name="input_type_cond"> | |
| 113 <param name="input_type" value="uniprot"/> | |
| 114 <param name="uniprot_id" value="P19339"/> | |
| 115 </conditional> | |
| 116 </section> | |
| 117 <section name="tool_parameters"> | |
| 118 <param name="target" value="AUGGCU"/> | |
| 119 <param name="window_size" value="3"/> | |
| 120 </section> | |
| 121 <assert_command> | |
| 122 <has_text text="--uniprot 'P19339'"/> | |
| 123 <has_text text="--rna 'AUGGCU'"/> | |
| 124 <has_text text="--window_size 3"/> | |
| 125 <has_text text="--json 'json'"/> | |
| 126 <has_text text="--csv 'tabular'"/> | |
| 127 </assert_command> | |
| 128 <output_collection name="split_json" count="2"/> | |
| 129 <output_collection name="split_csv" count="2"/> | |
| 130 <output_collection name="split_aligned" count="0"/> | |
| 131 <output_collection name="split_plots" count="0"/> | |
| 132 </test> | |
| 133 <!-- Test 3: UniProt ID P19339, Window Size 5, RNA AUGGCU, Aligned FASTA files --> | |
| 134 <test expect_num_outputs="4"> | |
| 135 <section name="input_sequence"> | |
| 136 <conditional name="input_type_cond"> | |
| 137 <param name="input_type" value="uniprot"/> | |
| 138 <param name="uniprot_id" value="P19339"/> | |
| 139 </conditional> | |
| 140 </section> | |
| 141 <section name="tool_parameters"> | |
| 142 <param name="target" value="AUGGCU"/> | |
| 143 <param name="window_size" value="5"/> | |
| 144 </section> | |
| 145 <section name="output_options"> | |
| 146 <param name="generate_fasta" value="true"/> | |
| 147 </section> | |
| 148 <assert_command> | |
| 149 <has_text text="--uniprot 'P19339'"/> | |
| 150 <has_text text="--rna 'AUGGCU'"/> | |
| 151 <has_text text="--window_size 5"/> | |
| 152 <has_text text="--json 'json'"/> | |
| 153 <has_text text="--csv 'tabular'"/> | |
| 154 <has_text text="--aligned 'aligned'"/> | |
| 155 </assert_command> | |
| 156 <output_collection name="split_json" count="2"/> | |
| 157 <output_collection name="split_csv" count="2"/> | |
| 158 <output_collection name="split_aligned" count="2"/> | |
| 159 <output_collection name="split_plots" count="0"/> | |
| 160 </test> | |
| 161 <!-- Test 4: UniProt ID P19339, Window Size 5, Top RNA, with Plots --> | |
| 162 <test expect_num_outputs="4"> | |
| 163 <section name="input_sequence"> | |
| 164 <conditional name="input_type_cond"> | |
| 165 <param name="input_type" value="uniprot"/> | |
| 166 <param name="uniprot_id" value="P19339"/> | |
| 167 </conditional> | |
| 168 </section> | |
| 169 <section name="tool_parameters"> | |
| 170 <param name="window_size" value="5"/> | |
| 171 </section> | |
| 172 <section name="output_options"> | |
| 173 <param name="top_scoring_rna" value="true"/> | |
| 174 <param name="generate_plots" value="true"/> | |
| 175 </section> | |
| 176 <assert_command> | |
| 177 <has_text text="--uniprot 'P19339'"/> | |
| 178 <has_text text="--window_size 5"/> | |
| 179 <has_text text="--json 'json'"/> | |
| 180 <has_text text="--csv 'tabular'"/> | |
| 181 <has_text text="--top"/> | |
| 182 </assert_command> | |
| 183 <output_collection name="split_json" count="2"/> | |
| 184 <output_collection name="split_csv" count="0"/> | |
| 185 <output_collection name="split_aligned" count="0"/> | |
| 186 <output_collection name="split_plots" count="8"/> | |
| 187 </test> | |
| 188 <!-- Test 5: UniProt ID P19339, Window Size 5, Top RNA, with Plots, Aligned FASTA files --> | |
| 189 <test expect_num_outputs="4"> | |
| 190 <section name="input_sequence"> | |
| 191 <conditional name="input_type_cond"> | |
| 192 <param name="input_type" value="uniprot"/> | |
| 193 <param name="uniprot_id" value="P19339"/> | |
| 194 </conditional> | |
| 195 </section> | |
| 196 <section name="tool_parameters"> | |
| 197 <param name="window_size" value="5"/> | |
| 198 </section> | |
| 199 <section name="output_options"> | |
| 200 <param name="top_scoring_rna" value="true"/> | |
| 201 <param name="generate_plots" value="true"/> | |
| 202 <param name="generate_fasta" value="true"/> | |
| 203 </section> | |
| 204 <assert_command> | |
| 205 <has_text text="--uniprot 'P19339'"/> | |
| 206 <has_text text="--window_size 5"/> | |
| 207 <has_text text="--json 'json'"/> | |
| 208 <has_text text="--csv 'tabular'"/> | |
| 209 <has_text text="--plot 'plots'"/> | |
| 210 <has_text text="--aligned 'aligned'"/> | |
| 211 <has_text text="--top"/> | |
| 212 </assert_command> | |
| 213 <output_collection name="split_json" type="list" count="2"/> | |
| 214 <output_collection name="split_aligned" type="list" count="2"/> | |
| 215 <output_collection name="split_plots" type="list" count="8"/> | |
| 216 </test> | |
| 217 <!-- Test 6: UniProt ID P19339, Window Size 5, RNA AUGGCU, with Plots --> | |
| 218 <test expect_num_outputs="4"> | |
| 219 <section name="input_sequence"> | |
| 220 <conditional name="input_type_cond"> | |
| 221 <param name="input_type" value="uniprot"/> | |
| 222 <param name="uniprot_id" value="P19339"/> | |
| 223 </conditional> | |
| 224 </section> | |
| 225 <section name="tool_parameters"> | |
| 226 <param name="target" value="AUGGCU"/> | |
| 227 <param name="window_size" value="5"/> | |
| 228 </section> | |
| 229 <section name="output_options"> | |
| 230 <param name="generate_plots" value="true"/> | |
| 231 </section> | |
| 232 <assert_command> | |
| 233 <has_text text="--uniprot 'P19339'"/> | |
| 234 <has_text text="--rna 'AUGGCU'"/> | |
| 235 <has_text text="--window_size 5"/> | |
| 236 <has_text text="--json 'json'"/> | |
| 237 <has_text text="--csv 'tabular'"/> | |
| 238 </assert_command> | |
| 239 <output_collection name="split_json" count="2"/> | |
| 240 <output_collection name="split_csv" count="2"/> | |
| 241 <output_collection name="split_aligned" count="0"/> | |
| 242 <output_collection name="split_plots" count="2"/> | |
| 243 </test> | |
| 244 <!-- Test 7: UniProt ID P19339, Window Size 5, RNA AUGGCU, with Plots, Aligned FASTA files --> | |
| 245 <test expect_num_outputs="4"> | |
| 246 <section name="input_sequence"> | |
| 247 <conditional name="input_type_cond"> | |
| 248 <param name="input_type" value="uniprot"/> | |
| 249 <param name="uniprot_id" value="P19339"/> | |
| 250 </conditional> | |
| 251 </section> | |
| 252 <section name="tool_parameters"> | |
| 253 <param name="target" value="AUGGCU"/> | |
| 254 <param name="window_size" value="5"/> | |
| 255 </section> | |
| 256 <section name="output_options"> | |
| 257 <param name="top_scoring_rna" value="false"/> | |
| 258 <param name="generate_fasta" value="true"/> | |
| 259 <param name="generate_plots" value="true"/> | |
| 260 </section> | |
| 261 <assert_command> | |
| 262 <has_text text="--uniprot 'P19339'"/> | |
| 263 <has_text text="--window_size 5"/> | |
| 264 <has_text text="--json 'json'"/> | |
| 265 <has_text text="--csv 'tabular'"/> | |
| 266 <has_text text="--plot 'plots'"/> | |
| 267 <not_has_text text="--top"/> | |
| 268 </assert_command> | |
| 269 <output_collection name="split_json" count="2"/> | |
| 270 <output_collection name="split_csv" count="2"/> | |
| 271 <output_collection name="split_aligned" count="2"/> | |
| 272 <output_collection name="split_plots" count="2"/> | |
| 273 </test> | |
| 274 <!-- Test 8: Fasta file, Window Size 5, RNA AUGGCU, Aligned FASTA files --> | |
| 275 <test expect_num_outputs="4"> | |
| 276 <section name="input_sequence"> | |
| 277 <conditional name="input_type_cond"> | |
| 278 <param name="input_type" value="fasta"/> | |
| 279 <param name="fasta_input" value="input.fasta" ftype="fasta"/> | |
| 280 </conditional> | |
| 281 </section> | |
| 282 <section name="tool_parameters"> | |
| 283 <param name="target" value="AUGGCU"/> | |
| 284 <param name="window_size" value="5"/> | |
| 285 </section> | |
| 286 <section name="output_options"> | |
| 287 <param name="generate_fasta" value="true"/> | |
| 288 </section> | |
| 289 <assert_command> | |
| 290 <has_text text="--fasta"/> | |
| 291 <has_text text="--rna 'AUGGCU'"/> | |
| 292 <has_text text="--window_size 5"/> | |
| 293 <has_text text="--json 'json'"/> | |
| 294 <has_text text="--csv 'tabular'"/> | |
| 295 </assert_command> | |
| 296 <output_collection name="split_json" count="2"/> | |
| 297 <output_collection name="split_csv" count="2"/> | |
| 298 <output_collection name="split_aligned" count="2"/> | |
| 299 <output_collection name="split_plots" type="list" count="0"/> | |
| 300 </test> | |
| 301 <!-- Test 9: Fasta file, Window Size 5, Top RNA, Aligned FASTA files --> | |
| 302 <test expect_num_outputs="4"> | |
| 303 <section name="input_sequence"> | |
| 304 <conditional name="input_type_cond"> | |
| 305 <param name="input_type" value="fasta"/> | |
| 306 <param name="fasta_input" value="input.fasta" ftype="fasta"/> | |
| 307 </conditional> | |
| 308 </section> | |
| 309 <section name="tool_parameters"> | |
| 310 <param name="window_size" value="5"/> | |
| 311 </section> | |
| 312 <section name="output_options"> | |
| 313 <param name="top_scoring_rna" value="true"/> | |
| 314 <param name="generate_fasta" value="true"/> | |
| 315 </section> | |
| 316 <assert_command> | |
| 317 <has_text text="--fasta"/> | |
| 318 <not_has_text text="--rna 'AUGGCU'"/> | |
| 319 <has_text text="--window_size 5"/> | |
| 320 <has_text text="--json 'json'"/> | |
| 321 <has_text text="--csv 'tabular'"/> | |
| 322 <has_text text="--aligned 'aligned'"/> | |
| 323 <has_text text="--top"/> | |
| 324 </assert_command> | |
| 325 <output_collection name="split_csv" type="list" count="0"/> | |
| 326 <output_collection name="split_json" type="list" count="2"/> | |
| 327 <output_collection name="split_plots" type="list" count="0"/> | |
| 328 <output_collection name="split_aligned" count="2"/> | |
| 329 </test> | |
| 330 <!-- Test 10: Fasta file, Window Size 5, Top RNA, with Plots, Aligned FASTA files --> | |
| 331 <test expect_num_outputs="4"> | |
| 332 <section name="input_sequence"> | |
| 333 <conditional name="input_type_cond"> | |
| 334 <param name="input_type" value="fasta"/> | |
| 335 <param name="fasta_input" value="input.fasta" ftype="fasta"/> | |
| 336 </conditional> | |
| 337 </section> | |
| 338 <section name="tool_parameters"> | |
| 339 <param name="window_size" value="5"/> | |
| 340 </section> | |
| 341 <section name="output_options"> | |
| 342 <param name="top_scoring_rna" value="true"/> | |
| 343 <param name="generate_fasta" value="true"/> | |
| 344 <param name="generate_plots" value="true"/> | |
| 345 </section> | |
| 346 <assert_command> | |
| 347 <has_text text="--fasta"/> | |
| 348 <not_has_text text="--rna 'AUGGCU'"/> | |
| 349 <has_text text="--window_size 5"/> | |
| 350 <has_text text="--json 'json'"/> | |
| 351 <has_text text="--csv 'tabular'"/> | |
| 352 <has_text text="--plot 'plots'"/> | |
| 353 <has_text text="--aligned 'aligned'"/> | |
| 354 <has_text text="--top"/> | |
| 355 </assert_command> | |
| 356 <output_collection name="split_csv" type="list" count="0"/> | |
| 357 <output_collection name="split_json" type="list" count="2"/> | |
| 358 <output_collection name="split_aligned" type="list" count="2"/> | |
| 359 <output_collection name="split_plots" type="list" count="8"/> | |
| 360 </test> | |
| 361 <!-- Test 11: Fasta file, Window Size 5, RNA AUGGCU, Aligned FASTA files --> | |
| 362 <test expect_num_outputs="4"> | |
| 363 <section name="input_sequence"> | |
| 364 <conditional name="input_type_cond"> | |
| 365 <param name="input_type" value="fasta"/> | |
| 366 <param name="fasta_input" value="input.fasta" ftype="fasta"/> | |
| 367 </conditional> | |
| 368 </section> | |
| 369 <section name="tool_parameters"> | |
| 370 <param name="window_size" value="5"/> | |
| 371 <param name="target" value="AUGGCU"/> | |
| 372 </section> | |
| 373 <section name="output_options"> | |
| 374 <param name="top_scoring_rna" value="false"/> | |
| 375 <param name="generate_fasta" value="true"/> | |
| 376 </section> | |
| 377 <assert_command> | |
| 378 <has_text text="--fasta"/> | |
| 379 <has_text text="--rna 'AUGGCU'"/> | |
| 380 <has_text text="--window_size 5"/> | |
| 381 <has_text text="--json 'json'"/> | |
| 382 <has_text text="--csv 'tabular'"/> | |
| 383 <has_text text="--aligned 'aligned'"/> | |
| 384 <not_has_text text="--top"/> | |
| 385 </assert_command> | |
| 386 <output_collection name="split_csv" type="list" count="2"/> | |
| 387 <output_collection name="split_json" type="list" count="2"/> | |
| 388 <output_collection name="split_plots" type="list" count="0"/> | |
| 389 <output_collection name="split_aligned" count="2"/> | |
| 390 </test> | |
| 391 <!-- Test 12: Fasta file, Window Size 5, RNA AUGGCU, with Plots, Aligned FASTA files --> | |
| 392 <test expect_num_outputs="4"> | |
| 393 <section name="input_sequence"> | |
| 394 <conditional name="input_type_cond"> | |
| 395 <param name="input_type" value="fasta"/> | |
| 396 <param name="fasta_input" value="input.fasta" ftype="fasta"/> | |
| 397 </conditional> | |
| 398 </section> | |
| 399 <section name="tool_parameters"> | |
| 400 <param name="window_size" value="5"/> | |
| 401 <param name="target" value="AUGGCU"/> | |
| 402 </section> | |
| 403 <section name="output_options"> | |
| 404 <param name="top_scoring_rna" value="false"/> | |
| 405 <param name="generate_fasta" value="true"/> | |
| 406 <param name="generate_plots" value="true"/> | |
| 407 </section> | |
| 408 <assert_command> | |
| 409 <has_text text="--fasta"/> | |
| 410 <has_text text="--rna 'AUGGCU'"/> | |
| 411 <has_text text="--window_size 5"/> | |
| 412 <has_text text="--json 'json'"/> | |
| 413 <has_text text="--csv 'tabular'"/> | |
| 414 <has_text text="--plot 'plots'"/> | |
| 415 <has_text text="--aligned 'aligned'"/> | |
| 416 <not_has_text text="--top"/> | |
| 417 </assert_command> | |
| 418 <output_collection name="split_csv" type="list" count="2"/> | |
| 419 <output_collection name="split_json" type="list" count="2"/> | |
| 420 <output_collection name="split_plots" type="list" count="2"/> | |
| 421 <output_collection name="split_aligned" count="2"/> | |
| 422 </test> | |
| 423 <!-- Test 13: Non-RRM-RNA protein (P05067) --> | |
| 424 <test> | |
| 425 <section name="input_sequence"> | |
| 426 <conditional name="input_type_cond"> | |
| 427 <param name="input_type" value="uniprot"/> | |
| 428 <param name="uniprot_id" value="P05067"/> | |
| 429 </conditional> | |
| 430 </section> | |
| 431 <section name="tool_parameters"> | |
| 432 <param name="target" value="AUGGCU"/> | |
| 433 <param name="window_size" value="5"/> | |
| 434 </section> | |
| 435 <section name="output_options"> | |
| 436 <param name="top_scoring_rna" value="false"/> | |
| 437 <param name="generate_plots" value="false"/> | |
| 438 <param name="generate_fasta" value="false"/> | |
| 439 </section> | |
| 440 <assert_command> | |
| 441 <has_text text="--uniprot 'P05067'"/> | |
| 442 <has_text text="--rna 'AUGGCU'"/> | |
| 443 <has_text text="--window_size 5"/> | |
| 444 <has_text text="--json 'json'"/> | |
| 445 <has_text text="--csv 'tabular'"/> | |
| 446 </assert_command> | |
| 447 <output_collection name="split_csv" type="list" count="0"/> | |
| 448 <output_collection name="split_json" type="list" count="0"/> | |
| 449 <output_collection name="split_plots" type="list" count="0"/> | |
| 450 <output_collection name="split_aligned" type="list" count="0"/> | |
| 451 </test> | |
| 452 </tests> | |
| 453 <creator> | |
| 454 <organization name="Bio2Byte, Vrije Universiteit Brussel (VUB)" address="Interuniversity Institute Bioinformatics Brussels, Université Libre de Bruxelles, 1050 Ixelles, Brussels, Belgium" url="https://bio2byte.be/rrmscorer" email="bio2byte@vub.be" image="https://0.gravatar.com/avatar/2b51fb7600d876086669bcc85a941b763a81d1c2bb3c667b8c83a1aa892cf740"/> | |
| 455 </creator> | |
| 456 <help><![CDATA[ | |
| 457 This tool allows you to predict RNA Recognition Motif (RRM) scores for protein | |
| 458 sequences provided in *FASTA* format or as *UniProt IDs*. | |
| 459 | |
| 460 **RRMScorer** is designed to predict RNA binding preferences for proteins containing | |
| 461 RNA recognition motifs (RRMs), the most prevalent RNA binding domain in eukaryotes. | |
| 462 | |
| 463 **Abstract:** | |
| 464 | |
| 465 By carefully analysing a dataset of 187 RRM-RNA structural complexes, we calculated | |
| 466 residue-level binding scores using a probabilistic model derived from | |
| 467 amino acid-nucleotide interaction propensities, which are the basis of | |
| 468 **RRMScorer**. | |
| 469 | |
| 470 With its ability to provide residue-level insights and accurate predictions, | |
| 471 **RRMScorer** serves as a valuable tool for researchers exploring the functional | |
| 472 landscape of RRM-RNA interactions. | |
| 473 | |
| 474 **Methodology**: | |
| 475 | |
| 476 The input sequence is scanned against our RRMScorer hidden Markov model (HMM) | |
| 477 to (i) identify whether the input sequence contains any RRM domain and (ii) | |
| 478 map to the 20 positions in the RRM protein sequence alignment that we use to compute | |
| 479 the RNA binding scores. | |
| 480 | |
| 481 If one or more RRM domains are identified in the input sequence, RRMScorer computes | |
| 482 the score of the user-defined RNA sequence, or if absent, the scores for all the | |
| 483 1024 RNA possible sequences with a length of 5 nt. By utilizing a specific | |
| 484 RNA sequence, the user can inspect to which 5-nt windows the RRM is more likely | |
| 485 to bind. | |
| 486 | |
| 487 **Input fields:** | |
| 488 | |
| 489 * **Protein sequence(s) FASTA format:** Provide a *FASTA* file containing the protein sequences. | |
| 490 * **Protein identifier from Uniprot:** Provide a *UniProt ID* (e.g. P19339). | |
| 491 * **Custom RNA target:** Enable or disable the use of a custom RNA target for the predictions. | |
| 492 * **Target:** Provide a valid target RNA sequence (minimum 5 nucleotides) if Custom RNA target is enabled. | |
| 493 * **The window size to test:** Select the window size (either 3 or 5 nucleotides). | |
| 494 * **Plot options:** Configure plot output options. | |
| 495 | |
| 496 **Output:** | |
| 497 | |
| 498 The results are provided in comprehensive bar plots as well as in | |
| 499 CSV and JSON formats. When a custom RNA is not provided, the results will | |
| 500 include protein sequence logos for a range of top-scoring RNA sequences, as well | |
| 501 as the aforementioned CSV and JSON files with the scores. | |
| 502 | |
| 503 **Funding:** | |
| 504 This project has received funding from the European Union's Horizon 2020 research | |
| 505 and innovation programme under the Marie Skłodowska-Curie grant | |
| 506 agreement No. 813239. This work was supported by the European Regional | |
| 507 Development Fund and Brussels-Capital Region-Innoviris within the framework of the | |
| 508 Operational Programme 2014-2020 (ERDF-2020 project ICITY-RDI.BRU) | |
| 509 ]]> | |
| 510 </help> | |
| 511 <citations> | |
| 512 <citation type="doi">10.1371/journal.pcbi.1010859</citation> | |
| 513 <citation type="doi">10.1093/nar/gkaf367</citation> | |
| 514 </citations> | |
| 515 </tool> |
