Mercurial > repos > eschen42 > mqppep_anova
view workflow/ppenrich_suite_wf.ga @ 14:6679616d0c18 draft
"planemo upload for repository https://github.com/galaxyproteomics/tools-galaxyp/tree/master/tools/mqppep commit 514e7b9b3a3730a5676821554449d5feb323eb9a"
author | eschen42 |
---|---|
date | Tue, 22 Mar 2022 23:12:18 +0000 |
parents | b41a077af3aa |
children | 2c5f1a2fe16a |
line wrap: on
line source
{ "a_galaxy_workflow": "true", "annotation": "phosphoproteomic enrichment data pre-processing and ANOVA", "creator": [ { "class": "Person", "identifier": "0000-0002-2882-0508", "name": "Art Eschenlauer" } ], "format-version": "0.1", "license": "MIT", "name": "ppenrich_suite_wf", "steps": { "0": { "annotation": "The Phospho (STY)Sites.txt file produced by MaxQuant (found in the txt folder).", "content_id": null, "errors": null, "id": 0, "input_connections": {}, "inputs": [ { "description": "The Phospho (STY)Sites.txt file produced by MaxQuant (found in the txt folder).", "name": "Phospho (STY)Sites.txt" } ], "label": "Phospho (STY)Sites.txt", "name": "Input dataset", "outputs": [], "position": { "bottom": 346.3999938964844, "height": 81.89999389648438, "left": 495, "right": 695, "top": 264.5, "width": 200, "x": 495, "y": 264.5 }, "tool_id": null, "tool_state": "{\"optional\": false, \"format\": [\"tabular\"]}", "tool_version": null, "type": "data_input", "uuid": "21c3c29d-9e8c-4ece-b585-9e68fed7a93f", "workflow_outputs": [] }, "1": { "annotation": "FASTA file of all human canonical isoforms, derived from Swiss-Prot (e.g., merge of https://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/complete/uniprot_sprot_varsplic.fasta.gz and https://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/complete/uniprot_sprot.fasta.gz)", "content_id": null, "errors": null, "id": 1, "input_connections": {}, "inputs": [ { "description": "FASTA file of all human canonical isoforms, derived from Swiss-Prot (e.g., merge of https://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/complete/uniprot_sprot_varsplic.fasta.gz and https://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/complete/uniprot_sprot.fasta.gz)", "name": "SwissProt_Human_Canonical_Isoform.fasta" } ], "label": "SwissProt_Human_Canonical_Isoform.fasta", "name": "Input dataset", "outputs": [], "position": { "bottom": 708.8000030517578, "height": 
102.30000305175781, "left": 685, "right": 885, "top": 606.5, "width": 200, "x": 685, "y": 606.5 }, "tool_id": null, "tool_state": "{\"optional\": false, \"format\": [\"fasta\"]}", "tool_version": null, "type": "data_input", "uuid": "5da7317c-4def-48f3-8eac-af95bd18b290", "workflow_outputs": [] }, "2": { "annotation": "Derived from https://networkin.info/download/networkin_human_predictions_3.1.tsv.xz (which is free for non-commercial use - for required citation, see https://networkin.info/)", "content_id": null, "errors": null, "id": 2, "input_connections": {}, "inputs": [ { "description": "Derived from https://networkin.info/download/networkin_human_predictions_3.1.tsv.xz (which is free for non-commercial use - for required citation, see https://networkin.info/)", "name": "NetworKIN_cutoffscore2.0.tabular" } ], "label": "NetworKIN_cutoffscore2.0.tabular", "name": "Input dataset", "outputs": [], "position": { "bottom": 853.8000030517578, "height": 102.30000305175781, "left": 696, "right": 896, "top": 751.5, "width": 200, "x": 696, "y": 751.5 }, "tool_id": null, "tool_state": "{\"optional\": false, \"format\": [\"tabular\"]}", "tool_version": null, "type": "data_input", "uuid": "2edff8de-4379-45e2-b6b9-6ed4706bbf00", "workflow_outputs": [] }, "3": { "annotation": "Derived from http://hprd.org/serine_motifs, http://hprd.org/tyrosine_motifs, and http://pegasus.biochem.mpg.de/phosida/help/motifs.aspx", "content_id": null, "errors": null, "id": 3, "input_connections": {}, "inputs": [ { "description": "Derived from http://hprd.org/serine_motifs, http://hprd.org/tyrosine_motifs, and http://pegasus.biochem.mpg.de/phosida/help/motifs.aspx", "name": "pSTY_Motifs.tabular" } ], "label": "pSTY_Motifs.tabular", "name": "Input dataset", "outputs": [], "position": { "bottom": 977.3999938964844, "height": 81.89999389648438, "left": 708, "right": 908, "top": 895.5, "width": 200, "x": 708, "y": 895.5 }, "tool_id": null, "tool_state": "{\"optional\": false, \"format\": 
[\"tabular\"]}", "tool_version": null, "type": "data_input", "uuid": "86ebaaf2-b050-4eca-a88b-23a4c1af39f5", "workflow_outputs": [] }, "4": { "annotation": "Derived from Kinase_Substrate_Dataset.gz found at https://www.phosphosite.org/staticDownloads (free for non-commercial use - see that link for citation.)", "content_id": null, "errors": null, "id": 4, "input_connections": {}, "inputs": [ { "description": "Derived from Kinase_Substrate_Dataset.gz found at https://www.phosphosite.org/staticDownloads (free for non-commercial use - see that link for citation.)", "name": "PSP_Kinase_Substrate_Dataset.tabular" } ], "label": "PSP_Kinase_Substrate_Dataset.tabular", "name": "Input dataset", "outputs": [], "position": { "bottom": 1126.8000030517578, "height": 102.30000305175781, "left": 729, "right": 929, "top": 1024.5, "width": 200, "x": 729, "y": 1024.5 }, "tool_id": null, "tool_state": "{\"optional\": false, \"format\": [\"tabular\"]}", "tool_version": null, "type": "data_input", "uuid": "92f16705-a19c-4fb9-b278-3ae8e11f09d8", "workflow_outputs": [] }, "5": { "annotation": "Derived from Regulatory_sites.gz found at https://www.phosphosite.org/staticDownloads (free for non-commercial use - see that link for citation.)", "content_id": null, "errors": null, "id": 5, "input_connections": {}, "inputs": [ { "description": "Derived from Regulatory_sites.gz found at https://www.phosphosite.org/staticDownloads (free for non-commercial use - see that link for citation.)", "name": "PSP_Regulatory_sites.tabular" } ], "label": "PSP_Regulatory_sites.tabular", "name": "Input dataset", "outputs": [], "position": { "bottom": 1251.3999938964844, "height": 81.89999389648438, "left": 745, "right": 945, "top": 1169.5, "width": 200, "x": 745, "y": 1169.5 }, "tool_id": null, "tool_state": "{\"optional\": false, \"format\": [\"tabular\"]}", "tool_version": null, "type": "data_input", "uuid": "5ab49d93-11e4-4e91-b30b-92269b319879", "workflow_outputs": [] }, "6": { "annotation": "List of alpha 
cutoff values for significance testing; text file having no header and a single line for each cutoff value.", "content_id": null, "errors": null, "id": 6, "input_connections": {}, "inputs": [ { "description": "List of alpha cutoff values for significance testing; text file having no header and a single line for each cutoff value.", "name": "alpha_levels.tabular" } ], "label": "alpha_levels.tabular", "name": "Input dataset", "outputs": [], "position": { "bottom": 1501.8999938964844, "height": 81.89999389648438, "left": 727, "right": 927, "top": 1420, "width": 200, "x": 727, "y": 1420 }, "tool_id": null, "tool_state": "{\"optional\": false, \"format\": [\"tabular\"]}", "tool_version": null, "type": "data_input", "uuid": "481c627c-a4ce-45d7-b659-4f54692aafc7", "workflow_outputs": [] }, "7": { "annotation": "", "content_id": "mqppep_preproc", "errors": null, "id": 7, "input_connections": { "networkin": { "id": 2, "output_name": "output" }, "p_sty_motifs": { "id": 3, "output_name": "output" }, "phosphoSites": { "id": 0, "output_name": "output" }, "protein_fasta": { "id": 1, "output_name": "output" }, "psp_kinase_substrate": { "id": 4, "output_name": "output" }, "psp_regulatory_sites": { "id": 5, "output_name": "output" } }, "inputs": [], "label": null, "name": "MaxQuant Phosphopeptide Preprocessing", "outputs": [ { "name": "phosphoPepIntensities", "type": "tabular" }, { "name": "enrichGraph", "type": "pdf" }, { "name": "locProbCutoffGraph", "type": "pdf" }, { "name": "enrichGraph_svg", "type": "svg" }, { "name": "locProbCutoffGraph_svg", "type": "svg" }, { "name": "filteredData_tabular", "type": "tabular" }, { "name": "quantData_tabular", "type": "tabular" }, { "name": "mapped_phophopeptides", "type": "tabular" }, { "name": "melted_phophopeptide_map", "type": "tabular" }, { "name": "mqppep_output_sqlite", "type": "sqlite" }, { "name": "preproc_tab", "type": "tabular" }, { "name": "preproc_csv", "type": "csv" }, { "name": "preproc_sqlite", "type": "sqlite" } ], 
"position": { "bottom": 1408.7000122070312, "height": 793.2000122070312, "left": 1138.5, "right": 1338.5, "top": 615.5, "width": 200, "x": 1138.5, "y": 615.5 }, "post_job_actions": { "RenameDatasetActionenrichGraph": { "action_arguments": { "newname": "#{phosphoSites}.enrichGraph_pdf" }, "action_type": "RenameDatasetAction", "output_name": "enrichGraph" }, "RenameDatasetActionenrichGraph_svg": { "action_arguments": { "newname": "#{phosphoSites}.enrichGraph_svg" }, "action_type": "RenameDatasetAction", "output_name": "enrichGraph_svg" }, "RenameDatasetActionfilteredData_tabular": { "action_arguments": { "newname": "#{phosphoSites}.filteredData" }, "action_type": "RenameDatasetAction", "output_name": "filteredData_tabular" }, "RenameDatasetActionlocProbCutoffGraph": { "action_arguments": { "newname": "#{phosphoSites}.locProbCutoffGraph_pdf" }, "action_type": "RenameDatasetAction", "output_name": "locProbCutoffGraph" }, "RenameDatasetActionlocProbCutoffGraph_svg": { "action_arguments": { "newname": "#{phosphoSites}.locProbCutoffGraph_svg" }, "action_type": "RenameDatasetAction", "output_name": "locProbCutoffGraph_svg" }, "RenameDatasetActionmapped_phophopeptides": { "action_arguments": { "newname": "#{phosphoSites}.ppep_map" }, "action_type": "RenameDatasetAction", "output_name": "mapped_phophopeptides" }, "RenameDatasetActionmelted_phophopeptide_map": { "action_arguments": { "newname": "#{phosphoSites}.melted" }, "action_type": "RenameDatasetAction", "output_name": "melted_phophopeptide_map" }, "RenameDatasetActionmqppep_output_sqlite": { "action_arguments": { "newname": "#{phosphoSites}.ppep_mapping_sqlite" }, "action_type": "RenameDatasetAction", "output_name": "mqppep_output_sqlite" }, "RenameDatasetActionphosphoPepIntensities": { "action_arguments": { "newname": "#{phosphoSites}.ppep_intensities" }, "action_type": "RenameDatasetAction", "output_name": "phosphoPepIntensities" }, "RenameDatasetActionpreproc_csv": { "action_arguments": { "newname": 
"#{phosphoSites}.preproc_csv" }, "action_type": "RenameDatasetAction", "output_name": "preproc_csv" }, "RenameDatasetActionpreproc_sqlite": { "action_arguments": { "newname": "#{phosphoSites}.preproc_sqlite" }, "action_type": "RenameDatasetAction", "output_name": "preproc_sqlite" }, "RenameDatasetActionpreproc_tab": { "action_arguments": { "newname": "#{phosphoSites}.preproc_tab" }, "action_type": "RenameDatasetAction", "output_name": "preproc_tab" }, "RenameDatasetActionquantData_tabular": { "action_arguments": { "newname": "#{phosphoSites}.quantData" }, "action_type": "RenameDatasetAction", "output_name": "quantData_tabular" } }, "tool_id": "mqppep_preproc", "tool_state": "{\"collapseFunc\": \"sum\", \"intervalCol\": \"1\", \"localProbCutoff\": \"0.75\", \"merge_function\": \"sum\", \"networkin\": {\"__class__\": \"ConnectedValue\"}, \"p_sty_motifs\": {\"__class__\": \"ConnectedValue\"}, \"phosphoCol\": \"^Number of Phospho [(]STY[)]$\", \"phosphoSites\": {\"__class__\": \"ConnectedValue\"}, \"protein_fasta\": {\"__class__\": \"ConnectedValue\"}, \"psp_kinase_substrate\": {\"__class__\": \"ConnectedValue\"}, \"psp_regulatory_sites\": {\"__class__\": \"ConnectedValue\"}, \"pst_not_py\": \"true\", \"pst_py_selector\": \"st\", \"species\": \"human\", \"startCol\": \"^Intensity[^_]\", \"__page__\": null, \"__rerun_remap_job_id__\": null}", "tool_version": null, "type": "tool", "uuid": "1e983dba-edca-4aed-a589-49b1651b4a85", "workflow_outputs": [ { "label": "preproc_csv", "output_name": "preproc_csv", "uuid": "8cba5367-b25c-40e0-a324-552225b1aa1d" }, { "label": "locProbCutoffGraph_pdf", "output_name": "locProbCutoffGraph", "uuid": "641c5959-dab4-42d1-986d-8e6aaeb74ef6" }, { "label": "melted_phosphopeptide_map", "output_name": "melted_phophopeptide_map", "uuid": "878dc817-26a3-4061-9dd4-56e737b3c4f7" }, { "label": "enrichGraph_svg", "output_name": "enrichGraph_svg", "uuid": "4492366c-945e-492f-8381-1c97c4da2264" }, { "label": "locProbCutoffGraph_svg", "output_name": 
"locProbCutoffGraph_svg", "uuid": "06faf93c-5f04-4cb3-9e41-58e465f6180e" }, { "label": "filteredData", "output_name": "filteredData_tabular", "uuid": "76e2e268-f728-45f0-9973-793fbde0dd0a" }, { "label": "ppep_map", "output_name": "mapped_phophopeptides", "uuid": "d0fea028-2ea5-4862-8a92-c2088edfcbe1" }, { "label": "ppep_mapping_sqlite", "output_name": "mqppep_output_sqlite", "uuid": "eb996931-c548-4f3b-aaaa-39cc711df516" }, { "label": "preproc_tab", "output_name": "preproc_tab", "uuid": "c9410cf1-44a2-4aa6-b3df-06cef74f3a45" }, { "label": "preproc_sqlite", "output_name": "preproc_sqlite", "uuid": "4eb22cc3-5879-4625-89c0-e0fddb01a197" }, { "label": "ppep_intensities", "output_name": "phosphoPepIntensities", "uuid": "c704fd66-5ac3-4779-ad40-536955cd81e3" }, { "label": "enrichGraph_pdf", "output_name": "enrichGraph", "uuid": "5bf2a478-0431-4d32-84a9-7d46aad80ec5" }, { "label": "quantData", "output_name": "quantData_tabular", "uuid": "cc922a75-6e72-4e60-add2-4b6ed8f73cdb" } ] }, "8": { "annotation": "Perform ANOVA. 
For imputing missing values, use median of non-missing values from the same treatment group.", "content_id": "mqppep_anova", "errors": null, "id": 8, "input_connections": { "alpha_file": { "id": 6, "output_name": "output" }, "input_file": { "id": 7, "output_name": "preproc_tab" } }, "inputs": [], "label": "MaxQuant Phosphopeptide ANOVA group-median imputed", "name": "MaxQuant Phosphopeptide ANOVA", "outputs": [ { "name": "imputed_data_file", "type": "tabular" }, { "name": "imp_qn_lt_file", "type": "tabular" }, { "name": "report_file", "type": "pdf" } ], "position": { "bottom": 1775.6000061035156, "height": 255.60000610351562, "left": 1370, "right": 1570, "top": 1520, "width": 200, "x": 1370, "y": 1520 }, "post_job_actions": { "RenameDatasetActionimp_qn_lt_file": { "action_arguments": { "newname": "#{input_file}.intensities_group-mean-imputed_QN_LT" }, "action_type": "RenameDatasetAction", "output_name": "imp_qn_lt_file" }, "RenameDatasetActionimputed_data_file": { "action_arguments": { "newname": "#{input_file}.intensities_group-mean-imputed" }, "action_type": "RenameDatasetAction", "output_name": "imputed_data_file" }, "RenameDatasetActionreport_file": { "action_arguments": { "newname": "#{input_file}.intensities_group-mean-imputed_report (download/unzip to view)" }, "action_type": "RenameDatasetAction", "output_name": "report_file" } }, "tool_id": "mqppep_anova", "tool_state": "{\"alpha_file\": {\"__class__\": \"ConnectedValue\"}, \"first_data_column\": \"Intensity\", \"imputation\": {\"imputation_method\": \"group-median\", \"__current_case__\": 0}, \"input_file\": {\"__class__\": \"ConnectedValue\"}, \"sample_grouping_regex\": \"(\\\\d+)\", \"sample_names_regex\": \"\\\\.(\\\\d+)[A-Z]$\", \"__page__\": null, \"__rerun_remap_job_id__\": null}", "tool_version": null, "type": "tool", "uuid": "ffa771c3-c52d-42a4-b78f-a60a39678792", "workflow_outputs": [ { "label": "intensities_group-mean-imputed_QN_LT", "output_name": "imp_qn_lt_file", "uuid": 
"0e77a2e0-bd7a-4487-aaa6-ead2469509a2" }, { "label": "intensities_group-mean-imputed", "output_name": "imputed_data_file", "uuid": "169d677f-0acb-4c56-b057-21f4aaf2b920" }, { "label": "intensities_group-mean-imputed_report", "output_name": "report_file", "uuid": "25edae88-3bb6-4ec9-8b98-686fded7ed79" } ] }, "9": { "annotation": "Perform ANOVA. For imputing missing values, create random values.", "content_id": "mqppep_anova", "errors": null, "id": 9, "input_connections": { "alpha_file": { "id": 6, "output_name": "output" }, "input_file": { "id": 7, "output_name": "preproc_tab" } }, "inputs": [], "label": "MaxQuant Phosphopeptide ANOVA randomly imputed", "name": "MaxQuant Phosphopeptide ANOVA", "outputs": [ { "name": "imputed_data_file", "type": "tabular" }, { "name": "imp_qn_lt_file", "type": "tabular" }, { "name": "report_file", "type": "pdf" } ], "position": { "bottom": 1609.6000061035156, "height": 255.60000610351562, "left": 1617, "right": 1817, "top": 1354, "width": 200, "x": 1617, "y": 1354 }, "post_job_actions": { "RenameDatasetActionimp_qn_lt_file": { "action_arguments": { "newname": "#{input_file}.intensities_randomly-imputed_QN_LT" }, "action_type": "RenameDatasetAction", "output_name": "imp_qn_lt_file" }, "RenameDatasetActionimputed_data_file": { "action_arguments": { "newname": "#{input_file}.intensities_randomly-imputed" }, "action_type": "RenameDatasetAction", "output_name": "imputed_data_file" }, "RenameDatasetActionreport_file": { "action_arguments": { "newname": "#{input_file}.intensities_randomly-imputed_report (download/unzip to view)" }, "action_type": "RenameDatasetAction", "output_name": "report_file" } }, "tool_id": "mqppep_anova", "tool_state": "{\"alpha_file\": {\"__class__\": \"ConnectedValue\"}, \"first_data_column\": \"Intensity\", \"imputation\": {\"imputation_method\": \"random\", \"__current_case__\": 3, \"meanPercentile\": \"1\", \"sdPercentile\": \"0.2\"}, \"input_file\": {\"__class__\": \"ConnectedValue\"}, 
\"sample_grouping_regex\": \"(\\\\d+)\", \"sample_names_regex\": \"\\\\.(\\\\d+)[A-Z]$\", \"__page__\": null, \"__rerun_remap_job_id__\": null}", "tool_version": null, "type": "tool", "uuid": "f1f2bdf9-fbc0-4205-b834-9a8af5814dc9", "workflow_outputs": [ { "label": "intensities_randomly-imputed", "output_name": "imputed_data_file", "uuid": "d70a3476-fb42-4533-831b-4fcb2bda74fc" }, { "label": "intensities_randomly-imputed_report", "output_name": "report_file", "uuid": "d6701a61-357b-4a27-8154-ca41eb16d8a6" }, { "label": "intensities_randomly-imputed_QN_LT", "output_name": "imp_qn_lt_file", "uuid": "637faf12-0d52-45b3-a318-40bfc7fcd4cb" } ] } }, "tags": [ "ppenrich" ], "uuid": "445a0eb0-25c7-44c0-8259-a3346b01cbf3", "version": 3 }