Mercurial > repos > eschen42 > mqppep_anova
diff workflow/ppenrich_suite_wf.ga @ 13:b41a077af3aa draft
"planemo upload for repository https://github.com/galaxyproteomics/tools-galaxyp/tree/master/tools/mqppep commit 040e4945da00a279cb60daae799fce9489f99c50"
author | eschen42 |
---|---|
date | Tue, 22 Mar 2022 20:47:40 +0000 |
parents | |
children | 6679616d0c18 |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/workflow/ppenrich_suite_wf.ga Tue Mar 22 20:47:40 2022 +0000 @@ -0,0 +1,652 @@ +{ + "a_galaxy_workflow": "true", + "annotation": "phosphoproteomic enrichment data pre-processing and ANOVA", + "creator": [ + { + "class": "Person", + "identifier": "0000-0002-2882-0508", + "name": "Art Eschenlauer" + } + ], + "format-version": "0.1", + "license": "MIT", + "name": "ppenrich_suite_wf", + "steps": { + "0": { + "annotation": "The Phospho (STY)Sites.txt file produced by MaxQuant (found in the txt folder).", + "content_id": null, + "errors": null, + "id": 0, + "input_connections": {}, + "inputs": [ + { + "description": "The Phospho (STY)Sites.txt file produced by MaxQuant (found in the txt folder).", + "name": "Phospho (STY)Sites.txt" + } + ], + "label": "Phospho (STY)Sites.txt", + "name": "Input dataset", + "outputs": [], + "position": { + "bottom": 346.3999938964844, + "height": 81.89999389648438, + "left": 495, + "right": 695, + "top": 264.5, + "width": 200, + "x": 495, + "y": 264.5 + }, + "tool_id": null, + "tool_state": "{\"optional\": false, \"format\": [\"tabular\"]}", + "tool_version": null, + "type": "data_input", + "uuid": "21c3c29d-9e8c-4ece-b585-9e68fed7a93f", + "workflow_outputs": [] + }, + "1": { + "annotation": "FASTA file of all human canonical isoforms, derived from Swiss-Prot (e.g., merge of https://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/complete/uniprot_sprot_varsplic.fasta.gz and https://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/complete/uniprot_sprot.fasta.gz)", + "content_id": null, + "errors": null, + "id": 1, + "input_connections": {}, + "inputs": [ + { + "description": "FASTA file of all human canonical isoforms, derived from Swiss-Prot (e.g., merge of https://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/complete/uniprot_sprot_varsplic.fasta.gz and 
https://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/complete/uniprot_sprot.fasta.gz)", + "name": "SwissProt_Human_Canonical_Isoform.fasta" + } + ], + "label": "SwissProt_Human_Canonical_Isoform.fasta", + "name": "Input dataset", + "outputs": [], + "position": { + "bottom": 708.8000030517578, + "height": 102.30000305175781, + "left": 685, + "right": 885, + "top": 606.5, + "width": 200, + "x": 685, + "y": 606.5 + }, + "tool_id": null, + "tool_state": "{\"optional\": false, \"format\": [\"fasta\"]}", + "tool_version": null, + "type": "data_input", + "uuid": "5da7317c-4def-48f3-8eac-af95bd18b290", + "workflow_outputs": [] + }, + "2": { + "annotation": "Derived from https://networkin.info/download/networkin_human_predictions_3.1.tsv.xz (which is free for non-commercial use - for required citation, see https://networkin.info/)", + "content_id": null, + "errors": null, + "id": 2, + "input_connections": {}, + "inputs": [ + { + "description": "Derived from https://networkin.info/download/networkin_human_predictions_3.1.tsv.xz (which is free for non-commercial use - for required citation, see https://networkin.info/)", + "name": "NetworKIN_cutoffscore2.0.tabular" + } + ], + "label": "NetworKIN_cutoffscore2.0.tabular", + "name": "Input dataset", + "outputs": [], + "position": { + "bottom": 853.8000030517578, + "height": 102.30000305175781, + "left": 696, + "right": 896, + "top": 751.5, + "width": 200, + "x": 696, + "y": 751.5 + }, + "tool_id": null, + "tool_state": "{\"optional\": false, \"format\": [\"tabular\"]}", + "tool_version": null, + "type": "data_input", + "uuid": "2edff8de-4379-45e2-b6b9-6ed4706bbf00", + "workflow_outputs": [] + }, + "3": { + "annotation": "Derived from http://hprd.org/serine_motifs, http://hprd.org/tyrosine_motifs, and http://pegasus.biochem.mpg.de/phosida/help/motifs.aspx", + "content_id": null, + "errors": null, + "id": 3, + "input_connections": {}, + "inputs": [ + { + "description": "Derived from 
http://hprd.org/serine_motifs, http://hprd.org/tyrosine_motifs, and http://pegasus.biochem.mpg.de/phosida/help/motifs.aspx", + "name": "pSTY_Motifs.tabular" + } + ], + "label": "pSTY_Motifs.tabular", + "name": "Input dataset", + "outputs": [], + "position": { + "bottom": 977.3999938964844, + "height": 81.89999389648438, + "left": 708, + "right": 908, + "top": 895.5, + "width": 200, + "x": 708, + "y": 895.5 + }, + "tool_id": null, + "tool_state": "{\"optional\": false, \"format\": [\"tabular\"]}", + "tool_version": null, + "type": "data_input", + "uuid": "86ebaaf2-b050-4eca-a88b-23a4c1af39f5", + "workflow_outputs": [] + }, + "4": { + "annotation": "Derived from Kinase_Substrate_Dataset.gz found at https://www.phosphosite.org/staticDownloads (free for non-commercial use - see that link for citation.)", + "content_id": null, + "errors": null, + "id": 4, + "input_connections": {}, + "inputs": [ + { + "description": "Derived from Kinase_Substrate_Dataset.gz found at https://www.phosphosite.org/staticDownloads (free for non-commercial use - see that link for citation.)", + "name": "PSP_Kinase_Substrate_Dataset.tabular" + } + ], + "label": "PSP_Kinase_Substrate_Dataset.tabular", + "name": "Input dataset", + "outputs": [], + "position": { + "bottom": 1126.8000030517578, + "height": 102.30000305175781, + "left": 729, + "right": 929, + "top": 1024.5, + "width": 200, + "x": 729, + "y": 1024.5 + }, + "tool_id": null, + "tool_state": "{\"optional\": false, \"format\": [\"tabular\"]}", + "tool_version": null, + "type": "data_input", + "uuid": "92f16705-a19c-4fb9-b278-3ae8e11f09d8", + "workflow_outputs": [] + }, + "5": { + "annotation": "Derived from Regulatory_sites.gz found at https://www.phosphosite.org/staticDownloads (free for non-commercial use - see that link for citation.)", + "content_id": null, + "errors": null, + "id": 5, + "input_connections": {}, + "inputs": [ + { + "description": "Derived from Regulatory_sites.gz found at https://www.phosphosite.org/staticDownloads 
(free for non-commercial use - see that link for citation.)", + "name": "PSP_Regulatory_sites.tabular" + } + ], + "label": "PSP_Regulatory_sites.tabular", + "name": "Input dataset", + "outputs": [], + "position": { + "bottom": 1251.3999938964844, + "height": 81.89999389648438, + "left": 745, + "right": 945, + "top": 1169.5, + "width": 200, + "x": 745, + "y": 1169.5 + }, + "tool_id": null, + "tool_state": "{\"optional\": false, \"format\": [\"tabular\"]}", + "tool_version": null, + "type": "data_input", + "uuid": "5ab49d93-11e4-4e91-b30b-92269b319879", + "workflow_outputs": [] + }, + "6": { + "annotation": "List of alpha cutoff values for significance testing; text file having no header and a single line for each cutoff value.", + "content_id": null, + "errors": null, + "id": 6, + "input_connections": {}, + "inputs": [ + { + "description": "List of alpha cutoff values for significance testing; text file having no header and a single line for each cutoff value.", + "name": "alpha_levels.tabular" + } + ], + "label": "alpha_levels.tabular", + "name": "Input dataset", + "outputs": [], + "position": { + "bottom": 1501.8999938964844, + "height": 81.89999389648438, + "left": 727, + "right": 927, + "top": 1420, + "width": 200, + "x": 727, + "y": 1420 + }, + "tool_id": null, + "tool_state": "{\"optional\": false, \"format\": [\"tabular\"]}", + "tool_version": null, + "type": "data_input", + "uuid": "481c627c-a4ce-45d7-b659-4f54692aafc7", + "workflow_outputs": [] + }, + "7": { + "annotation": "", + "content_id": "mqppep_preproc", + "errors": null, + "id": 7, + "input_connections": { + "networkin": { + "id": 2, + "output_name": "output" + }, + "p_sty_motifs": { + "id": 3, + "output_name": "output" + }, + "phosphoSites": { + "id": 0, + "output_name": "output" + }, + "protein_fasta": { + "id": 1, + "output_name": "output" + }, + "psp_kinase_substrate": { + "id": 4, + "output_name": "output" + }, + "psp_regulatory_sites": { + "id": 5, + "output_name": "output" + } + }, + 
"inputs": [], + "label": null, + "name": "MaxQuant Phosphopeptide Preprocessing", + "outputs": [ + { + "name": "phosphoPepIntensities", + "type": "tabular" + }, + { + "name": "enrichGraph", + "type": "pdf" + }, + { + "name": "locProbCutoffGraph", + "type": "pdf" + }, + { + "name": "enrichGraph_svg", + "type": "svg" + }, + { + "name": "locProbCutoffGraph_svg", + "type": "svg" + }, + { + "name": "filteredData_tabular", + "type": "tabular" + }, + { + "name": "quantData_tabular", + "type": "tabular" + }, + { + "name": "mapped_phophopeptides", + "type": "tabular" + }, + { + "name": "melted_phophopeptide_map", + "type": "tabular" + }, + { + "name": "mqppep_output_sqlite", + "type": "sqlite" + }, + { + "name": "preproc_tab", + "type": "tabular" + }, + { + "name": "preproc_csv", + "type": "csv" + }, + { + "name": "preproc_sqlite", + "type": "sqlite" + } + ], + "position": { + "bottom": 1408.7000122070312, + "height": 793.2000122070312, + "left": 1138.5, + "right": 1338.5, + "top": 615.5, + "width": 200, + "x": 1138.5, + "y": 615.5 + }, + "post_job_actions": { + "RenameDatasetActionenrichGraph": { + "action_arguments": { + "newname": "#{phosphoSites}.enrichGraph_pdf" + }, + "action_type": "RenameDatasetAction", + "output_name": "enrichGraph" + }, + "RenameDatasetActionenrichGraph_svg": { + "action_arguments": { + "newname": "#{phosphoSites}.enrichGraph_svg" + }, + "action_type": "RenameDatasetAction", + "output_name": "enrichGraph_svg" + }, + "RenameDatasetActionfilteredData_tabular": { + "action_arguments": { + "newname": "#{phosphoSites}.filteredData" + }, + "action_type": "RenameDatasetAction", + "output_name": "filteredData_tabular" + }, + "RenameDatasetActionlocProbCutoffGraph": { + "action_arguments": { + "newname": "#{phosphoSites}.locProbCutoffGraph_pdf" + }, + "action_type": "RenameDatasetAction", + "output_name": "locProbCutoffGraph" + }, + "RenameDatasetActionlocProbCutoffGraph_svg": { + "action_arguments": { + "newname": "#{phosphoSites}.locProbCutoffGraph_svg" 
+ }, + "action_type": "RenameDatasetAction", + "output_name": "locProbCutoffGraph_svg" + }, + "RenameDatasetActionmapped_phophopeptides": { + "action_arguments": { + "newname": "#{phosphoSites}.ppep_map" + }, + "action_type": "RenameDatasetAction", + "output_name": "mapped_phophopeptides" + }, + "RenameDatasetActionmelted_phophopeptide_map": { + "action_arguments": { + "newname": "#{phosphoSites}.melted" + }, + "action_type": "RenameDatasetAction", + "output_name": "melted_phophopeptide_map" + }, + "RenameDatasetActionmqppep_output_sqlite": { + "action_arguments": { + "newname": "#{phosphoSites}.ppep_mapping_sqlite" + }, + "action_type": "RenameDatasetAction", + "output_name": "mqppep_output_sqlite" + }, + "RenameDatasetActionphosphoPepIntensities": { + "action_arguments": { + "newname": "#{phosphoSites}.ppep_intensities" + }, + "action_type": "RenameDatasetAction", + "output_name": "phosphoPepIntensities" + }, + "RenameDatasetActionpreproc_csv": { + "action_arguments": { + "newname": "#{phosphoSites}.preproc_csv" + }, + "action_type": "RenameDatasetAction", + "output_name": "preproc_csv" + }, + "RenameDatasetActionpreproc_sqlite": { + "action_arguments": { + "newname": "#{phosphoSites}.preproc_sqlite" + }, + "action_type": "RenameDatasetAction", + "output_name": "preproc_sqlite" + }, + "RenameDatasetActionpreproc_tab": { + "action_arguments": { + "newname": "#{phosphoSites}.preproc_tab" + }, + "action_type": "RenameDatasetAction", + "output_name": "preproc_tab" + }, + "RenameDatasetActionquantData_tabular": { + "action_arguments": { + "newname": "#{phosphoSites}.quantData" + }, + "action_type": "RenameDatasetAction", + "output_name": "quantData_tabular" + } + }, + "tool_id": "mqppep_preproc", + "tool_state": "{\"collapseFunc\": \"sum\", \"intervalCol\": \"1\", \"localProbCutoff\": \"0.75\", \"merge_function\": \"sum\", \"networkin\": {\"__class__\": \"ConnectedValue\"}, \"p_sty_motifs\": {\"__class__\": \"ConnectedValue\"}, \"phosphoCol\": \"^Number of Phospho 
[(]STY[)]$\", \"phosphoSites\": {\"__class__\": \"ConnectedValue\"}, \"protein_fasta\": {\"__class__\": \"ConnectedValue\"}, \"psp_kinase_substrate\": {\"__class__\": \"ConnectedValue\"}, \"psp_regulatory_sites\": {\"__class__\": \"ConnectedValue\"}, \"pst_not_py\": \"true\", \"species\": \"human\", \"startCol\": \"^Intensity[^_]\", \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": null, + "type": "tool", + "uuid": "1e983dba-edca-4aed-a589-49b1651b4a85", + "workflow_outputs": [ + { + "label": "preproc_csv", + "output_name": "preproc_csv", + "uuid": "8cba5367-b25c-40e0-a324-552225b1aa1d" + }, + { + "label": "locProbCutoffGraph_pdf", + "output_name": "locProbCutoffGraph", + "uuid": "641c5959-dab4-42d1-986d-8e6aaeb74ef6" + }, + { + "label": "melted_phosphopeptide_map", + "output_name": "melted_phophopeptide_map", + "uuid": "878dc817-26a3-4061-9dd4-56e737b3c4f7" + }, + { + "label": "enrichGraph_svg", + "output_name": "enrichGraph_svg", + "uuid": "4492366c-945e-492f-8381-1c97c4da2264" + }, + { + "label": "locProbCutoffGraph_svg", + "output_name": "locProbCutoffGraph_svg", + "uuid": "06faf93c-5f04-4cb3-9e41-58e465f6180e" + }, + { + "label": "filteredData", + "output_name": "filteredData_tabular", + "uuid": "76e2e268-f728-45f0-9973-793fbde0dd0a" + }, + { + "label": "ppep_map", + "output_name": "mapped_phophopeptides", + "uuid": "d0fea028-2ea5-4862-8a92-c2088edfcbe1" + }, + { + "label": "ppep_mapping_sqlite", + "output_name": "mqppep_output_sqlite", + "uuid": "eb996931-c548-4f3b-aaaa-39cc711df516" + }, + { + "label": "preproc_tab", + "output_name": "preproc_tab", + "uuid": "c9410cf1-44a2-4aa6-b3df-06cef74f3a45" + }, + { + "label": "preproc_sqlite", + "output_name": "preproc_sqlite", + "uuid": "4eb22cc3-5879-4625-89c0-e0fddb01a197" + }, + { + "label": "ppep_intensities", + "output_name": "phosphoPepIntensities", + "uuid": "c704fd66-5ac3-4779-ad40-536955cd81e3" + }, + { + "label": "enrichGraph_pdf", + "output_name": "enrichGraph", + "uuid": 
"5bf2a478-0431-4d32-84a9-7d46aad80ec5" + }, + { + "label": "quantData", + "output_name": "quantData_tabular", + "uuid": "cc922a75-6e72-4e60-add2-4b6ed8f73cdb" + } + ] + }, + "8": { + "annotation": "Perform ANOVA. For imputing missing values, use median of non-missing values from the same treatment group.", + "content_id": "mqppep_anova", + "errors": null, + "id": 8, + "input_connections": { + "alpha_file": { + "id": 6, + "output_name": "output" + }, + "input_file": { + "id": 7, + "output_name": "preproc_tab" + } + }, + "inputs": [], + "label": "MaxQuant Phosphopeptide ANOVA group-median imputed", + "name": "MaxQuant Phosphopeptide ANOVA", + "outputs": [ + { + "name": "imputed_data_file", + "type": "tabular" + }, + { + "name": "report_file", + "type": "pdf" + } + ], + "position": { + "bottom": 1775.6000061035156, + "height": 255.60000610351562, + "left": 1370, + "right": 1570, + "top": 1520, + "width": 200, + "x": 1370, + "y": 1520 + }, + "post_job_actions": { + "RenameDatasetActionimputed_data_file": { + "action_arguments": { + "newname": "#{input_file}.intensities_group-mean-imputed_QN_LT" + }, + "action_type": "RenameDatasetAction", + "output_name": "imputed_data_file" + }, + "RenameDatasetActionreport_file": { + "action_arguments": { + "newname": "#{input_file}.intensities_group-mean-imputed_report (download/unzip to view)" + }, + "action_type": "RenameDatasetAction", + "output_name": "report_file" + } + }, + "tool_id": "mqppep_anova", + "tool_state": "{\"alpha_file\": {\"__class__\": \"ConnectedValue\"}, \"first_data_column\": \"Intensity\", \"imputation\": {\"imputation_method\": \"group-median\", \"__current_case__\": 0}, \"input_file\": {\"__class__\": \"ConnectedValue\"}, \"sample_grouping_regex\": \"(\\\\d+)\", \"sample_names_regex\": \"\\\\.(\\\\d+)[A-Z]$\", \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "tool_version": null, + "type": "tool", + "uuid": "ffa771c3-c52d-42a4-b78f-a60a39678792", + "workflow_outputs": [ + { + "label": 
"intensities_group-mean-imputed_QN_LT", + "output_name": "imputed_data_file", + "uuid": "169d677f-0acb-4c56-b057-21f4aaf2b920" + }, + { + "label": "intensities_group-mean-imputed_report", + "output_name": "report_file", + "uuid": "25edae88-3bb6-4ec9-8b98-686fded7ed79" + } + ] + }, + "9": { + "annotation": "Perform ANOVA. For imputing missing values, create random values.", + "content_id": "mqppep_anova", + "errors": null, + "id": 9, + "input_connections": { + "alpha_file": { + "id": 6, + "output_name": "output" + }, + "input_file": { + "id": 7, + "output_name": "preproc_tab" + } + }, + "inputs": [], + "label": "MaxQuant Phosphopeptide ANOVA randomly imputed", + "name": "MaxQuant Phosphopeptide ANOVA", + "outputs": [ + { + "name": "imputed_data_file", + "type": "tabular" + }, + { + "name": "report_file", + "type": "pdf" + } + ], + "position": { + "bottom": 1609.6000061035156, + "height": 255.60000610351562, + "left": 1617, + "right": 1817, + "top": 1354, + "width": 200, + "x": 1617, + "y": 1354 + }, + "post_job_actions": { + "RenameDatasetActionimputed_data_file": { + "action_arguments": { + "newname": "#{input_file}.intensities_randomly-imputed_QN_LT" + }, + "action_type": "RenameDatasetAction", + "output_name": "imputed_data_file" + }, + "RenameDatasetActionreport_file": { + "action_arguments": { + "newname": "#{input_file}.intensities_randomly-imputed_report (download/unzip to view)" + }, + "action_type": "RenameDatasetAction", + "output_name": "report_file" + } + }, + "tool_id": "mqppep_anova", + "tool_state": "{\"alpha_file\": {\"__class__\": \"ConnectedValue\"}, \"first_data_column\": \"Intensity\", \"imputation\": {\"imputation_method\": \"random\", \"__current_case__\": 3, \"meanPercentile\": \"1\", \"sdPercentile\": \"0.2\"}, \"input_file\": {\"__class__\": \"ConnectedValue\"}, \"sample_grouping_regex\": \"(\\\\d+)\", \"sample_names_regex\": \"\\\\.(\\\\d+)[A-Z]$\", \"__page__\": null, \"__rerun_remap_job_id__\": null}", + "type": "tool", + "uuid": 
"f1f2bdf9-fbc0-4205-b834-9a8af5814dc9", + "workflow_outputs": [ + { + "label": "intensities_randomly-imputed_QN_LT", + "output_name": "imputed_data_file", + "uuid": "d70a3476-fb42-4533-831b-4fcb2bda74fc" + }, + { + "label": "intensities_randomly-imputed_report", + "output_name": "report_file", + "uuid": "d6701a61-357b-4a27-8154-ca41eb16d8a6" + } + ] + } + }, + "tags": [ + "ppenrich" + ], + "uuid": "445a0eb0-25c7-44c0-8259-a3346b01cbf3", + "version": 3 +}