Mercurial > repos > bgruening > sklearn_stacking_ensemble_models
annotate ml_visualization_ex.py @ 4:17f173a4a745 draft
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 02087ce2966cf8b4aac9197a41171e7f986c11d1-dirty"
| author | bgruening | 
|---|---|
| date | Wed, 02 Oct 2019 03:28:39 -0400 | 
| parents | 963e449636d3 | 
| children | 00819b7f2f55 | 
| rev | line source | 
|---|---|
| 3 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 1 import argparse | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 2 import json | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 3 import numpy as np | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 4 import pandas as pd | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 5 import plotly | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 6 import plotly.graph_objs as go | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 7 import warnings | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 8 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 9 from keras.models import model_from_json | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 10 from keras.utils import plot_model | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 11 from sklearn.feature_selection.base import SelectorMixin | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 12 from sklearn.metrics import precision_recall_curve, average_precision_score | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 13 from sklearn.metrics import roc_curve, auc | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 14 from sklearn.pipeline import Pipeline | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 15 from galaxy_ml.utils import load_model, read_columns, SafeEval | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 16 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 17 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 18 safe_eval = SafeEval() | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 19 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 20 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 21 def main(inputs, infile_estimator=None, infile1=None, | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 22 infile2=None, outfile_result=None, | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 23 outfile_object=None, groups=None, | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 24 ref_seq=None, intervals=None, | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 25 targets=None, fasta_path=None, | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 26 model_config=None): | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 27 """ | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 28 Parameters | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 29 ---------- | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 30 inputs : str | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 31 File path to galaxy tool parameter | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 32 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 33 infile_estimator : str, default is None | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 34 File path to estimator | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 35 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 36 infile1 : str, default is None | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 37 File path to dataset containing features or true labels. | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 38 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 39 infile2 : str, default is None | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 40 File path to dataset containing target values or predicted | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 41 probabilities. | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 42 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 43 outfile_result : str, default is None | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 44 File path to save the results, either cv_results or test result | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 45 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 46 outfile_object : str, default is None | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 47 File path to save searchCV object | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 48 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 49 groups : str, default is None | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 50 File path to dataset containing group labels | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 51 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 52 ref_seq : str, default is None | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 53 File path to dataset containing genome sequence file | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 54 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 55 intervals : str, default is None | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 56 File path to dataset containing interval file | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 57 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 58 targets : str, default is None | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 59 File path to dataset containing compressed target bed file | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 60 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 61 fasta_path : str, default is None | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 62 File path to dataset containing fasta file | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 63 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 64 model_config : str, default is None | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 65 File path to dataset containing JSON config for neural networks | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 66 """ | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 67 warnings.simplefilter('ignore') | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 68 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 69 with open(inputs, 'r') as param_handler: | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 70 params = json.load(param_handler) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 71 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 72 title = params['plotting_selection']['title'].strip() | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 73 plot_type = params['plotting_selection']['plot_type'] | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 74 if plot_type == 'feature_importances': | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 75 with open(infile_estimator, 'rb') as estimator_handler: | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 76 estimator = load_model(estimator_handler) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 77 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 78 column_option = (params['plotting_selection'] | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 79 ['column_selector_options'] | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 80 ['selected_column_selector_option']) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 81 if column_option in ['by_index_number', 'all_but_by_index_number', | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 82 'by_header_name', 'all_but_by_header_name']: | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 83 c = (params['plotting_selection'] | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 84 ['column_selector_options']['col1']) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 85 else: | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 86 c = None | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 87 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 88 _, input_df = read_columns(infile1, c=c, | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 89 c_option=column_option, | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 90 return_df=True, | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 91 sep='\t', header='infer', | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 92 parse_dates=True) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 93 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 94 feature_names = input_df.columns.values | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 95 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 96 if isinstance(estimator, Pipeline): | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 97 for st in estimator.steps[:-1]: | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 98 if isinstance(st[-1], SelectorMixin): | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 99 mask = st[-1].get_support() | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 100 feature_names = feature_names[mask] | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 101 estimator = estimator.steps[-1][-1] | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 102 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 103 if hasattr(estimator, 'coef_'): | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 104 coefs = estimator.coef_ | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 105 else: | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 106 coefs = getattr(estimator, 'feature_importances_', None) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 107 if coefs is None: | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 108 raise RuntimeError('The classifier does not expose ' | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 109 '"coef_" or "feature_importances_" ' | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 110 'attributes') | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 111 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 112 threshold = params['plotting_selection']['threshold'] | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 113 if threshold is not None: | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 114 mask = (coefs > threshold) | (coefs < -threshold) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 115 coefs = coefs[mask] | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 116 feature_names = feature_names[mask] | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 117 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 118 # sort | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 119 indices = np.argsort(coefs)[::-1] | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 120 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 121 trace = go.Bar(x=feature_names[indices], | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 122 y=coefs[indices]) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 123 layout = go.Layout(title=title or "Feature Importances") | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 124 fig = go.Figure(data=[trace], layout=layout) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 125 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 126 elif plot_type == 'pr_curve': | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 127 df1 = pd.read_csv(infile1, sep='\t', header=None) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 128 df2 = pd.read_csv(infile2, sep='\t', header=None) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 129 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 130 precision = {} | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 131 recall = {} | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 132 ap = {} | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 133 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 134 pos_label = params['plotting_selection']['pos_label'].strip() \ | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 135 or None | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 136 for col in df1.columns: | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 137 y_true = df1[col].values | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 138 y_score = df2[col].values | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 139 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 140 precision[col], recall[col], _ = precision_recall_curve( | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 141 y_true, y_score, pos_label=pos_label) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 142 ap[col] = average_precision_score( | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 143 y_true, y_score, pos_label=pos_label or 1) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 144 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 145 if len(df1.columns) > 1: | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 146 precision["micro"], recall["micro"], _ = precision_recall_curve( | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 147 df1.values.ravel(), df2.values.ravel(), pos_label=pos_label) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 148 ap['micro'] = average_precision_score( | 
| 4 
17f173a4a745
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 02087ce2966cf8b4aac9197a41171e7f986c11d1-dirty"
 bgruening parents: 
3diff
changeset | 149 df1.values, df2.values, average='micro', | 
| 
17f173a4a745
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 02087ce2966cf8b4aac9197a41171e7f986c11d1-dirty"
 bgruening parents: 
3diff
changeset | 150 pos_label=pos_label or 1) | 
| 3 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 151 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 152 data = [] | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 153 for key in precision.keys(): | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 154 trace = go.Scatter( | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 155 x=recall[key], | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 156 y=precision[key], | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 157 mode='lines', | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 158 name='%s (area = %.2f)' % (key, ap[key]) if key == 'micro' | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 159 else 'column %s (area = %.2f)' % (key, ap[key]) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 160 ) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 161 data.append(trace) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 162 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 163 layout = go.Layout( | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 164 title=title or "Precision-Recall curve", | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 165 xaxis=dict(title='Recall'), | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 166 yaxis=dict(title='Precision') | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 167 ) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 168 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 169 fig = go.Figure(data=data, layout=layout) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 170 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 171 elif plot_type == 'roc_curve': | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 172 df1 = pd.read_csv(infile1, sep='\t', header=None) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 173 df2 = pd.read_csv(infile2, sep='\t', header=None) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 174 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 175 fpr = {} | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 176 tpr = {} | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 177 roc_auc = {} | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 178 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 179 pos_label = params['plotting_selection']['pos_label'].strip() \ | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 180 or None | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 181 for col in df1.columns: | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 182 y_true = df1[col].values | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 183 y_score = df2[col].values | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 184 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 185 fpr[col], tpr[col], _ = roc_curve( | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 186 y_true, y_score, pos_label=pos_label) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 187 roc_auc[col] = auc(fpr[col], tpr[col]) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 188 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 189 if len(df1.columns) > 1: | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 190 fpr["micro"], tpr["micro"], _ = roc_curve( | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 191 df1.values.ravel(), df2.values.ravel(), pos_label=pos_label) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 192 roc_auc['micro'] = auc(fpr["micro"], tpr["micro"]) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 193 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 194 data = [] | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 195 for key in fpr.keys(): | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 196 trace = go.Scatter( | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 197 x=fpr[key], | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 198 y=tpr[key], | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 199 mode='lines', | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 200 name='%s (area = %.2f)' % (key, roc_auc[key]) if key == 'micro' | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 201 else 'column %s (area = %.2f)' % (key, roc_auc[key]) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 202 ) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 203 data.append(trace) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 204 | 
| 4 
17f173a4a745
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 02087ce2966cf8b4aac9197a41171e7f986c11d1-dirty"
 bgruening parents: 
3diff
changeset | 205 trace = go.Scatter(x=[0, 1], y=[0, 1], | 
| 3 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 206 mode='lines', | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 207 line=dict(color='black', dash='dash'), | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 208 showlegend=False) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 209 data.append(trace) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 210 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 211 layout = go.Layout( | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 212 title=title or "Receiver operating characteristic curve", | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 213 xaxis=dict(title='False Positive Rate'), | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 214 yaxis=dict(title='True Positive Rate') | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 215 ) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 216 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 217 fig = go.Figure(data=data, layout=layout) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 218 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 219 elif plot_type == 'rfecv_gridscores': | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 220 input_df = pd.read_csv(infile1, sep='\t', header='infer') | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 221 scores = input_df.iloc[:, 0] | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 222 steps = params['plotting_selection']['steps'].strip() | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 223 steps = safe_eval(steps) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 224 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 225 data = go.Scatter( | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 226 x=list(range(len(scores))), | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 227 y=scores, | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 228 text=[str(_) for _ in steps] if steps else None, | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 229 mode='lines' | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 230 ) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 231 layout = go.Layout( | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 232 xaxis=dict(title="Number of features selected"), | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 233 yaxis=dict(title="Cross validation score"), | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 234 title=title or None | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 235 ) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 236 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 237 fig = go.Figure(data=[data], layout=layout) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 238 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 239 elif plot_type == 'learning_curve': | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 240 input_df = pd.read_csv(infile1, sep='\t', header='infer') | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 241 plot_std_err = params['plotting_selection']['plot_std_err'] | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 242 data1 = go.Scatter( | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 243 x=input_df['train_sizes_abs'], | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 244 y=input_df['mean_train_scores'], | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 245 error_y=dict( | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 246 array=input_df['std_train_scores'] | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 247 ) if plot_std_err else None, | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 248 mode='lines', | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 249 name="Train Scores", | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 250 ) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 251 data2 = go.Scatter( | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 252 x=input_df['train_sizes_abs'], | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 253 y=input_df['mean_test_scores'], | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 254 error_y=dict( | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 255 array=input_df['std_test_scores'] | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 256 ) if plot_std_err else None, | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 257 mode='lines', | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 258 name="Test Scores", | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 259 ) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 260 layout = dict( | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 261 xaxis=dict( | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 262 title='No. of samples' | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 263 ), | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 264 yaxis=dict( | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 265 title='Performance Score' | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 266 ), | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 267 title=title or 'Learning Curve' | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 268 ) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 269 fig = go.Figure(data=[data1, data2], layout=layout) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 270 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 271 elif plot_type == 'keras_plot_model': | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 272 with open(model_config, 'r') as f: | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 273 model_str = f.read() | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 274 model = model_from_json(model_str) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 275 plot_model(model, to_file="output.png") | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 276 __import__('os').rename('output.png', 'output') | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 277 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 278 return 0 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 279 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 280 plotly.offline.plot(fig, filename="output.html", | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 281 auto_open=False) | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 282 # to be discovered by `from_work_dir` | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 283 __import__('os').rename('output.html', 'output') | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 284 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
changeset | 285 | 
| 
963e449636d3
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ba6a47bdf76bbf4cb276206ac1a8cbf61332fd16"
 bgruening parents: diff
if __name__ == '__main__':
    # Script entry point: parse the command-line options and forward them
    # to `main`.
    aparser = argparse.ArgumentParser()

    # `--inputs` is the only option declared as required.
    aparser.add_argument("-i", "--inputs", dest="inputs", required=True)

    # The remaining options are all optional and share the same shape
    # (short flag, long flag, destination attribute), so they are
    # registered from a table, in the same order as before.
    optional_flags = (
        ("-e", "--estimator", "infile_estimator"),
        ("-X", "--infile1", "infile1"),
        ("-y", "--infile2", "infile2"),
        ("-O", "--outfile_result", "outfile_result"),
        ("-o", "--outfile_object", "outfile_object"),
        ("-g", "--groups", "groups"),
        ("-r", "--ref_seq", "ref_seq"),
        ("-b", "--intervals", "intervals"),
        ("-t", "--targets", "targets"),
        ("-f", "--fasta_path", "fasta_path"),
        ("-c", "--model_config", "model_config"),
    )
    for short_flag, long_flag, dest_name in optional_flags:
        aparser.add_argument(short_flag, long_flag, dest=dest_name)

    args = aparser.parse_args()

    # These values are handed to `main` by keyword; the first five
    # arguments are passed positionally.
    keyword_names = (
        "outfile_object",
        "groups",
        "ref_seq",
        "intervals",
        "targets",
        "fasta_path",
        "model_config",
    )
    keyword_values = {name: getattr(args, name) for name in keyword_names}

    main(
        args.inputs,
        args.infile_estimator,
        args.infile1,
        args.infile2,
        args.outfile_result,
        **keyword_values
    )
