sklearn_stacking_ensemble_models: train_test

comparison train_test_split.py @ 11:0380f10c4e04 draft

"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit ea12f973df4b97a2691d9e4ce6bf6fae59d57717"

author	bgruening
date	Fri, 30 Apr 2021 23:23:56 +0000
parents	2d890789ac48
children

comparison

equal deleted inserted replaced

-:2d890789ac48
+:0380f10c4e04
 nth_split = params["mode_selection"]["nth_split"]
 # read groups
 if infile_groups:
-header = "infer" if (params["mode_selection"]["cv_selector"]["groups_selector"]["header_g"]) else None
+header = (
-column_option = params["mode_selection"]["cv_selector"]["groups_selector"]["column_selector_options_g"][
+"infer"
-"selected_column_selector_option_g"
+if (params["mode_selection"]["cv_selector"]["groups_selector"]["header_g"])
-]
+else None
+)
+column_option = params["mode_selection"]["cv_selector"]["groups_selector"][
+"column_selector_options_g"
+]["selected_column_selector_option_g"]
 if column_option in [
 "by_index_number",
 "all_but_by_index_number",
 "by_header_name",
 "all_but_by_header_name",
 ]:
-c = params["mode_selection"]["cv_selector"]["groups_selector"]["column_selector_options_g"]["col_g"]
+c = params["mode_selection"]["cv_selector"]["groups_selector"][
+"column_selector_options_g"
+]["col_g"]
 else:
 c = None
 groups = read_columns(
 infile_groups,
 # construct the cv splitter object
 splitter, groups = get_cv(params["mode_selection"]["cv_selector"])
 total_n_splits = splitter.get_n_splits(array.values, y=y, groups=groups)
 if nth_split > total_n_splits:
-raise ValueError("Total number of splits is {}, but got `nth_split` " "= {}".format(total_n_splits, nth_split))
+raise ValueError(
+"Total number of splits is {}, but got `nth_split` "
+"= {}".format(total_n_splits, nth_split)
+)
 i = 1
 for train_index, test_index in splitter.split(array.values, y=y, groups=groups):
 # suppose nth_split >= 1
 if i == nth_split:
 train, test = train_test_split(array, **options)
 # cv splitter
 else:
-train, test = _get_single_cv_split(params, array, infile_labels=infile_labels, infile_groups=infile_groups)
+train, test = _get_single_cv_split(
+params, array, infile_labels=infile_labels, infile_groups=infile_groups
+)
 print("Input shape: %s" % repr(array.shape))
 print("Train shape: %s" % repr(train.shape))
 print("Test shape: %s" % repr(test.shape))
 train.to_csv(outfile_train, sep="\t", header=input_header, index=False)

Mercurial > repos > bgruening > sklearn_stacking_ensemble_models

comparison train_test_split.py @ 11:0380f10c4e04 draft