annotate feature_selection.xml @ 35:d3ab5b9028b9 draft default tip

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 80417bf0158a9b596e485dd66408f738f405145a
author bgruening
date Mon, 02 Oct 2023 09:15:54 +0000
parents b9d86fc6359d
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
34
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
1 <tool id="sklearn_feature_selection" name="Feature Selection" version="@VERSION@" profile="@PROFILE@">
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
2 <description>module, including univariate filter selection methods and recursive feature elimination algorithm</description>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
3 <macros>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
4 <import>main_macros.xml</import>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
5 </macros>
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
6 <expand macro="python_requirements" />
18
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
7 <!--TODO: Add imblearn package support-->
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
8 <expand macro="macro_stdio" />
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
9 <version_command>echo "@VERSION@"</version_command>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
10 <command>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
11 <![CDATA[
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
12 python "$feature_selection_script" '$inputs'
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
13 ]]>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
14 </command>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
15 <configfiles>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
16 <inputs name="inputs" />
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
17 <configfile name="feature_selection_script">
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
18 <![CDATA[
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
19 import json
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
20 import sklearn.feature_selection
18
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
21 import skrebate
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
22 import pandas
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
23 import sys
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
24 import warnings
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
25 import xgboost
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
26 from sklearn import (
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
27 cluster, compose, decomposition, ensemble, feature_extraction,
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
28 feature_selection, gaussian_process, kernel_approximation, metrics,
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
29 model_selection, naive_bayes, neighbors, pipeline, preprocessing,
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
30 svm, linear_model, tree, discriminant_analysis)
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
31 from imblearn.pipeline import Pipeline as imbPipeline
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
32 from sklearn.pipeline import Pipeline
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
33
34
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
34 from galaxy_ml.model_persist import dump_model_to_h5
20
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
35 from galaxy_ml.utils import (SafeEval, feature_selector,
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
36 read_columns, get_module)
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
37
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
38
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
39 warnings.simplefilter('ignore')
13
467550472f7d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit d00173591e4a783a4c1cb2664e4bb192ab5414f7
bgruening
parents: 10
diff changeset
40
467550472f7d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit d00173591e4a783a4c1cb2664e4bb192ab5414f7
bgruening
parents: 10
diff changeset
41 safe_eval = SafeEval()
3
0dc80ab8ec21 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 4ed8c4f6ef9ece81797a398b17a99bbaf49a6978
bgruening
parents: 2
diff changeset
42
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
43 input_json_path = sys.argv[1]
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
44 with open(input_json_path, 'r') as param_handler:
9
7701da597d1d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit f54ff2ba2f8e7542d68966ce5a6b17d7f624ac48
bgruening
parents: 6
diff changeset
45 params = json.load(param_handler)
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
46
18
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
47 ## Overwrite selected params entries with the values Cheetah substitutes into this script
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
48 #if $fs_algorithm_selector.selected_algorithm == 'SelectFromModel'\
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
49 and $fs_algorithm_selector.model_inputter.input_mode == 'prefitted':
10
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
50 params['fs_algorithm_selector']['model_inputter']['fitted_estimator'] =\
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
51 '$fs_algorithm_selector.model_inputter.fitted_estimator'
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
52 #end if
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
53
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
54 #if $fs_algorithm_selector.selected_algorithm == 'SelectFromModel'\
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
55 and $fs_algorithm_selector.model_inputter.input_mode == 'new'\
18
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
56 and $fs_algorithm_selector.model_inputter.estimator_selector.selected_module == 'custom_estimator':
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
57 params['fs_algorithm_selector']['model_inputter']['estimator_selector']['c_estimator'] =\
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
58 '$fs_algorithm_selector.model_inputter.estimator_selector.c_estimator'
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
59 #end if
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
60
18
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
61 #if $fs_algorithm_selector.selected_algorithm in ['RFE', 'RFECV', 'DyRFECV']\
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
62 and $fs_algorithm_selector.estimator_selector.selected_module == 'custom_estimator':
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
63 params['fs_algorithm_selector']['estimator_selector']['c_estimator'] =\
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
64 '$fs_algorithm_selector.estimator_selector.c_estimator'
10
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
65 #end if
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
66
18
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
67 #if $fs_algorithm_selector.selected_algorithm in ['RFECV', 'DyRFECV']\
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
68 and $fs_algorithm_selector.options.cv_selector.selected_cv\
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
69 in ['GroupKFold', 'GroupShuffleSplit', 'LeaveOneGroupOut', 'LeavePGroupsOut']:
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
70 params['fs_algorithm_selector']['options']['cv_selector']['groups_selector']['infile_g'] =\
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
71 '$fs_algorithm_selector.options.cv_selector.groups_selector.infile_g'
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
72 #end if
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
73
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
74 ## Read features
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
75 features_has_header = params['input_options']['header1']
20
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
76 #if $input_options.selected_input == 'tabular'
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
77 header = 'infer' if features_has_header else None
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
78 column_option = params['input_options']['column_selector_options_1']['selected_column_selector_option']
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
79 if column_option in ['by_index_number', 'all_but_by_index_number', 'by_header_name', 'all_but_by_header_name']:
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
80 c = params['input_options']['column_selector_options_1']['col1']
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
81 else:
20
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
82 c = None
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
83 X, input_df = read_columns(
34
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
84 '$input_options.infile1',
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
85 c = c,
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
86 c_option = column_option,
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
87 return_df = True,
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
88 sep='\t',
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
89 header=header,
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
90 parse_dates=True,
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
91 )
20
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
92 X = X.astype(float)
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
93 #elif $input_options.selected_input == 'seq_fasta'
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
94 fasta_file = '$input_options.fasta_file'
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
95 pyfaidx = get_module('pyfaidx')
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
96 sequences = pyfaidx.Fasta(fasta_file)
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
97 n_seqs = len(sequences.keys())
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
98 X = np.arange(n_seqs)[:, np.newaxis]
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
99 for param in estimator_params.keys():
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
100 if param.endswith('fasta_path'):
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
101 estimator.set_params(
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
102 **{param: fasta_file})
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
103 else:
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
104 raise ValueError(
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
105 "The selected estimator doesn't support "
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
106 "fasta file input! Please consider using "
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
107 "KerasGBatchClassifier with "
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
108 "FastaDNABatchGenerator/FastaProteinBatchGenerator "
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
109 "or having GenomeOneHotEncoder/ProteinOneHotEncoder "
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
110 "in pipeline!")
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
111 #elif $input_options.selected_input == 'sparse'
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
112 X = mmread('$input_options.infile1')
547fb1cde4cc planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 60f0fbc0eafd7c11bc60fb6c77f2937782efd8a9-dirty
bgruening
parents: 18
diff changeset
113 #end if
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
114
18
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
115 ## Read labels
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
116 header = 'infer' if params['input_options']['header2'] else None
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
117 column_option = params['input_options']['column_selector_options_2']['selected_column_selector_option2']
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
118 if column_option in ['by_index_number', 'all_but_by_index_number', 'by_header_name', 'all_but_by_header_name']:
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
119 c = params['input_options']['column_selector_options_2']['col2']
4
73c12f296b1c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 97c4f22cdcfa6cddeeffc7b102c418a7ff12a888
bgruening
parents: 3
diff changeset
120 else:
73c12f296b1c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 97c4f22cdcfa6cddeeffc7b102c418a7ff12a888
bgruening
parents: 3
diff changeset
121 c = None
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
122 y = read_columns(
34
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
123 '$input_options.infile2',
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
124 c = c,
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
125 c_option = column_option,
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
126 sep='\t',
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
127 header=header,
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
128 parse_dates=True,
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
129 )
18
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
130 y = y.ravel()
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
131
18
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
132 ## Create feature selector
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
133 new_selector = feature_selector(params['fs_algorithm_selector'], X=X, y=y)
10
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
134 if params['fs_algorithm_selector']['selected_algorithm'] != 'SelectFromModel'\
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
135 or params['fs_algorithm_selector']['model_inputter']['input_mode'] != 'prefitted' :
2
5a06c81f044d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 79fe42239dcf077b13f85cbcd6c6e30d7e1e4832
bgruening
parents: 0
diff changeset
136 new_selector.fit(X, y)
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
137
2
5a06c81f044d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 79fe42239dcf077b13f85cbcd6c6e30d7e1e4832
bgruening
parents: 0
diff changeset
138 ## Transform to select features
5a06c81f044d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 79fe42239dcf077b13f85cbcd6c6e30d7e1e4832
bgruening
parents: 0
diff changeset
139 selected_names = None
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
140
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
141 res = new_selector.transform(X)
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
142 if features_has_header:
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
143 selected_names = input_df.columns[new_selector.get_support(indices=True)]
2
5a06c81f044d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 79fe42239dcf077b13f85cbcd6c6e30d7e1e4832
bgruening
parents: 0
diff changeset
144 res = pandas.DataFrame(res, columns = selected_names)
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
145 res.to_csv(path_or_buf='$outfile', sep='\t', index=False)
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
146
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
147 #if $save:
34
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
148 dump_model_to_h5(new_selector, '$outfile_selector')
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
149 #end if
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
150
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
151 ]]>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
152 </configfile>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
153 </configfiles>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
154 <inputs>
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
155 <expand macro="feature_selection_fs" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
156 <param name="save" type="boolean" truevalue="booltrue" falsevalue="boolfalse" checked="false" label="Save the fitted selector?" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
157 <expand macro="sl_mixed_input_plus_sequence" />
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
158 </inputs>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
159 <outputs>
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
160 <data format="tabular" name="outfile" />
34
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
161 <data format="h5mlm" name="outfile_selector" label="${fs_algorithm_selector.selected_algorithm}">
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
162 <filter>save</filter>
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
163 </data>
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
164 </outputs>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
165 <tests>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
166 <test>
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
167 <param name="selected_algorithm" value="SelectFromModel" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
168 <param name="input_mode" value="new" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
169 <param name="selected_module" value="ensemble" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
170 <param name="selected_estimator" value="RandomForestRegressor" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
171 <param name="text_params" value="n_estimators=10, random_state=10" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
172 <param name="infile1" value="regression_train.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
173 <param name="header1" value="false" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
174 <param name="col1" value="1,2,3,4,5" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
175 <param name="infile2" value="regression_train.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
176 <param name="col2" value="6" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
177 <param name="header2" value="false" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
178 <output name="outfile" file="feature_selection_result01" />
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
179 </test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
180 <test>
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
181 <param name="selected_algorithm" value="GenericUnivariateSelect" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
182 <param name="param" value="20" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
183 <param name="infile1" value="regression_X.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
184 <param name="header1" value="True" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
185 <param name="col1" value="1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
186 <param name="infile2" value="regression_y.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
187 <param name="col2" value="1" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
188 <param name="header2" value="True" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
189 <output name="outfile" file="feature_selection_result02" />
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
190 </test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
191 <test>
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
192 <param name="selected_algorithm" value="SelectPercentile" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
193 <param name="infile1" value="regression_X.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
194 <param name="header1" value="True" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
195 <param name="col1" value="1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
196 <param name="infile2" value="regression_y.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
197 <param name="col2" value="1" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
198 <param name="header2" value="True" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
199 <output name="outfile" file="feature_selection_result03" />
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
200 </test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
201 <test>
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
202 <param name="selected_algorithm" value="SelectKBest" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
203 <param name="infile1" value="regression_X.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
204 <param name="header1" value="True" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
205 <param name="col1" value="1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
206 <param name="infile2" value="regression_y.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
207 <param name="col2" value="1" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
208 <param name="header2" value="True" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
209 <output name="outfile" file="feature_selection_result04" />
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
210 </test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
211 <test>
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
212 <param name="selected_algorithm" value="SelectFpr" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
213 <param name="alpha" value="0.05" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
214 <param name="infile1" value="regression_X.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
215 <param name="header1" value="True" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
216 <param name="col1" value="1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
217 <param name="infile2" value="regression_y.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
218 <param name="col2" value="1" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
219 <param name="header2" value="True" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
220 <output name="outfile" file="feature_selection_result05" />
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
221 </test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
222 <test>
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
223 <param name="selected_algorithm" value="SelectFdr" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
224 <param name="alpha" value="0.05" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
225 <param name="infile1" value="regression_X.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
226 <param name="header1" value="True" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
227 <param name="col1" value="1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
228 <param name="infile2" value="regression_y.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
229 <param name="col2" value="1" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
230 <param name="header2" value="True" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
231 <output name="outfile" file="feature_selection_result06" />
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
232 </test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
233 <test>
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
234 <param name="selected_algorithm" value="SelectFwe" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
235 <param name="alpha" value="0.05" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
236 <param name="infile1" value="regression_X.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
237 <param name="header1" value="True" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
238 <param name="col1" value="1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
239 <param name="infile2" value="regression_y.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
240 <param name="col2" value="1" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
241 <param name="header2" value="True" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
242 <output name="outfile" file="feature_selection_result07" />
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
243 </test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
244 <test>
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
245 <param name="selected_algorithm" value="RFE" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
246 <param name="input_mode" value="new" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
247 <param name="selected_module" value="ensemble" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
248 <param name="selected_estimator" value="RandomForestRegressor" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
249 <param name="text_params" value="n_estimators=10, random_state=10" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
250 <param name="infile1" value="regression_train.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
251 <param name="header1" value="false" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
252 <param name="col1" value="1,2,3,4,5" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
253 <param name="infile2" value="regression_train.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
254 <param name="col2" value="6" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
255 <param name="header2" value="false" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
256 <output name="outfile" file="feature_selection_result08" />
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
257 </test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
258 <test>
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
259 <param name="selected_algorithm" value="RFECV" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
260 <param name="input_mode" value="new" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
261 <param name="selected_module" value="ensemble" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
262 <param name="selected_estimator" value="RandomForestRegressor" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
263 <param name="text_params" value="n_estimators=10, random_state=10" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
264 <param name="infile1" value="regression_train.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
265 <param name="header1" value="false" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
266 <param name="col1" value="1,2,3,4,5" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
267 <param name="infile2" value="regression_train.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
268 <param name="col2" value="6" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
269 <param name="header2" value="false" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
270 <output name="outfile" file="feature_selection_result09" />
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
271 </test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
272 <test>
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
273 <param name="selected_algorithm" value="VarianceThreshold" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
274 <param name="threshold" value="0.1" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
275 <param name="infile1" value="regression_X.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
276 <param name="header1" value="True" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
277 <param name="col1" value="1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
278 <param name="infile2" value="regression_y.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
279 <param name="col2" value="1" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
280 <param name="header2" value="True" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
281 <output name="outfile" file="feature_selection_result10" />
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
282 </test>
6
dc574d9778bd planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit cd4a8b019168acd5a513c57a1b1f380622f230f6
bgruening
parents: 5
diff changeset
283 <test>
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
284 <param name="selected_algorithm" value="SelectKBest" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
285 <param name="k" value="3" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
286 <param name="infile1" value="test3.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
287 <param name="header1" value="True" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
288 <param name="selected_column_selector_option" value="all_but_by_header_name" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
289 <param name="col1" value="target" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
290 <param name="infile2" value="test3.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
291 <param name="header2" value="True" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
292 <param name="selected_column_selector_option2" value="by_header_name" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
293 <param name="col2" value="target" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
294 <output name="outfile" file="feature_selection_result11" />
6
dc574d9778bd planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit cd4a8b019168acd5a513c57a1b1f380622f230f6
bgruening
parents: 5
diff changeset
295 </test>
10
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
296 <test>
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
297 <param name="selected_algorithm" value="SelectFromModel" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
298 <param name="input_mode" value="prefitted" />
34
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
299 <param name="fitted_estimator" value="searchCV03" ftype="h5mlm" />
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
300 <param name="infile1" value="regression_X.tabular" ftype="tabular" />
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
301 <param name="header1" value="true" />
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
302 <param name="col1" value="1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17" />
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
303 <param name="infile2" value="regression_y.tabular" ftype="tabular" />
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
304 <param name="col2" value="1" />
34
b9d86fc6359d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 9981e25b00de29ed881b2229a173a8c812ded9bb
bgruening
parents: 28
diff changeset
305 <param name="header2" value="true" />
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
306 <output name="outfile" file="feature_selection_result12" />
10
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
307 </test>
18
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
308 <test>
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
309 <param name="selected_algorithm" value="RFECV" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
310 <param name="input_mode" value="new" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
311 <param name="selected_module" value="ensemble" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
312 <param name="selected_estimator" value="RandomForestRegressor" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
313 <param name="text_params" value="n_estimators=10, random_state=10" />
18
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
314 <section name="groups_selector">
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
315 <param name="infile_groups" value="regression_y.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
316 <param name="header_g" value="true" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
317 <param name="selected_column_selector_option_g" value="by_index_number" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
318 <param name="col_g" value="1" />
18
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
319 </section>
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
320 <param name="selected_cv" value="GroupShuffleSplit" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
321 <param name="random_state" value="0" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
322 <param name="infile1" value="regression_X.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
323 <param name="header1" value="true" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
324 <param name="col1" value="1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
325 <param name="infile2" value="regression_y.tabular" ftype="tabular" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
326 <param name="col2" value="1" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
327 <param name="header2" value="true" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
328 <output name="outfile" file="feature_selection_result13" />
18
15d8ba35c23c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c0a3a186966888e5787335a7628bf0a4382637e7
bgruening
parents: 17
diff changeset
329 </test>
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
330 </tests>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
331 <help>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
332 <![CDATA[
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
333 **What it does**
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
334 This tool selects the most informative features (columns) of a dataset. It offers univariate filter selection methods (e.g. SelectKBest, VarianceThreshold), selection based on a new or pre-fitted estimator (SelectFromModel), and recursive feature elimination (e.g. RFECV). This tool is based on
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
335 the sklearn.feature_selection package.
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
336 For information about the feature selection methods and their parameter settings please refer to `Scikit-learn feature selection`_.
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
337
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
338 .. _`Scikit-learn feature selection`: https://scikit-learn.org/stable/modules/feature_selection.html
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
339 ]]>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
340 </help>
14
93428e8fdab2 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 8cf3d813ec755166ee0bd517b4ecbbd4f84d4df1
bgruening
parents: 13
diff changeset
341 <expand macro="sklearn_citation">
28
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
342 <expand macro="skrebate_citation" />
2ac77e0aec82 "planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
bgruening
parents: 22
diff changeset
343 <expand macro="xgboost_citation" />
14
93428e8fdab2 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 8cf3d813ec755166ee0bd517b4ecbbd4f84d4df1
bgruening
parents: 13
diff changeset
344 </expand>
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
345 </tool>