annotate feature_selection.xml @ 17:cc5b841f040b draft

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
author bgruening
date Sun, 30 Dec 2018 01:41:30 -0500
parents 3232ad8fee41
children 15d8ba35c23c
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
2
5a06c81f044d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 79fe42239dcf077b13f85cbcd6c6e30d7e1e4832
bgruening
parents: 0
diff changeset
1 <tool id="sklearn_feature_selection" name="Feature Selection" version="@VERSION@.1">
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
2 <description>module, including univariate filter selection methods and recursive feature elimination algorithm</description>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
3 <macros>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
4 <import>main_macros.xml</import>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
5 </macros>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
6 <expand macro="python_requirements"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
7 <expand macro="macro_stdio"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
8 <version_command>echo "@VERSION@"</version_command>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
9 <command>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
10 <![CDATA[
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
11 python "$feature_selection_script" '$inputs'
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
12 ]]>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
13 </command>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
14 <configfiles>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
15 <inputs name="inputs" />
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
16 <configfile name="feature_selection_script">
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
17 <![CDATA[
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
18 import json
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
19 import sklearn.feature_selection
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
20
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
21 with open('$__tool_directory__/sk_whitelist.json', 'r') as f:
15
3232ad8fee41 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 2a058459e6daf0486871f93845f00fdb4a4eaca1
bgruening
parents: 14
diff changeset
22 sk_whitelist = json.load(f)
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
23 exec(open('$__tool_directory__/utils.py').read(), globals())
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
24
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
25 warnings.simplefilter('ignore')
13
467550472f7d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit d00173591e4a783a4c1cb2664e4bb192ab5414f7
bgruening
parents: 10
diff changeset
26
467550472f7d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit d00173591e4a783a4c1cb2664e4bb192ab5414f7
bgruening
parents: 10
diff changeset
27 safe_eval = SafeEval()
3
0dc80ab8ec21 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 4ed8c4f6ef9ece81797a398b17a99bbaf49a6978
bgruening
parents: 2
diff changeset
28
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
29 input_json_path = sys.argv[1]
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
30 with open(input_json_path, 'r') as param_handler:
9
7701da597d1d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit f54ff2ba2f8e7542d68966ce5a6b17d7f624ac48
bgruening
parents: 6
diff changeset
31 params = json.load(param_handler)
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
32
10
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
33 # Overwrite selected entries of params with values rendered by Cheetah
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
34 #if $fs_algorithm_selector.selected_algorithm == 'SelectFromModel'\
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
35 and $fs_algorithm_selector.model_inputter.input_mode == 'prefitted':
10
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
36 params['fs_algorithm_selector']['model_inputter']['fitted_estimator'] =\
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
37 '$fs_algorithm_selector.model_inputter.fitted_estimator'
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
38 #end if
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
39
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
40 #if $fs_algorithm_selector.selected_algorithm == 'SelectFromModel'\
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
41 and $fs_algorithm_selector.model_inputter.input_mode == 'new'\
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
42 and $fs_algorithm_selector.model_inputter.estimator_selector.selected_module == 'customer_estimator':
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
43 params['fs_algorithm_selector']['model_inputter']['estimator_selector']['c_estimator'] =\
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
44 '$fs_algorithm_selector.model_inputter.estimator_selector.c_estimator'
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
45 #end if
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
46
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
47 #if $fs_algorithm_selector.selected_algorithm in ['RFE', 'RFECV']\
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
48 and $fs_algorithm_selector.estimator_selector.selected_module == 'customer_estimator':
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
49 params['fs_algorithm_selector']['estimator_selector']['c_estimator'] =\
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
50 '$fs_algorithm_selector.estimator_selector.c_estimator'
10
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
51 #end if
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
52
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
53 # Read features
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
54 features_has_header = params['input_options']['header1']
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
55 input_type = params['input_options']['selected_input']
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
56 if input_type == 'tabular':
2
5a06c81f044d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 79fe42239dcf077b13f85cbcd6c6e30d7e1e4832
bgruening
parents: 0
diff changeset
57 header = 'infer' if features_has_header else None
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
58 column_option = params['input_options']['column_selector_options_1']['selected_column_selector_option']
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
59 if column_option in ['by_index_number', 'all_but_by_index_number', 'by_header_name', 'all_but_by_header_name']:
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
60 c = params['input_options']['column_selector_options_1']['col1']
4
73c12f296b1c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 97c4f22cdcfa6cddeeffc7b102c418a7ff12a888
bgruening
parents: 3
diff changeset
61 else:
73c12f296b1c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 97c4f22cdcfa6cddeeffc7b102c418a7ff12a888
bgruening
parents: 3
diff changeset
62 c = None
2
5a06c81f044d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 79fe42239dcf077b13f85cbcd6c6e30d7e1e4832
bgruening
parents: 0
diff changeset
63 X, input_df = read_columns(
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
64 '$input_options.infile1',
4
73c12f296b1c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 97c4f22cdcfa6cddeeffc7b102c418a7ff12a888
bgruening
parents: 3
diff changeset
65 c = c,
73c12f296b1c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 97c4f22cdcfa6cddeeffc7b102c418a7ff12a888
bgruening
parents: 3
diff changeset
66 c_option = column_option,
2
5a06c81f044d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 79fe42239dcf077b13f85cbcd6c6e30d7e1e4832
bgruening
parents: 0
diff changeset
67 return_df = True,
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
68 sep='\t',
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
69 header=header,
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
70 parse_dates=True
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
71 )
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
72 else:
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
73 X = mmread('$input_options.infile1')
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
74
10
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
75 # Read labels
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
76 header = 'infer' if params['input_options']['header2'] else None
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
77 column_option = params['input_options']['column_selector_options_2']['selected_column_selector_option2']
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
78 if column_option in ['by_index_number', 'all_but_by_index_number', 'by_header_name', 'all_but_by_header_name']:
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
79 c = params['input_options']['column_selector_options_2']['col2']
4
73c12f296b1c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 97c4f22cdcfa6cddeeffc7b102c418a7ff12a888
bgruening
parents: 3
diff changeset
80 else:
73c12f296b1c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 97c4f22cdcfa6cddeeffc7b102c418a7ff12a888
bgruening
parents: 3
diff changeset
81 c = None
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
82 y = read_columns(
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
83 '$input_options.infile2',
4
73c12f296b1c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 97c4f22cdcfa6cddeeffc7b102c418a7ff12a888
bgruening
parents: 3
diff changeset
84 c = c,
73c12f296b1c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 97c4f22cdcfa6cddeeffc7b102c418a7ff12a888
bgruening
parents: 3
diff changeset
85 c_option = column_option,
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
86 sep='\t',
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
87 header=header,
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
88 parse_dates=True
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
89 )
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
90 y=y.ravel()
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
91
10
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
92 # Create feature selector
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
93 new_selector = feature_selector(params['fs_algorithm_selector'])
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
94 if params['fs_algorithm_selector']['selected_algorithm'] != 'SelectFromModel'\
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
95 or params['fs_algorithm_selector']['model_inputter']['input_mode'] != 'prefitted' :
2
5a06c81f044d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 79fe42239dcf077b13f85cbcd6c6e30d7e1e4832
bgruening
parents: 0
diff changeset
96 new_selector.fit(X, y)
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
97
2
5a06c81f044d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 79fe42239dcf077b13f85cbcd6c6e30d7e1e4832
bgruening
parents: 0
diff changeset
98 ## Transform to select features
5a06c81f044d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 79fe42239dcf077b13f85cbcd6c6e30d7e1e4832
bgruening
parents: 0
diff changeset
99 selected_names = None
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
100
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
101 res = new_selector.transform(X)
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
102 if features_has_header:
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
103 selected_names = input_df.columns[new_selector.get_support(indices=True)]
2
5a06c81f044d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 79fe42239dcf077b13f85cbcd6c6e30d7e1e4832
bgruening
parents: 0
diff changeset
104 res = pandas.DataFrame(res, columns = selected_names)
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
105 res.to_csv(path_or_buf='$outfile', sep='\t', index=False)
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
106
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
107 #if $save:
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
108 with open('$outfile_selector', 'wb') as output_handler:
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
109 pickle.dump(new_selector, output_handler, pickle.HIGHEST_PROTOCOL)
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
110 #end if
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
111
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
112 ]]>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
113 </configfile>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
114 </configfiles>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
115 <inputs>
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
116 <expand macro="feature_selection_fs"/>
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
117 <param name="save" type="boolean" truevalue="booltrue" falsevalue="boolfalse" checked="false" label="Save the fitted selector?"/>
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
118 <expand macro="sl_mixed_input"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
119 </inputs>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
120 <outputs>
17
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
121 <data format="tabular" name="outfile" />
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
122 <data format="zip" name="outfile_selector" label="${fs_algorithm_selector.selected_algorithm}">
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
123 <filter>save</filter>
cc5b841f040b planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 57f4407e278a615f47a377a3328782b1d8e0b54d
bgruening
parents: 15
diff changeset
124 </data>
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
125 </outputs>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
126 <tests>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
127 <test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
128 <param name="selected_algorithm" value="SelectFromModel"/>
10
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
129 <param name="input_mode" value="new"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
130 <param name="selected_module" value="ensemble"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
131 <param name="selected_estimator" value="RandomForestRegressor"/>
13
467550472f7d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit d00173591e4a783a4c1cb2664e4bb192ab5414f7
bgruening
parents: 10
diff changeset
132 <param name="text_params" value="n_estimators=10, random_state=10"/>
10
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
133 <param name="infile1" value="regression_train.tabular" ftype="tabular"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
134 <param name="header1" value="false"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
135 <param name="col1" value="1,2,3,4,5"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
136 <param name="infile2" value="regression_train.tabular" ftype="tabular"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
137 <param name="col2" value="6"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
138 <param name="header2" value="false"/>
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
139 <output name="outfile" file="feature_selection_result01"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
140 </test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
141 <test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
142 <param name="selected_algorithm" value="GenericUnivariateSelect"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
143 <param name="param" value="20"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
144 <param name="infile1" value="regression_X.tabular" ftype="tabular"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
145 <param name="header1" value="True"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
146 <param name="col1" value="1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
147 <param name="infile2" value="regression_y.tabular" ftype="tabular"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
148 <param name="col2" value="1"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
149 <param name="header2" value="True"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
150 <output name="outfile" file="feature_selection_result02"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
151 </test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
152 <test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
153 <param name="selected_algorithm" value="SelectPercentile"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
154 <param name="infile1" value="regression_X.tabular" ftype="tabular"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
155 <param name="header1" value="True"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
156 <param name="col1" value="1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
157 <param name="infile2" value="regression_y.tabular" ftype="tabular"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
158 <param name="col2" value="1"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
159 <param name="header2" value="True"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
160 <output name="outfile" file="feature_selection_result03"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
161 </test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
162 <test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
163 <param name="selected_algorithm" value="SelectKBest"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
164 <param name="infile1" value="regression_X.tabular" ftype="tabular"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
165 <param name="header1" value="True"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
166 <param name="col1" value="1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
167 <param name="infile2" value="regression_y.tabular" ftype="tabular"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
168 <param name="col2" value="1"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
169 <param name="header2" value="True"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
170 <output name="outfile" file="feature_selection_result04"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
171 </test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
172 <test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
173 <param name="selected_algorithm" value="SelectFpr"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
174 <param name="alpha" value="0.05"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
175 <param name="infile1" value="regression_X.tabular" ftype="tabular"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
176 <param name="header1" value="True"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
177 <param name="col1" value="1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
178 <param name="infile2" value="regression_y.tabular" ftype="tabular"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
179 <param name="col2" value="1"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
180 <param name="header2" value="True"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
181 <output name="outfile" file="feature_selection_result05"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
182 </test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
183 <test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
184 <param name="selected_algorithm" value="SelectFdr"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
185 <param name="alpha" value="0.05"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
186 <param name="infile1" value="regression_X.tabular" ftype="tabular"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
187 <param name="header1" value="True"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
188 <param name="col1" value="1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
189 <param name="infile2" value="regression_y.tabular" ftype="tabular"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
190 <param name="col2" value="1"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
191 <param name="header2" value="True"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
192 <output name="outfile" file="feature_selection_result06"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
193 </test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
194 <test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
195 <param name="selected_algorithm" value="SelectFwe"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
196 <param name="alpha" value="0.05"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
197 <param name="infile1" value="regression_X.tabular" ftype="tabular"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
198 <param name="header1" value="True"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
199 <param name="col1" value="1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
200 <param name="infile2" value="regression_y.tabular" ftype="tabular"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
201 <param name="col2" value="1"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
202 <param name="header2" value="True"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
203 <output name="outfile" file="feature_selection_result07"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
204 </test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
205 <test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
206 <param name="selected_algorithm" value="RFE"/>
10
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
207 <param name="input_mode" value="new"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
208 <param name="selected_module" value="ensemble"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
209 <param name="selected_estimator" value="RandomForestRegressor"/>
13
467550472f7d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit d00173591e4a783a4c1cb2664e4bb192ab5414f7
bgruening
parents: 10
diff changeset
210 <param name="text_params" value="n_estimators=10, random_state=10"/>
10
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
211 <param name="infile1" value="regression_train.tabular" ftype="tabular"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
212 <param name="header1" value="false"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
213 <param name="col1" value="1,2,3,4,5"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
214 <param name="infile2" value="regression_train.tabular" ftype="tabular"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
215 <param name="col2" value="6"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
216 <param name="header2" value="false"/>
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
217 <output name="outfile" file="feature_selection_result08"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
218 </test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
219 <test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
220 <param name="selected_algorithm" value="RFECV"/>
10
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
221 <param name="input_mode" value="new"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
222 <param name="selected_module" value="ensemble"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
223 <param name="selected_estimator" value="RandomForestRegressor"/>
13
467550472f7d planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit d00173591e4a783a4c1cb2664e4bb192ab5414f7
bgruening
parents: 10
diff changeset
224 <param name="text_params" value="n_estimators=10, random_state=10"/>
10
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
225 <param name="infile1" value="regression_train.tabular" ftype="tabular"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
226 <param name="header1" value="false"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
227 <param name="col1" value="1,2,3,4,5"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
228 <param name="infile2" value="regression_train.tabular" ftype="tabular"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
229 <param name="col2" value="6"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
230 <param name="header2" value="false"/>
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
231 <output name="outfile" file="feature_selection_result09"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
232 </test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
233 <test>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
234 <param name="selected_algorithm" value="VarianceThreshold"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
235 <param name="threshold" value="0.1"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
236 <param name="infile1" value="regression_X.tabular" ftype="tabular"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
237 <param name="header1" value="True"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
238 <param name="col1" value="1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
239 <param name="infile2" value="regression_y.tabular" ftype="tabular"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
240 <param name="col2" value="1"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
241 <param name="header2" value="True"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
242 <output name="outfile" file="feature_selection_result10"/>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
243 </test>
6
dc574d9778bd planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit cd4a8b019168acd5a513c57a1b1f380622f230f6
bgruening
parents: 5
diff changeset
244 <test>
dc574d9778bd planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit cd4a8b019168acd5a513c57a1b1f380622f230f6
bgruening
parents: 5
diff changeset
245 <param name="selected_algorithm" value="SelectKBest"/>
dc574d9778bd planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit cd4a8b019168acd5a513c57a1b1f380622f230f6
bgruening
parents: 5
diff changeset
246 <param name="k" value="3"/>
dc574d9778bd planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit cd4a8b019168acd5a513c57a1b1f380622f230f6
bgruening
parents: 5
diff changeset
247 <param name="infile1" value="test3.tabular" ftype="tabular"/>
dc574d9778bd planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit cd4a8b019168acd5a513c57a1b1f380622f230f6
bgruening
parents: 5
diff changeset
248 <param name="header1" value="True"/>
dc574d9778bd planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit cd4a8b019168acd5a513c57a1b1f380622f230f6
bgruening
parents: 5
diff changeset
249 <param name="selected_column_selector_option" value="all_but_by_header_name"/>
dc574d9778bd planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit cd4a8b019168acd5a513c57a1b1f380622f230f6
bgruening
parents: 5
diff changeset
250 <param name="col1" value="target"/>
dc574d9778bd planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit cd4a8b019168acd5a513c57a1b1f380622f230f6
bgruening
parents: 5
diff changeset
251 <param name="infile2" value="test3.tabular" ftype="tabular"/>
dc574d9778bd planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit cd4a8b019168acd5a513c57a1b1f380622f230f6
bgruening
parents: 5
diff changeset
252 <param name="header2" value="True"/>
dc574d9778bd planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit cd4a8b019168acd5a513c57a1b1f380622f230f6
bgruening
parents: 5
diff changeset
253 <param name="selected_column_selector_option2" value="by_header_name"/>
dc574d9778bd planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit cd4a8b019168acd5a513c57a1b1f380622f230f6
bgruening
parents: 5
diff changeset
254 <param name="col2" value="target"/>
dc574d9778bd planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit cd4a8b019168acd5a513c57a1b1f380622f230f6
bgruening
parents: 5
diff changeset
255 <output name="outfile" file="feature_selection_result11"/>
dc574d9778bd planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit cd4a8b019168acd5a513c57a1b1f380622f230f6
bgruening
parents: 5
diff changeset
256 </test>
10
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
257 <test>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
258 <param name="selected_algorithm" value="SelectFromModel"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
259 <param name="input_mode" value="prefitted"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
260 <param name="fitted_estimator" value="rfr_model01" ftype="zip"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
261 <param name="infile1" value="regression_train.tabular" ftype="tabular"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
262 <param name="header1" value="false"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
263 <param name="col1" value="1,2,3,4,5"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
264 <param name="infile2" value="regression_train.tabular" ftype="tabular"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
265 <param name="col2" value="1"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
266 <param name="header2" value="false"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
267 <output name="outfile" file="feature_selection_result12"/>
d00e89558c18 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 76583c1fcd9d06a4679cc46ffaee44117b9e22cd
bgruening
parents: 9
diff changeset
268 </test>
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
269 </tests>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
270 <help>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
271 <![CDATA[
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
272 **What it does**
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
273 This tool provides feature selection algorithms, including univariate filter selection methods (GenericUnivariateSelect, SelectPercentile, SelectKBest, SelectFpr, SelectFdr, SelectFwe), variance thresholding (VarianceThreshold), model-based selection (SelectFromModel), and recursive feature elimination (RFE, RFECV). This tool is based on
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
274 the sklearn.feature_selection package.
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
275 For information about the feature selection methods and their parameter settings please refer to `Scikit-learn feature selection`_.
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
276
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
277 .. _`Scikit-learn feature selection`: http://scikit-learn.org/stable/modules/feature_selection.html
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
278 ]]>
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
279 </help>
14
93428e8fdab2 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 8cf3d813ec755166ee0bd517b4ecbbd4f84d4df1
bgruening
parents: 13
diff changeset
280 <expand macro="sklearn_citation">
93428e8fdab2 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 8cf3d813ec755166ee0bd517b4ecbbd4f84d4df1
bgruening
parents: 13
diff changeset
281 <expand macro="skrebate_citation"/>
93428e8fdab2 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 8cf3d813ec755166ee0bd517b4ecbbd4f84d4df1
bgruening
parents: 13
diff changeset
282 <expand macro="xgboost_citation"/>
93428e8fdab2 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 8cf3d813ec755166ee0bd517b4ecbbd4f84d4df1
bgruening
parents: 13
diff changeset
283 </expand>
0
2bbacfaadb5c planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 7a31960686122d7e53054fef4996525f04ebd254
bgruening
parents:
diff changeset
284 </tool>