Mercurial > repos > bgruening > sklearn_numeric_clustering
comparison numeric_clustering.xml @ 40:006e27f0a7ef draft
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
| author | bgruening |
|---|---|
| date | Tue, 13 Apr 2021 20:52:41 +0000 |
| parents | 80bb86a40de6 |
| children | 0e4066f5751d |
comparison
equal
deleted
inserted
replaced
| 39:14346b365787 | 40:006e27f0a7ef |
|---|---|
| 1 <tool id="sklearn_numeric_clustering" name="Numeric Clustering" version="@VERSION@"> | 1 <tool id="sklearn_numeric_clustering" name="Numeric Clustering" version="@VERSION@" profile="20.05"> |
| 2 <description></description> | 2 <description></description> |
| 3 <macros> | 3 <macros> |
| 4 <import>main_macros.xml</import> | 4 <import>main_macros.xml</import> |
| 5 </macros> | 5 </macros> |
| 6 <expand macro="python_requirements"/> | 6 <expand macro="python_requirements" /> |
| 7 <expand macro="macro_stdio"/> | 7 <expand macro="macro_stdio" /> |
| 8 <version_command>echo "@VERSION@"</version_command> | 8 <version_command>echo "@VERSION@"</version_command> |
| 9 <command><![CDATA[ | 9 <command><![CDATA[ |
| 10 python "$cluster_script" '$inputs' | 10 python "$cluster_script" '$inputs' |
| 11 ]]> | 11 ]]> |
| 12 </command> | 12 </command> |
| 13 <configfiles> | 13 <configfiles> |
| 14 <inputs name="inputs"/> | 14 <inputs name="inputs" /> |
| 15 <configfile name="cluster_script"> | 15 <configfile name="cluster_script"> |
| 16 <![CDATA[ | 16 <![CDATA[ |
| 17 import sys | 17 import sys |
| 18 import json | 18 import json |
| 19 import numpy as np | 19 import numpy as np |
| 20 import sklearn.cluster | 20 import sklearn.cluster |
| 21 import pandas | 21 import pandas |
| 87 <param name="selected_input_type" type="select" label="Select the format of input data"> | 87 <param name="selected_input_type" type="select" label="Select the format of input data"> |
| 88 <option value="tabular" selected="true">Tabular Format (tabular, txt)</option> | 88 <option value="tabular" selected="true">Tabular Format (tabular, txt)</option> |
| 89 <option value="sparse">Sparse Vector Representation (mtx)</option> | 89 <option value="sparse">Sparse Vector Representation (mtx)</option> |
| 90 </param> | 90 </param> |
| 91 <when value="sparse"> | 91 <when value="sparse"> |
| 92 <param name="infile" type="data" format="txt" label="Sparse vector (scipy.sparse.csr_matrix) file:" help="The following clustering algorithms support sparse matrix operations: ''Birch'', ''DBSCAN'', ''KMeans'', ''Mini BatchK Means'', and ''Spectral Clustering''. If your data is in tabular format, please use other clustering algorithms."/> | 92 <param name="infile" type="data" format="txt" label="Sparse vector (scipy.sparse.csr_matrix) file:" help="The following clustering algorithms support sparse matrix operations: ''Birch'', ''DBSCAN'', ''KMeans'', ''Mini BatchK Means'', and ''Spectral Clustering''. If your data is in tabular format, please use other clustering algorithms." /> |
| 93 <expand macro="clustering_algorithms_options"/> | 93 <expand macro="clustering_algorithms_options" /> |
| 94 </when> | 94 </when> |
| 95 <when value="tabular"> | 95 <when value="tabular"> |
| 96 <param name="infile" type="data" format="tabular" label="Data file with numeric values"/> | 96 <param name="infile" type="data" format="tabular" label="Data file with numeric values" /> |
| 97 <param name="header" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolfalse" checked="True" label="Does the dataset contain header:" /> | 97 <param name="header" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolfalse" checked="True" label="Does the dataset contain header:" /> |
| 98 <conditional name="column_selector_options"> | 98 <conditional name="column_selector_options"> |
| 99 <expand macro="samples_column_selector_options" col_name="col" multiple="true" infile="infile"/> | 99 <expand macro="samples_column_selector_options" col_name="col" multiple="true" infile="infile" /> |
| 100 </conditional> | 100 </conditional> |
| 101 <!--expand macro="clustering_algorithms_options"--> | 101 <!--expand macro="clustering_algorithms_options"--> |
| 102 <conditional name="algorithm_options"> | 102 <conditional name="algorithm_options"> |
| 103 <param name="selected_algorithm" type="select" label="Clustering Algorithm"> | 103 <param name="selected_algorithm" type="select" label="Clustering Algorithm"> |
| 104 <option value="AgglomerativeClustering">Hierarchical Agglomerative Clustering</option> | 104 <option value="AgglomerativeClustering">Hierarchical Agglomerative Clustering</option> |
| 109 <option value="KMeans">KMeans</option> | 109 <option value="KMeans">KMeans</option> |
| 110 <option value="DBSCAN">DBSCAN</option> | 110 <option value="DBSCAN">DBSCAN</option> |
| 111 <option value="Birch">Birch</option> | 111 <option value="Birch">Birch</option> |
| 112 </param> | 112 </param> |
| 113 <when value="KMeans"> | 113 <when value="KMeans"> |
| 114 <expand macro="kmeans_advanced_options"/> | 114 <expand macro="kmeans_advanced_options" /> |
| 115 </when> | 115 </when> |
| 116 <when value="DBSCAN"> | 116 <when value="DBSCAN"> |
| 117 <expand macro="dbscan_advanced_options"/> | 117 <expand macro="dbscan_advanced_options" /> |
| 118 </when> | 118 </when> |
| 119 <when value="Birch"> | 119 <when value="Birch"> |
| 120 <expand macro="birch_advanced_options"/> | 120 <expand macro="birch_advanced_options" /> |
| 121 </when> | 121 </when> |
| 122 <when value="SpectralClustering"> | 122 <when value="SpectralClustering"> |
| 123 <expand macro="spectral_clustering_advanced_options"/> | 123 <expand macro="spectral_clustering_advanced_options" /> |
| 124 </when> | 124 </when> |
| 125 <when value="MiniBatchKMeans"> | 125 <when value="MiniBatchKMeans"> |
| 126 <expand macro="minibatch_kmeans_advanced_options"/> | 126 <expand macro="minibatch_kmeans_advanced_options" /> |
| 127 </when> | 127 </when> |
| 128 <when value="AffinityPropagation"> | 128 <when value="AffinityPropagation"> |
| 129 <section name="options" title="Advanced Options" expanded="False"> | 129 <section name="options" title="Advanced Options" expanded="False"> |
| 130 <param argument="damping" type="float" optional="true" value="0.5" label="Damping factor" help="Damping factor between 0.5 and 1."/> | 130 <param argument="damping" type="float" optional="true" value="0.5" label="Damping factor" help="Damping factor between 0.5 and 1." /> |
| 131 <expand macro="max_iter" default_value="200"/> | 131 <expand macro="max_iter" default_value="200" /> |
| 132 <param argument="convergence_iter" type="integer" optional="true" value="15" label="Number of iterations at each convergence step" help="Number of iterations with no change in the number of estimated clusters that stops the convergence."/> | 132 <param argument="convergence_iter" type="integer" optional="true" value="15" label="Number of iterations at each convergence step" help="Number of iterations with no change in the number of estimated clusters that stops the convergence." /> |
| 133 <param argument="copy" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolflase" checked="true" label="Copy" help="If False, the affinity matrix is modified inplace by the algorithm, for memory efficiency."/> | 133 <param argument="copy" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolflase" checked="true" label="Copy" help="If False, the affinity matrix is modified inplace by the algorithm, for memory efficiency." /> |
| 134 <!--param argument="preference"/--> | 134 <!--param argument="preference"/--> |
| 135 <param argument="affinity" type="select" label="Affinity" help="Affinity to use; euclidean uses the negative squared euclidean distance between points."> | 135 <param argument="affinity" type="select" label="Affinity" help="Affinity to use; euclidean uses the negative squared euclidean distance between points."> |
| 136 <option value="euclidean">Euclidean</option> | 136 <option value="euclidean">Euclidean</option> |
| 137 <option value="precomputed">precomputed</option> | 137 <option value="precomputed">precomputed</option> |
| 138 </param> | 138 </param> |
| 139 </section> | 139 </section> |
| 140 </when> | 140 </when> |
| 141 <when value="MeanShift"> | 141 <when value="MeanShift"> |
| 142 <section name="options" title="Advanced Options" expanded="False"> | 142 <section name="options" title="Advanced Options" expanded="False"> |
| 143 <param argument="bandwidth" type="float" optional="true" value="" label="Kernel bandwidth" help="Bandwidth used in the RBF kernel. If not given, it will be computed using a heuristic based on the median of all pairwise distances."/> | 143 <param argument="bandwidth" type="float" optional="true" value="" label="Kernel bandwidth" help="Bandwidth used in the RBF kernel. If not given, it will be computed using a heuristic based on the median of all pairwise distances." /> |
| 144 <!--param argument="seeds"/--> | 144 <!--param argument="seeds"/--> |
| 145 <param argument="bin_seeding" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolflase" checked="true" label="Discretize initial kernel locations" help="If true, initial kernel locations are the bins grid whose coarseness corresponds to the bandwidth, speeding up the algorithm."/> | 145 <param argument="bin_seeding" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolflase" checked="true" label="Discretize initial kernel locations" help="If true, initial kernel locations are the bins grid whose coarseness corresponds to the bandwidth, speeding up the algorithm." /> |
| 146 <param argument="min_bin_freq" type="integer" optional="true" value="1" label="Minimum number of seeds per bin" help="To speed up the algorithm, accept only those bins with at least min_bin_freq points as seeds."/> | 146 <param argument="min_bin_freq" type="integer" optional="true" value="1" label="Minimum number of seeds per bin" help="To speed up the algorithm, accept only those bins with at least min_bin_freq points as seeds." /> |
| 147 <param argument="cluster_all" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolflase" checked="true" label="Cluster all" help="If true, all points (including orphans) are clustered. If false, orphans are given cluster label -1."/> | 147 <param argument="cluster_all" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolflase" checked="true" label="Cluster all" help="If true, all points (including orphans) are clustered. If false, orphans are given cluster label -1." /> |
| 148 </section> | 148 </section> |
| 149 </when> | 149 </when> |
| 150 <when value="AgglomerativeClustering"> | 150 <when value="AgglomerativeClustering"> |
| 151 <section name="options" title="Advanced Options" expanded="False"> | 151 <section name="options" title="Advanced Options" expanded="False"> |
| 152 <expand macro="n_clusters" default_value="2" /> | 152 <expand macro="n_clusters" default_value="2" /> |
| 174 </conditional> | 174 </conditional> |
| 175 </when> | 175 </when> |
| 176 </conditional> | 176 </conditional> |
| 177 </inputs> | 177 </inputs> |
| 178 <outputs> | 178 <outputs> |
| 179 <data format="tabular" name="outfile"/> | 179 <data format="tabular" name="outfile" /> |
| 180 </outputs> | 180 </outputs> |
| 181 <tests> | 181 <tests> |
| 182 <test> | 182 <test> |
| 183 <param name="infile" value="numeric_values.tabular" ftype="tabular"/> | 183 <param name="infile" value="numeric_values.tabular" ftype="tabular" /> |
| 184 <param name="selected_input_type" value="tabular"/> | 184 <param name="selected_input_type" value="tabular" /> |
| 185 <param name="selected_algorithm" value="KMeans"/> | 185 <param name="selected_algorithm" value="KMeans" /> |
| 186 <param name="col" value="2,3,4" /> | 186 <param name="col" value="2,3,4" /> |
| 187 <param name="n_clusters" value="4" /> | 187 <param name="n_clusters" value="4" /> |
| 188 <param name="init" value="k-means++" /> | 188 <param name="init" value="k-means++" /> |
| 189 <param name="random_state" value="100"/> | 189 <param name="random_state" value="100" /> |
| 190 <output name="outfile" file="cluster_result01.txt"/> | 190 <output name="outfile" file="cluster_result01.txt" /> |
| 191 </test> | 191 </test> |
| 192 <test> | 192 <test> |
| 193 <param name="infile" value="numeric_values.tabular" ftype="tabular"/> | 193 <param name="infile" value="numeric_values.tabular" ftype="tabular" /> |
| 194 <param name="selected_algorithm" value="KMeans"/> | 194 <param name="selected_algorithm" value="KMeans" /> |
| 195 <param name="selected_input_type" value="tabular"/> | 195 <param name="selected_input_type" value="tabular" /> |
| 196 <param name="col" value="2,3,4" /> | 196 <param name="col" value="2,3,4" /> |
| 197 <param name="n_clusters" value="4" /> | 197 <param name="n_clusters" value="4" /> |
| 198 <param name="init" value="random" /> | 198 <param name="init" value="random" /> |
| 199 <param name="random_state" value="100"/> | 199 <param name="random_state" value="100" /> |
| 200 <output name="outfile" file="cluster_result02.txt"/> | 200 <output name="outfile" file="cluster_result02.txt" /> |
| 201 </test> | 201 </test> |
| 202 <test> | 202 <test> |
| 203 <param name="infile" value="numeric_values.tabular" ftype="tabular"/> | 203 <param name="infile" value="numeric_values.tabular" ftype="tabular" /> |
| 204 <param name="selected_algorithm" value="DBSCAN"/> | 204 <param name="selected_algorithm" value="DBSCAN" /> |
| 205 <param name="selected_input_type" value="tabular"/> | 205 <param name="selected_input_type" value="tabular" /> |
| 206 <param name="col" value="2,3,4" /> | 206 <param name="col" value="2,3,4" /> |
| 207 <param name="algorithm" value="kd_tree"/> | 207 <param name="algorithm" value="kd_tree" /> |
| 208 <param name="leaf_size" value="10"/> | 208 <param name="leaf_size" value="10" /> |
| 209 <param name="eps" value="1.0"/> | 209 <param name="eps" value="1.0" /> |
| 210 <output name="outfile" file="cluster_result03.txt"/> | 210 <output name="outfile" file="cluster_result03.txt" /> |
| 211 </test> | 211 </test> |
| 212 <test> | 212 <test> |
| 213 <param name="infile" value="numeric_values.tabular" ftype="tabular"/> | 213 <param name="infile" value="numeric_values.tabular" ftype="tabular" /> |
| 214 <param name="selected_algorithm" value="Birch"/> | 214 <param name="selected_algorithm" value="Birch" /> |
| 215 <param name="selected_input_type" value="tabular"/> | 215 <param name="selected_input_type" value="tabular" /> |
| 216 <param name="col" value="2,3,4" /> | 216 <param name="col" value="2,3,4" /> |
| 217 <param name="n_clusters" value="4"/> | 217 <param name="n_clusters" value="4" /> |
| 218 <param name="threshold" value="0.008"/> | 218 <param name="threshold" value="0.008" /> |
| 219 <output name="outfile" file="cluster_result04.txt"/> | 219 <output name="outfile" file="cluster_result04.txt" /> |
| 220 </test> | 220 </test> |
| 221 <test> | 221 <test> |
| 222 <param name="infile" value="numeric_values.tabular" ftype="tabular"/> | 222 <param name="infile" value="numeric_values.tabular" ftype="tabular" /> |
| 223 <param name="selected_algorithm" value="Birch"/> | 223 <param name="selected_algorithm" value="Birch" /> |
| 224 <param name="selected_input_type" value="tabular"/> | 224 <param name="selected_input_type" value="tabular" /> |
| 225 <param name="col" value="2,3,4" /> | 225 <param name="col" value="2,3,4" /> |
| 226 <param name="branching_factor" value="20"/> | 226 <param name="branching_factor" value="20" /> |
| 227 <output name="outfile" file="cluster_result05.txt"/> | 227 <output name="outfile" file="cluster_result05.txt" /> |
| 228 </test> | 228 </test> |
| 229 <test> | 229 <test> |
| 230 <param name="infile" value="numeric_values.tabular" ftype="tabular"/> | 230 <param name="infile" value="numeric_values.tabular" ftype="tabular" /> |
| 231 <param name="selected_algorithm" value="AffinityPropagation"/> | 231 <param name="selected_algorithm" value="AffinityPropagation" /> |
| 232 <param name="selected_input_type" value="tabular"/> | 232 <param name="selected_input_type" value="tabular" /> |
| 233 <param name="col" value="2,3,4" /> | 233 <param name="col" value="2,3,4" /> |
| 234 <param name="affinity" value="euclidean"/> | 234 <param name="affinity" value="euclidean" /> |
| 235 <param name="copy" value="false"/> | 235 <param name="copy" value="false" /> |
| 236 <output name="outfile" file="cluster_result06.txt"/> | 236 <output name="outfile" file="cluster_result06.txt" /> |
| 237 </test> | 237 </test> |
| 238 <test> | 238 <test> |
| 239 <param name="infile" value="numeric_values.tabular" ftype="tabular"/> | 239 <param name="infile" value="numeric_values.tabular" ftype="tabular" /> |
| 240 <param name="selected_algorithm" value="AffinityPropagation"/> | 240 <param name="selected_algorithm" value="AffinityPropagation" /> |
| 241 <param name="selected_input_type" value="tabular"/> | 241 <param name="selected_input_type" value="tabular" /> |
| 242 <param name="col" value="2,3,4" /> | 242 <param name="col" value="2,3,4" /> |
| 243 <param name="damping" value="0.8"/> | 243 <param name="damping" value="0.8" /> |
| 244 <output name="outfile" file="cluster_result07.txt"/> | 244 <output name="outfile" file="cluster_result07.txt" /> |
| 245 </test> | 245 </test> |
| 246 <test> | 246 <test> |
| 247 <param name="infile" value="numeric_values.tabular" ftype="tabular"/> | 247 <param name="infile" value="numeric_values.tabular" ftype="tabular" /> |
| 248 <param name="selected_algorithm" value="MeanShift"/> | 248 <param name="selected_algorithm" value="MeanShift" /> |
| 249 <param name="selected_input_type" value="tabular"/> | 249 <param name="selected_input_type" value="tabular" /> |
| 250 <param name="col" value="2,3,4" /> | 250 <param name="col" value="2,3,4" /> |
| 251 <param name="min_bin_freq" value="3"/> | 251 <param name="min_bin_freq" value="3" /> |
| 252 <output name="outfile" file="cluster_result08.txt"/> | 252 <output name="outfile" file="cluster_result08.txt" /> |
| 253 </test> | 253 </test> |
| 254 <test> | 254 <test> |
| 255 <param name="infile" value="numeric_values.tabular" ftype="tabular"/> | 255 <param name="infile" value="numeric_values.tabular" ftype="tabular" /> |
| 256 <param name="selected_algorithm" value="MeanShift"/> | 256 <param name="selected_algorithm" value="MeanShift" /> |
| 257 <param name="selected_input_type" value="tabular"/> | 257 <param name="selected_input_type" value="tabular" /> |
| 258 <param name="col" value="2,3,4" /> | 258 <param name="col" value="2,3,4" /> |
| 259 <param name="cluster_all" value="False"/> | 259 <param name="cluster_all" value="False" /> |
| 260 <output name="outfile" file="cluster_result09.txt"/> | 260 <output name="outfile" file="cluster_result09.txt" /> |
| 261 </test> | 261 </test> |
| 262 <test> | 262 <test> |
| 263 <param name="infile" value="numeric_values.tabular" ftype="tabular"/> | 263 <param name="infile" value="numeric_values.tabular" ftype="tabular" /> |
| 264 <param name="selected_algorithm" value="AgglomerativeClustering"/> | 264 <param name="selected_algorithm" value="AgglomerativeClustering" /> |
| 265 <param name="selected_input_type" value="tabular"/> | 265 <param name="selected_input_type" value="tabular" /> |
| 266 <param name="col" value="2,3,4" /> | 266 <param name="col" value="2,3,4" /> |
| 267 <param name="affinity" value="euclidean"/> | 267 <param name="affinity" value="euclidean" /> |
| 268 <param name="linkage" value="average"/> | 268 <param name="linkage" value="average" /> |
| 269 <param name="n_clusters" value="4"/> | 269 <param name="n_clusters" value="4" /> |
| 270 <output name="outfile" file="cluster_result10.txt"/> | 270 <output name="outfile" file="cluster_result10.txt" /> |
| 271 </test> | 271 </test> |
| 272 <test> | 272 <test> |
| 273 <param name="infile" value="numeric_values.tabular" ftype="tabular"/> | 273 <param name="infile" value="numeric_values.tabular" ftype="tabular" /> |
| 274 <param name="selected_algorithm" value="AgglomerativeClustering"/> | 274 <param name="selected_algorithm" value="AgglomerativeClustering" /> |
| 275 <param name="selected_input_type" value="tabular"/> | 275 <param name="selected_input_type" value="tabular" /> |
| 276 <param name="col" value="2,3,4" /> | 276 <param name="col" value="2,3,4" /> |
| 277 <param name="linkage" value="complete"/> | 277 <param name="linkage" value="complete" /> |
| 278 <param name="n_clusters" value="4"/> | 278 <param name="n_clusters" value="4" /> |
| 279 <output name="outfile" file="cluster_result11.txt"/> | 279 <output name="outfile" file="cluster_result11.txt" /> |
| 280 </test> | 280 </test> |
| 281 <test> | 281 <test> |
| 282 <param name="infile" value="numeric_values.tabular" ftype="tabular"/> | 282 <param name="infile" value="numeric_values.tabular" ftype="tabular" /> |
| 283 <param name="selected_algorithm" value="SpectralClustering"/> | 283 <param name="selected_algorithm" value="SpectralClustering" /> |
| 284 <param name="selected_input_type" value="tabular"/> | 284 <param name="selected_input_type" value="tabular" /> |
| 285 <param name="col" value="2,3,4" /> | 285 <param name="col" value="2,3,4" /> |
| 286 <param name="eigen_solver" value="arpack"/> | 286 <param name="eigen_solver" value="arpack" /> |
| 287 <param name="n_neighbors" value="12"/> | 287 <param name="n_neighbors" value="12" /> |
| 288 <param name="n_clusters" value="4"/> | 288 <param name="n_clusters" value="4" /> |
| 289 <param name="assign_labels" value="discretize"/> | 289 <param name="assign_labels" value="discretize" /> |
| 290 <param name="random_state" value="100"/> | 290 <param name="random_state" value="100" /> |
| 291 <output name="outfile" file="cluster_result12.txt" compare="sim_size" /> | 291 <output name="outfile" file="cluster_result12.txt" compare="sim_size" /> |
| 292 </test> | 292 </test> |
| 293 <test> | 293 <test> |
| 294 <param name="infile" value="numeric_values.tabular" ftype="tabular"/> | 294 <param name="infile" value="numeric_values.tabular" ftype="tabular" /> |
| 295 <param name="selected_algorithm" value="SpectralClustering"/> | 295 <param name="selected_algorithm" value="SpectralClustering" /> |
| 296 <param name="selected_input_type" value="tabular"/> | 296 <param name="selected_input_type" value="tabular" /> |
| 297 <param name="col" value="2,3,4" /> | 297 <param name="col" value="2,3,4" /> |
| 298 <param name="assign_labels" value="discretize"/> | 298 <param name="assign_labels" value="discretize" /> |
| 299 <param name="random_state" value="100"/> | 299 <param name="random_state" value="100" /> |
| 300 <param name="degree" value="2"/> | 300 <param name="degree" value="2" /> |
| 301 <output name="outfile" file="cluster_result13.txt" compare="sim_size" /> | 301 <output name="outfile" file="cluster_result13.txt" compare="sim_size" /> |
| 302 </test> | 302 </test> |
| 303 <test> | 303 <test> |
| 304 <param name="infile" value="numeric_values.tabular" ftype="tabular"/> | 304 <param name="infile" value="numeric_values.tabular" ftype="tabular" /> |
| 305 <param name="selected_algorithm" value="MiniBatchKMeans"/> | 305 <param name="selected_algorithm" value="MiniBatchKMeans" /> |
| 306 <param name="selected_input_type" value="tabular"/> | 306 <param name="selected_input_type" value="tabular" /> |
| 307 <param name="col" value="2,3,4" /> | 307 <param name="col" value="2,3,4" /> |
| 308 <param name="tol" value="0.5"/> | 308 <param name="tol" value="0.5" /> |
| 309 <param name="random_state" value="100"/> | 309 <param name="random_state" value="100" /> |
| 310 <output name="outfile" file="cluster_result14.txt"/> | 310 <output name="outfile" file="cluster_result14.txt" /> |
| 311 </test> | 311 </test> |
| 312 <test> | 312 <test> |
| 313 <param name="infile" value="numeric_values.tabular" ftype="tabular"/> | 313 <param name="infile" value="numeric_values.tabular" ftype="tabular" /> |
| 314 <param name="selected_algorithm" value="MiniBatchKMeans"/> | 314 <param name="selected_algorithm" value="MiniBatchKMeans" /> |
| 315 <param name="selected_input_type" value="tabular"/> | 315 <param name="selected_input_type" value="tabular" /> |
| 316 <param name="n_init" value="5"/> | 316 <param name="n_init" value="5" /> |
| 317 <param name="col" value="2,3,4" /> | 317 <param name="col" value="2,3,4" /> |
| 318 <param name="batch_size" value="10"/> | 318 <param name="batch_size" value="10" /> |
| 319 <param name="n_clusters" value="4"/> | 319 <param name="n_clusters" value="4" /> |
| 320 <param name="random_state" value="100"/> | 320 <param name="random_state" value="100" /> |
| 321 <param name="reassignment_ratio" value="1.0"/> | 321 <param name="reassignment_ratio" value="1.0" /> |
| 322 <output name="outfile" file="cluster_result15.txt"/> | 322 <output name="outfile" file="cluster_result15.txt" /> |
| 323 </test> | 323 </test> |
| 324 <test> | 324 <test> |
| 325 <param name="infile" value="numeric_values.tabular" ftype="tabular"/> | 325 <param name="infile" value="numeric_values.tabular" ftype="tabular" /> |
| 326 <param name="selected_algorithm" value="KMeans"/> | 326 <param name="selected_algorithm" value="KMeans" /> |
| 327 <param name="selected_input_type" value="tabular"/> | 327 <param name="selected_input_type" value="tabular" /> |
| 328 <param name="col" value="1" /> | 328 <param name="col" value="1" /> |
| 329 <param name="n_clusters" value="4" /> | 329 <param name="n_clusters" value="4" /> |
| 330 <param name="random_state" value="100"/> | 330 <param name="random_state" value="100" /> |
| 331 <output name="outfile" file="cluster_result16.txt"/> | 331 <output name="outfile" file="cluster_result16.txt" /> |
| 332 </test> | 332 </test> |
| 333 <test> | 333 <test> |
| 334 <param name="infile" value="sparse.mtx" ftype="txt"/> | 334 <param name="infile" value="sparse.mtx" ftype="txt" /> |
| 335 <param name="selected_input_type" value="sparse"/> | 335 <param name="selected_input_type" value="sparse" /> |
| 336 <param name="selected_algorithm" value="KMeans"/> | 336 <param name="selected_algorithm" value="KMeans" /> |
| 337 <param name="n_clusters" value="2" /> | 337 <param name="n_clusters" value="2" /> |
| 338 <param name="init" value="k-means++" /> | 338 <param name="init" value="k-means++" /> |
| 339 <param name="random_state" value="100"/> | 339 <param name="random_state" value="100" /> |
| 340 <output name="outfile" file="cluster_result17.txt"/> | 340 <output name="outfile" file="cluster_result17.txt" /> |
| 341 </test> | 341 </test> |
| 342 <test> | 342 <test> |
| 343 <param name="infile" value="sparse.mtx" ftype="txt"/> | 343 <param name="infile" value="sparse.mtx" ftype="txt" /> |
| 344 <param name="selected_algorithm" value="DBSCAN"/> | 344 <param name="selected_algorithm" value="DBSCAN" /> |
| 345 <param name="selected_input_type" value="sparse"/> | 345 <param name="selected_input_type" value="sparse" /> |
| 346 <param name="algorithm" value="kd_tree"/> | 346 <param name="algorithm" value="kd_tree" /> |
| 347 <param name="leaf_size" value="10"/> | 347 <param name="leaf_size" value="10" /> |
| 348 <param name="eps" value="1.0"/> | 348 <param name="eps" value="1.0" /> |
| 349 <output name="outfile" file="cluster_result18.txt"/> | 349 <output name="outfile" file="cluster_result18.txt" /> |
| 350 </test> | 350 </test> |
| 351 <test> | 351 <test> |
| 352 <param name="infile" value="sparse.mtx" ftype="txt"/> | 352 <param name="infile" value="sparse.mtx" ftype="txt" /> |
| 353 <param name="selected_algorithm" value="Birch"/> | 353 <param name="selected_algorithm" value="Birch" /> |
| 354 <param name="selected_input_type" value="sparse"/> | 354 <param name="selected_input_type" value="sparse" /> |
| 355 <param name="n_clusters" value="2"/> | 355 <param name="n_clusters" value="2" /> |
| 356 <param name="threshold" value="0.008"/> | 356 <param name="threshold" value="0.008" /> |
| 357 <output name="outfile" file="cluster_result19.txt"/> | 357 <output name="outfile" file="cluster_result19.txt" /> |
| 358 </test> | 358 </test> |
| 359 <test> | 359 <test> |
| 360 <param name="infile" value="sparse.mtx" ftype="txt"/> | 360 <param name="infile" value="sparse.mtx" ftype="txt" /> |
| 361 <param name="selected_algorithm" value="MiniBatchKMeans"/> | 361 <param name="selected_algorithm" value="MiniBatchKMeans" /> |
| 362 <param name="selected_input_type" value="sparse"/> | 362 <param name="selected_input_type" value="sparse" /> |
| 363 <param name="n_init" value="5"/> | 363 <param name="n_init" value="5" /> |
| 364 <param name="batch_size" value="10"/> | 364 <param name="batch_size" value="10" /> |
| 365 <param name="n_clusters" value="2"/> | 365 <param name="n_clusters" value="2" /> |
| 366 <param name="random_state" value="100"/> | 366 <param name="random_state" value="100" /> |
| 367 <param name="reassignment_ratio" value="1.0"/> | 367 <param name="reassignment_ratio" value="1.0" /> |
| 368 <output name="outfile" file="cluster_result20.txt"/> | 368 <output name="outfile" file="cluster_result20.txt" /> |
| 369 </test> | 369 </test> |
| 370 <test> | 370 <test> |
| 371 <param name="infile" value="sparse.mtx" ftype="txt"/> | 371 <param name="infile" value="sparse.mtx" ftype="txt" /> |
| 372 <param name="selected_algorithm" value="SpectralClustering"/> | 372 <param name="selected_algorithm" value="SpectralClustering" /> |
| 373 <param name="selected_input_type" value="sparse"/> | 373 <param name="selected_input_type" value="sparse" /> |
| 374 <param name="assign_labels" value="discretize"/> | 374 <param name="assign_labels" value="discretize" /> |
| 375 <param name="n_clusters" value="2"/> | 375 <param name="n_clusters" value="2" /> |
| 376 <param name="random_state" value="100"/> | 376 <param name="random_state" value="100" /> |
| 377 <param name="degree" value="2"/> | 377 <param name="degree" value="2" /> |
| 378 <output name="outfile" file="cluster_result21.txt"/> | 378 <output name="outfile" file="cluster_result21.txt" /> |
| 379 </test> | 379 </test> |
| 380 </tests> | 380 </tests> |
| 381 <help><![CDATA[ | 381 <help><![CDATA[ |
| 382 **What it does** | 382 **What it does** |
| 383 This tool offers different clustering algorithms which are provided by | 383 This tool offers different clustering algorithms which are provided by |
| 384 scikit-learn to find similarities among samples and cluster the samples based on these similarities. | 384 scikit-learn to find similarities among samples and cluster the samples based on these similarities. |
| 385 ]]></help> | 385 ]]> </help> |
| 386 <expand macro="sklearn_citation"/> | 386 <expand macro="sklearn_citation" /> |
| 387 </tool> | 387 </tool> |
