comparison main_macros.xml @ 0:0985b0dd6f1a draft

"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit eb703290e2589561ea215c84aa9f71bcfe1712c6"
author bgruening
date Fri, 01 Nov 2019 17:26:59 -0400
parents
children 5a092779412e
comparison
equal deleted inserted replaced
-1:000000000000 0:0985b0dd6f1a
1 <macros>
<!-- Version string substituted wherever the VERSION token is referenced. -->
<token name="@VERSION@">1.0.7.12</token>

<!-- Separate version string substituted wherever the ENSEMBLE_VERSION token is referenced. -->
<token name="@ENSEMBLE_VERSION@">0.2.0</token>
5
<!-- Package requirements: Python 3.6 and Galaxy-ML 0.7.12.
     The yield lets the expanding tool append further requirement elements. -->
<xml name="python_requirements">
  <requirements>
    <requirement version="3.6" type="package">python</requirement>
    <requirement version="0.7.12" type="package">Galaxy-ML</requirement>
    <yield/>
  </requirements>
</xml>
13
<!-- Exit-code handling: any exit code of 1 or above is reported as fatal. -->
<xml name="macro_stdio">
  <stdio>
    <exit_code
        range="1:"
        level="fatal"
        description="Error occurred. Please check Tool Standard Error"/>
  </stdio>
</xml>
19
20
21 <!--Generic interface-->
22
<!-- Train / load-and-predict switch.
     "load" asks for a model file, a dataset and a header flag, plus a
     prediction-type selector whose branches are empty here.
     "train" wraps whatever the expanding tool yields in the
     "selected_algorithms" conditional. -->
<xml name="sl_Conditional" token_train="tabular" token_data="tabular" token_model="txt">
  <conditional name="selected_tasks">
    <param name="selected_task" type="select" label="Select a Classification Task">
      <option value="train" selected="true">Train a model</option>
      <option value="load">Load a model and predict</option>
    </param>
    <when value="load">
      <param name="infile_model"
             type="data"
             format="@MODEL@"
             label="Models"
             help="Select a model file."/>
      <param name="infile_data"
             type="data"
             format="@DATA@"
             label="Data (tabular)"
             help="Select the dataset you want to classify."/>
      <param name="header"
             type="boolean"
             optional="True"
             truevalue="booltrue"
             falsevalue="boolfalse"
             checked="False"
             label="Does the dataset contain header:"/>
      <conditional name="prediction_options">
        <param name="prediction_option" type="select" label="Select the type of prediction">
          <option value="predict">Predict class labels</option>
          <option value="advanced">Include advanced options</option>
        </param>
        <when value="predict"/>
        <when value="advanced"/>
      </conditional>
    </when>
    <when value="train">
      <conditional name="selected_algorithms">
        <yield/>
      </conditional>
    </when>
  </conditional>
</xml>
51
<!-- Collapsed "Advanced Options" section; its content is supplied by the expanding tool. -->
<xml name="advanced_section">
  <section name="options" title="Advanced Options" expanded="False">
    <yield/>
  </section>
</xml>
57
58
59 <!--Generalized Linear Models-->
<!-- Select for the "loss" argument. The "select" token controls whether
     squared_loss is preselected; extra options can be yielded in. -->
<xml name="loss" token_help=" " token_select="false">
  <param argument="loss"
         type="select"
         label="Loss function"
         help="@HELP@">
    <option value="squared_loss" selected="@SELECT@">squared loss</option>
    <option value="huber">huber</option>
    <option value="epsilon_insensitive">epsilon insensitive</option>
    <option value="squared_epsilon_insensitive">squared epsilon insensitive</option>
    <yield/>
  </param>
</xml>
69
<!-- Select for the "penalty" argument (l2 preselected); extra options can be yielded in. -->
<xml name="penalty" token_help=" ">
  <param argument="penalty"
         type="select"
         label="Penalty (regularization term)"
         help="@HELP@">
    <option value="l2" selected="true">l2</option>
    <option value="l1">l1</option>
    <option value="elasticnet">elastic net</option>
    <option value="none">none</option>
    <yield/>
  </param>
</xml>
79
<!-- Float input for "l1_ratio"; default value and help come from tokens. -->
<xml name="l1_ratio" token_default_value="0.15" token_help=" ">
  <param argument="l1_ratio"
         type="float"
         value="@DEFAULT_VALUE@"
         label="Elastic Net mixing parameter"
         help="@HELP@"/>
</xml>
83
<!-- Float input for "epsilon"; default value and help come from tokens. -->
<xml name="epsilon"
     token_default_value="0.1"
     token_help="Used if loss is ‘huber’, ‘epsilon_insensitive’, or ‘squared_epsilon_insensitive’. ">
  <param argument="epsilon"
         type="float"
         value="@DEFAULT_VALUE@"
         label="Epsilon (epsilon-sensitive loss functions only)"
         help="@HELP@"/>
</xml>
87
<!-- Optional select for the "learning_rate" schedule. The selected1 / selected2
     tokens choose whether "optimal" or "invscaling" is preselected. -->
<xml name="learning_rate_s" token_help=" " token_selected1="false" token_selected2="false">
  <param argument="learning_rate"
         type="select"
         optional="true"
         label="Learning rate schedule"
         help="@HELP@">
    <option value="optimal" selected="@SELECTED1@">optimal</option>
    <option value="constant">constant</option>
    <option value="invscaling" selected="@SELECTED2@">inverse scaling</option>
    <yield/>
  </param>
</xml>
96
<!-- Float input for "eta0"; default value and help come from tokens. -->
<xml name="eta0"
     token_default_value="0.0"
     token_help="Used with ‘constant’ or ‘invscaling’ schedules. ">
  <param argument="eta0"
         type="float"
         value="@DEFAULT_VALUE@"
         label="Initial learning rate"
         help="@HELP@"/>
</xml>
100
<!-- Float input for "power_t"; default value and help come from tokens. -->
<xml name="power_t" token_default_value="0.5" token_help=" ">
  <param argument="power_t"
         type="float"
         value="@DEFAULT_VALUE@"
         label="Exponent for inverse scaling learning rate"
         help="@HELP@"/>
</xml>
104
<!-- Boolean input for "normalize". The checked state and the help text are
     both token-driven; the help attribute now actually uses the declared
     "help" token (it was hard-coded to a blank string before, so any help
     passed by the expanding tool was dropped). The token default is still
     a single space, so tools that pass nothing render the same as before. -->
<xml name="normalize" token_checked="false" token_help=" ">
  <param argument="normalize"
         type="boolean"
         optional="true"
         truevalue="booltrue"
         falsevalue="boolfalse"
         checked="@CHECKED@"
         label="Normalize samples before training"
         help="@HELP@"/>
</xml>
108
<!-- Boolean input for "copy_X". The previously hard-coded help sentence is now
     the default of the "help" token, so the rendered help is unchanged unless
     the expanding tool passes its own help text (which used to be ignored). -->
<xml name="copy_X" token_checked="true" token_help="If false, samples would be overwritten. ">
  <param argument="copy_X"
         type="boolean"
         optional="true"
         truevalue="booltrue"
         falsevalue="boolfalse"
         checked="@CHECKED@"
         label="Use a copy of samples"
         help="@HELP@"/>
</xml>
112
<!-- Parameter bundle built from the shared macros (normalize, alpha,
     fit_intercept, max_iter, tol, copy_X, random_state) plus a local
     "solver" select with "auto" preselected. -->
<xml name="ridge_params">
  <expand macro="normalize"/>
  <expand macro="alpha" default_value="1.0"/>
  <expand macro="fit_intercept"/>
  <expand macro="max_iter" default_value=""/>
  <expand macro="tol"
          default_value="0.001"
          help_text="Precision of the solution. "/>
  <!--class_weight-->
  <expand macro="copy_X"/>
  <param argument="solver"
         type="select"
         value=""
         label="Solver to use in the computational routines"
         help=" ">
    <option value="auto" selected="true">auto</option>
    <option value="svd">svd</option>
    <option value="cholesky">cholesky</option>
    <option value="lsqr">lsqr</option>
    <option value="sparse_cg">sparse_cg</option>
    <option value="sag">sag</option>
  </param>
  <expand macro="random_state"/>
</xml>
131
132 <!--Ensemble methods-->
<!-- Optional integer input for "n_estimators"; default value and help come from tokens. -->
<xml name="n_estimators" token_default_value="10" token_help=" ">
  <param argument="n_estimators"
         type="integer"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="Number of trees in the forest"
         help="@HELP@"/>
</xml>
136
<!-- Optional integer input for "max_depth"; the default value token is empty. -->
<xml name="max_depth" token_default_value="" token_help=" ">
  <param argument="max_depth"
         type="integer"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="Maximum depth of the tree"
         help="@HELP@"/>
</xml>
140
<!-- Optional input for "min_samples_split"; the parameter type itself is a token
     (integer unless overridden), as are the default value and help. -->
<xml name="min_samples_split" token_type="integer" token_default_value="2" token_help=" ">
  <param argument="min_samples_split"
         type="@TYPE@"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="Minimum number of samples required to split an internal node"
         help="@HELP@"/>
</xml>
144
<!-- Optional input for "min_samples_leaf"; type, default value, label and help are all tokens. -->
<xml name="min_samples_leaf"
     token_type="integer"
     token_default_value="1"
     token_label="Minimum number of samples in newly created leaves"
     token_help=" ">
  <param argument="min_samples_leaf"
         type="@TYPE@"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="@LABEL@"
         help="@HELP@"/>
</xml>
148
<!-- Optional float input for "min_weight_fraction_leaf"; default value and help come from tokens. -->
<xml name="min_weight_fraction_leaf" token_default_value="0.0" token_help=" ">
  <param argument="min_weight_fraction_leaf"
         type="float"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="Minimum weighted fraction of the input samples required to be at a leaf node"
         help="@HELP@"/>
</xml>
152
<!-- Optional integer input for "max_leaf_nodes"; the default value token is empty. -->
<xml name="max_leaf_nodes" token_default_value="" token_help=" ">
  <param argument="max_leaf_nodes"
         type="integer"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="Maximum number of leaf nodes in best-first method"
         help="@HELP@"/>
</xml>
156
<!-- Optional float input for "min_impurity_decrease"; default value and help come from tokens. -->
<xml name="min_impurity_decrease" token_default_value="0" token_help=" ">
  <param argument="min_impurity_decrease"
         type="float"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="The threshold value of impurity for stopping node splitting"
         help="@HELP@"/>
</xml>
160
<!-- Boolean input for "bootstrap"; checked state and help come from tokens.
     The false value is spelled "boolfalse" like every other boolean in this
     file (it was misspelled "boolflase"). -->
<xml name="bootstrap" token_checked="true" token_help=" ">
  <param argument="bootstrap"
         type="boolean"
         optional="true"
         truevalue="booltrue"
         falsevalue="boolfalse"
         checked="@CHECKED@"
         label="Use bootstrap samples for building trees."
         help="@HELP@"/>
</xml>
164
<!-- Select for the "criterion" argument with gini preselected; extra options
     can be yielded in. The help attribute now uses the declared "help" token
     instead of a hard-coded blank; the token default is the same single
     space, so tools that pass nothing render as before. -->
<xml name="criterion" token_help=" ">
  <param argument="criterion"
         type="select"
         label="Function to measure the quality of a split"
         help="@HELP@">
    <option value="gini" selected="true">Gini impurity</option>
    <option value="entropy">Information gain</option>
    <yield/>
  </param>
</xml>
172
<!-- Select for the "criterion" argument offering mse / mae; extra options can
     be yielded in. The declared "help" token was never referenced; it is now
     wired to the help attribute (empty by default). -->
<xml name="criterion2" token_help="">
  <param argument="criterion"
         type="select"
         label="Function to measure the quality of a split"
         help="@HELP@">
    <option value="mse">mse - mean squared error</option>
    <option value="mae">mae - mean absolute error</option>
    <yield/>
  </param>
</xml>
180
<!-- Boolean input for "oob_score"; checked state and help come from tokens. -->
<xml name="oob_score" token_checked="false" token_help=" ">
  <param argument="oob_score"
         type="boolean"
         optional="true"
         truevalue="booltrue"
         falsevalue="boolfalse"
         checked="@CHECKED@"
         label="Use out-of-bag samples to estimate the generalization error"
         help="@HELP@"/>
</xml>
184
<!-- Conditional for "max_features": three named presets with no further input,
     or "number_input", which reveals an optional float field. -->
<xml name="max_features">
  <conditional name="select_max_features">
    <param argument="max_features" type="select" label="max_features">
      <option value="auto" selected="true">auto - max_features=n_features</option>
      <option value="sqrt">sqrt - max_features=sqrt(n_features)</option>
      <option value="log2">log2 - max_features=log2(n_features)</option>
      <option value="number_input">I want to type the number in or input None type</option>
    </param>
    <when value="auto"/>
    <when value="sqrt"/>
    <when value="log2"/>
    <when value="number_input">
      <param name="num_max_features"
             type="float"
             value=""
             optional="true"
             label="Input max_features number:"
             help="If int, consider the number of features at each split; If float, then max_features is a percentage and int(max_features * n_features) features are considered at each split."/>
    </when>
  </conditional>
</xml>
204
<!-- Optional integer input for "verbose"; default value and help come from tokens. -->
<xml name="verbose"
     token_default_value="0"
     token_help="If 1 then it prints progress and performance once in a while. If greater than 1 then it prints progress and performance for every tree.">
  <param argument="verbose"
         type="integer"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="Enable verbose output"
         help="@HELP@"/>
</xml>
208
<!-- Optional float input for "learning_rate"; default value and help come from tokens. -->
<xml name="learning_rate" token_default_value="1.0" token_help=" ">
  <param argument="learning_rate"
         type="float"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="Learning rate"
         help="@HELP@"/>
</xml>
212
<!-- Optional float input for "subsample" with a fixed default of 1.0; only the help is a token. -->
<xml name="subsample" token_help=" ">
  <param argument="subsample"
         type="float"
         optional="true"
         value="1.0"
         label="The fraction of samples to be used for fitting the individual base learners"
         help="@HELP@"/>
</xml>
216
<!-- Three-way select (auto / true / false) for "presort", with auto preselected. -->
<xml name="presort">
  <param argument="presort"
         type="select"
         label="Whether to presort the data to speed up the finding of best splits in fitting">
    <option value="auto" selected="true">auto</option>
    <option value="true">true</option>
    <option value="false">false</option>
  </param>
</xml>
224
225 <!--Parameters-->
<!-- Optional float input for "tol". Note that the help token here is named
     help_text, so expanding tools must pass help_text="..." to override it. -->
<xml name="tol"
     token_default_value="0.0"
     token_help_text="Early stopping heuristics based on the relative center changes. Set to default (0.0) to disable this convergence detection.">
  <param argument="tol"
         type="float"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="Tolerance"
         help="@HELP_TEXT@"/>
</xml>
229
<!-- Optional integer input for "n_clusters"; the default value comes from a token. -->
<xml name="n_clusters" token_default_value="8">
  <param argument="n_clusters"
         type="integer"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="Number of clusters"
         help=" "/>
</xml>
233
<!-- Boolean input for "fit_intercept"; the checked state comes from a token. -->
<xml name="fit_intercept" token_checked="true">
  <param argument="fit_intercept"
         type="boolean"
         optional="true"
         truevalue="booltrue"
         falsevalue="boolfalse"
         checked="@CHECKED@"
         label="Estimate the intercept"
         help="If false, the data is assumed to be already centered."/>
</xml>
237
<!-- Optional integer input for "n_iter"; default value and help_text come from tokens. -->
<xml name="n_iter"
     token_default_value="5"
     token_help_text="The number of passes over the training data (aka epochs). ">
  <param argument="n_iter"
         type="integer"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="Number of iterations"
         help="@HELP_TEXT@"/>
</xml>
241
<!-- Boolean input for "shuffle"; checked state, label and help_text come from tokens. -->
<xml name="shuffle"
     token_checked="true"
     token_help_text=" "
     token_label="Shuffle data after each iteration">
  <param argument="shuffle"
         type="boolean"
         optional="true"
         truevalue="booltrue"
         falsevalue="boolfalse"
         checked="@CHECKED@"
         label="@LABEL@"
         help="@HELP_TEXT@"/>
</xml>
245
<!-- Optional integer input for "random_state"; the default value token is empty. -->
<xml name="random_state"
     token_default_value=""
     token_help_text="Integer number. The seed of the pseudo random number generator to use when shuffling the data. A fixed seed allows reproducible results. default=None.">
  <param argument="random_state"
         type="integer"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="Random seed number"
         help="@HELP_TEXT@"/>
</xml>
249
<!-- Boolean input for "warm_start"; checked state and help_text come from
     tokens. The default help text has its missing space after the comma restored. -->
<xml name="warm_start"
     token_checked="true"
     token_help_text="When set to True, reuse the solution of the previous call to fit as initialization, otherwise, just erase the previous solution.">
  <param argument="warm_start"
         type="boolean"
         optional="true"
         truevalue="booltrue"
         falsevalue="boolfalse"
         checked="@CHECKED@"
         label="Perform warm start"
         help="@HELP_TEXT@"/>
</xml>
253
<!-- Duplicate definition removed: the "C" macro (same float parameter, same
     tokens) is defined again after the "noise" macro, and that later
     definition is the one kept. -->
257
258 <!--xml name="class_weight" token_default_value="" token_help_text="">
259 <param argument="class_weight" type="" optional="true" value="@DEFAULT_VALUE@" label="" help="@HELP_TEXT@"/>
260 </xml-->
261
<!-- Optional float input for "alpha"; default value and help_text come from tokens. -->
<xml name="alpha"
     token_default_value="0.0001"
     token_help_text="Constant that multiplies the regularization term if regularization is used. ">
  <param argument="alpha"
         type="float"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="Regularization coefficient"
         help="@HELP_TEXT@"/>
</xml>
265
<!-- Optional integer input for "n_samples"; default value and help_text come from tokens. -->
<xml name="n_samples"
     token_default_value="100"
     token_help_text="The total number of points equally divided among clusters.">
  <param argument="n_samples"
         type="integer"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="Number of samples"
         help="@HELP_TEXT@"/>
</xml>
269
<!-- Optional integer input for "n_features"; default value and help_text come from tokens. -->
<xml name="n_features"
     token_default_value="2"
     token_help_text="Number of different numerical properties produced for each sample.">
  <param argument="n_features"
         type="integer"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="Number of features"
         help="@HELP_TEXT@"/>
</xml>
273
<!-- Optional float input for "noise"; default value and help_text come from tokens. -->
<xml name="noise"
     token_default_value="0.0"
     token_help_text="Floating point number. ">
  <param argument="noise"
         type="float"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="Standard deviation of the Gaussian noise added to the data"
         help="@HELP_TEXT@"/>
</xml>
277
<!-- Optional float input for "C"; default value and help_text come from tokens. -->
<xml name="C"
     token_default_value="1.0"
     token_help_text="Penalty parameter C of the error term. ">
  <param argument="C"
         type="float"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="Penalty parameter"
         help="@HELP_TEXT@"/>
</xml>
281
<!-- Optional integer input for "max_iter"; default value, label and help_text come from tokens. -->
<xml name="max_iter"
     token_default_value="300"
     token_label="Maximum number of iterations per single run"
     token_help_text=" ">
  <param argument="max_iter"
         type="integer"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="@LABEL@"
         help="@HELP_TEXT@"/>
</xml>
285
<!-- Optional integer input for "n_init"; the default value comes from a token. -->
<xml name="n_init" token_default_value="10">
  <param argument="n_init"
         type="integer"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="Number of runs with different centroid seeds"
         help=" "/>
</xml>
289
<!-- Select for the "init" argument with two options; neither is explicitly marked as selected. -->
<xml name="init">
  <param argument="init"
         type="select"
         label="Centroid initialization method"
         help="''k-means++'' selects initial cluster centers that speed up convergence. ''random'' chooses k observations (rows) at random from data as initial centroids.">
    <option value="k-means++">k-means++</option>
    <option value="random">random</option>
  </param>
</xml>
296
<!-- Optional float input for "gamma"; default value, label and help_text come from tokens. -->
<xml name="gamma"
     token_default_value="1.0"
     token_label="Scaling parameter"
     token_help_text=" ">
  <param argument="gamma"
         type="float"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="@LABEL@"
         help="@HELP_TEXT@"/>
</xml>
300
<!-- Optional integer input for "degree"; default value, label and help_text come from tokens. -->
<xml name="degree"
     token_default_value="3"
     token_label="Degree of the polynomial"
     token_help_text=" ">
  <param argument="degree"
         type="integer"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="@LABEL@"
         help="@HELP_TEXT@"/>
</xml>
304
<!-- Optional integer input for "coef0"; default value, label and help_text come from tokens.
     NOTE(review): svc_advanced_options declares its own coef0 as a float;
     confirm whether integer is intended here. -->
<xml name="coef0"
     token_default_value="1"
     token_label="Zero coefficient"
     token_help_text=" ">
  <param argument="coef0"
         type="integer"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="@LABEL@"
         help="@HELP_TEXT@"/>
</xml>
308
<!-- Optional integer input for "pos_label"; the default value token is empty. -->
<xml name="pos_label" token_default_value="">
  <param argument="pos_label"
         type="integer"
         optional="true"
         value="@DEFAULT_VALUE@"
         label="Label of the positive class"
         help=" "/>
</xml>
312
<!-- Optional select for the "average" argument; extra options can be yielded in.
     The literal string "None" is offered as one of the values. -->
<xml name="average">
  <param argument="average"
         type="select"
         optional="true"
         label="Averaging type"
         help=" ">
    <option value="micro">Calculate metrics globally by counting the total true positives, false negatives and false positives. (micro)</option>
    <option value="samples">Calculate metrics for each instance, and find their average. Only meaningful for multilabel. (samples)</option>
    <option value="macro">Calculate metrics for each label, and find their unweighted mean. This does not take label imbalance into account. (macro)</option>
    <option value="weighted">Calculate metrics for each label, and find their average, weighted by support (the number of true instances for each label). This alters ‘macro’ to account for label imbalance; it can result in an F-score that is not between precision and recall. (weighted)</option>
    <option value="None">None</option>
    <yield/>
  </param>
</xml>
323
<!-- Required float input for "beta" with a fixed default of 1.0. -->
<xml name="beta">
  <param argument="beta"
         type="float"
         value="1.0"
         label="The strength of recall versus precision in the F-score"
         help=" "/>
</xml>
327
328
329 <!--Data interface-->
330
<!-- Two tabular inputs (infile1 = samples, infile2 = labels/targets), each with
     a header flag and a column-selector conditional built from
     samples_column_selector_options. multiple1 / multiple2 are forwarded to
     the two selectors; further content can be yielded in at the end. -->
<xml name="samples_tabular"
     token_label1="Training samples dataset:"
     token_multiple1="false"
     token_multiple2="false">
  <param name="infile1" type="data" format="tabular" label="@LABEL1@"/>
  <param name="header1"
         type="boolean"
         optional="true"
         truevalue="booltrue"
         falsevalue="boolfalse"
         checked="False"
         label="Does the dataset contain header:"/>
  <conditional name="column_selector_options_1">
    <expand macro="samples_column_selector_options" multiple="@MULTIPLE1@"/>
  </conditional>
  <param name="infile2"
         type="data"
         format="tabular"
         label="Dataset containing class labels or target values:"/>
  <param name="header2"
         type="boolean"
         optional="true"
         truevalue="booltrue"
         falsevalue="boolfalse"
         checked="False"
         label="Does the dataset contain header:"/>
  <conditional name="column_selector_options_2">
    <expand macro="samples_column_selector_options"
            column_option="selected_column_selector_option2"
            col_name="col2"
            multiple="@MULTIPLE2@"
            infile="infile2"/>
  </conditional>
  <yield/>
</xml>
344
<!-- Body of a column-selector conditional (the enclosing conditional element
     is written by the caller). The select chooses between index-based
     selection (a data_column param bound to the infile token), header-name
     based selection (free text), or all columns (no further input). -->
<xml name="samples_column_selector_options"
     token_column_option="selected_column_selector_option"
     token_col_name="col1"
     token_multiple="False"
     token_infile="infile1">
  <param name="@COLUMN_OPTION@" type="select" label="Choose how to select data by column:">
    <option value="by_index_number" selected="true">Select columns by column index number(s)</option>
    <option value="all_but_by_index_number">All columns EXCLUDING some by column index number(s)</option>
    <option value="by_header_name">Select columns by column header name(s)</option>
    <option value="all_but_by_header_name">All columns EXCLUDING some by column header name(s)</option>
    <option value="all_columns">All columns</option>
  </param>
  <when value="by_index_number">
    <param name="@COL_NAME@"
           type="data_column"
           multiple="@MULTIPLE@"
           use_header_names="true"
           data_ref="@INFILE@"
           label="Select target column(s):"/>
  </when>
  <when value="all_but_by_index_number">
    <param name="@COL_NAME@"
           type="data_column"
           multiple="@MULTIPLE@"
           use_header_names="true"
           data_ref="@INFILE@"
           label="Select target column(s):"/>
  </when>
  <when value="by_header_name">
    <param name="@COL_NAME@"
           type="text"
           value=""
           label="Type header name(s):"
           help="Comma-separated string. For example: target1,target2"/>
  </when>
  <when value="all_but_by_header_name">
    <param name="@COL_NAME@"
           type="text"
           value=""
           label="Type header name(s):"
           help="Comma-separated string. For example: target1,target2"/>
  </when>
  <when value="all_columns"/>
</xml>
368
<!-- Two parallel conditionals, one for the true-labels dataset (infile1) and
     one for the predicted-labels dataset (infile2). Each offers a tabular
     branch (dataset plus column picker) and a sparse branch (txt dataset only).
     label1 labels infile1 and label2 labels infile2 in both branches; the
     sparse branch of the predicted dataset previously used label1 by mistake. -->
<xml name="clf_inputs_extended" token_label1=" " token_label2=" " token_multiple="False">
  <conditional name="true_columns">
    <param name="selected_input1" type="select" label="Select the input type of true labels dataset:">
      <option value="tabular" selected="true">Tabular</option>
      <option value="sparse">Sparse</option>
    </param>
    <when value="tabular">
      <param name="infile1" type="data" label="@LABEL1@"/>
      <param name="col1" type="data_column" data_ref="infile1" label="Select the target column:"/>
    </when>
    <when value="sparse">
      <param name="infile1" type="data" format="txt" label="@LABEL1@"/>
    </when>
  </conditional>
  <conditional name="predicted_columns">
    <param name="selected_input2" type="select" label="Select the input type of predicted labels dataset:">
      <option value="tabular" selected="true">Tabular</option>
      <option value="sparse">Sparse</option>
    </param>
    <when value="tabular">
      <param name="infile2" type="data" label="@LABEL2@"/>
      <param name="col2" multiple="@MULTIPLE@" type="data_column" data_ref="infile2" label="Select target column(s):"/>
    </when>
    <when value="sparse">
      <param name="infile2" type="data" format="txt" label="@LABEL2@"/>
    </when>
  </conditional>
</xml>
397
<!-- Two tabular inputs (true labels and predicted values), each with a header
     flag and a column-selector conditional. multiple1 is forwarded to the
     first selector and multiple to the second. -->
<xml name="clf_inputs"
     token_label1="Dataset containing true labels (tabular):"
     token_label2="Dataset containing predicted values (tabular):"
     token_multiple1="False"
     token_multiple="False">
  <param name="infile1" type="data" format="tabular" label="@LABEL1@"/>
  <param name="header1"
         type="boolean"
         optional="True"
         truevalue="booltrue"
         falsevalue="boolfalse"
         checked="False"
         label="Does the dataset contain header:"/>
  <conditional name="column_selector_options_1">
    <expand macro="samples_column_selector_options" multiple="@MULTIPLE1@"/>
  </conditional>
  <param name="infile2" type="data" format="tabular" label="@LABEL2@"/>
  <param name="header2"
         type="boolean"
         optional="True"
         truevalue="booltrue"
         falsevalue="boolfalse"
         checked="False"
         label="Does the dataset contain header:"/>
  <conditional name="column_selector_options_2">
    <expand macro="samples_column_selector_options"
            column_option="selected_column_selector_option2"
            col_name="col2"
            multiple="@MULTIPLE@"
            infile="infile2"/>
  </conditional>
</xml>
410
<!-- Repeat block of data inputs: at least one entry, at most max_num.
     Repeat name, format, label and help_text are all tokens. -->
<xml name="multiple_input"
     token_name="input_files"
     token_max_num="10"
     token_format="txt"
     token_label="Sparse matrix file (.mtx, .txt)"
     token_help_text="Specify a sparse matrix file in .txt format.">
  <repeat name="@NAME@" min="1" max="@MAX_NUM@" title="Select input file(s):">
    <param name="input"
           type="data"
           format="@FORMAT@"
           label="@LABEL@"
           help="@HELP_TEXT@"/>
  </repeat>
</xml>
416
<!-- Sparse-matrix input (infile1) followed by the tabular target inputs from
     input_tabular_target. Only format1, label1 and help1 are referenced in
     this body; the remaining declared tokens are not used here. -->
<xml name="sparse_target"
     token_label1="Select a sparse matrix:"
     token_label2="Select the tabular containing true labels:"
     token_multiple="False"
     token_format1="txt"
     token_format2="tabular"
     token_help1=""
     token_help2="">
  <param name="infile1"
         type="data"
         format="@FORMAT1@"
         label="@LABEL1@"
         help="@HELP1@"/>
  <expand macro="input_tabular_target"/>
</xml>
421
<!-- Input-type conditional: the selector from data_input_options plus the
     matching branches from data_input_whens. -->
<xml name="sl_mixed_input">
  <conditional name="input_options">
    <expand macro="data_input_options"/>
    <expand macro="data_input_whens"/>
  </conditional>
</xml>
428
<!-- Input-type conditional that offers the base choices and two
     sequence-based ones: a fasta file, or a reference genome with intervals.
     The extra options and branches are passed into the yields of
     data_input_options and data_input_whens.
     The fasta option's display text is corrected ("sequnences" to "sequences"). -->
<xml name="sl_mixed_input_plus_sequence">
  <conditional name="input_options">
    <expand macro="data_input_options">
      <option value="seq_fasta">sequences in a fasta file</option>
      <option value="refseq_and_interval">reference genome and intervals</option>
    </expand>
    <expand macro="data_input_whens">
      <when value="seq_fasta">
        <expand macro="inputs_seq_fasta"/>
      </when>
      <when value="refseq_and_interval">
        <expand macro="inputs_refseq_and_interval"/>
      </when>
    </expand>
  </conditional>
</xml>
445
<!-- Input-type selector (tabular preselected, or sparse); extra options can be yielded in. -->
<xml name="data_input_options">
  <param name="selected_input"
         type="select"
         label="Select input type:">
    <option value="tabular" selected="true">tabular data</option>
    <option value="sparse">sparse matrix</option>
    <yield/>
  </param>
</xml>
453
<!-- Branches matching data_input_options: tabular expands samples_tabular
     (multi-column samples, single-column target) and sparse expands
     sparse_target. Extra branches can be yielded in. -->
<xml name="data_input_whens">
  <when value="tabular">
    <expand macro="samples_tabular"
            multiple1="true"
            multiple2="false"/>
  </when>
  <when value="sparse">
    <expand macro="sparse_target"/>
  </when>
  <yield/>
</xml>
463
<!-- Target dataset inputs: a tabular file (infile2), its header flag, and a
     single-column selector bound to infile2. -->
<xml name="input_tabular_target">
  <param name="infile2"
         type="data"
         format="tabular"
         label="Dataset containing class labels or target values:"/>
  <param name="header2"
         type="boolean"
         optional="true"
         truevalue="booltrue"
         falsevalue="boolfalse"
         checked="false"
         label="Does the dataset contain header:"/>
  <conditional name="column_selector_options_2">
    <expand macro="samples_column_selector_options"
            column_option="selected_column_selector_option2"
            col_name="col2"
            multiple="false"
            infile="infile2"/>
  </conditional>
</xml>
471
<!-- Fasta dataset input followed by the tabular target inputs from input_tabular_target. -->
<xml name="inputs_seq_fasta">
  <param name="fasta_path"
         type="data"
         format="fasta"
         label="Dataset containing fasta genomic/protein sequences"
         help="Sequences will be one-hot encoded to arrays."/>
  <expand macro="input_tabular_target"/>
</xml>
476
<!-- Inputs for the reference-genome mode: reference fasta, interval file, bed
     target file, and a tabular feature list (infile2) with a header flag and
     a multi-column selector. -->
<xml name="inputs_refseq_and_interval">
  <param name="ref_genome_file"
         type="data"
         format="fasta"
         label="Dataset containing reference genomic sequence"/>
  <param name="interval_file"
         type="data"
         format="interval"
         label="Dataset containing sequence intervals for training"
         help="interval. Sequences will be retrieved from the reference genome and one-hot encoded to training arrays."/>
  <param name="target_file"
         type="data"
         format="bed"
         label="Dataset containing positions and features for target values."
         help="bed. The file will be compressed with `bgzip` and then indexed using `tabix`."/>
  <param name="infile2"
         type="data"
         format="tabular"
         label="Dataset containing the feature list for prediction"/>
  <param name="header2"
         type="boolean"
         optional="true"
         truevalue="booltrue"
         falsevalue="boolfalse"
         checked="false"
         label="Does the dataset contain header:"/>
  <conditional name="column_selector_options_2">
    <expand macro="samples_column_selector_options"
            column_option="selected_column_selector_option2"
            col_name="col2"
            multiple="true"
            infile="infile2"/>
  </conditional>
</xml>
487
488 <!--Advanced options-->
<!-- "Advanced Options" section: yielded content first, then the weights and
     algorithm selects and the leaf_size integer. -->
<xml name="nn_advanced_options">
  <section name="options" title="Advanced Options" expanded="False">
    <yield/>
    <param argument="weights"
           type="select"
           label="Weight function"
           help="Used in prediction.">
      <option value="uniform" selected="true">Uniform weights. All points in each neighborhood are weighted equally. (Uniform)</option>
      <option value="distance">Weight points by the inverse of their distance. (Distance)</option>
    </param>
    <param argument="algorithm"
           type="select"
           label="Neighbor selection algorithm"
           help=" ">
      <option value="auto" selected="true">Auto</option>
      <option value="ball_tree">BallTree</option>
      <option value="kd_tree">KDTree</option>
      <option value="brute">Brute-force</option>
    </param>
    <param argument="leaf_size"
           type="integer"
           value="30"
           label="Leaf size"
           help="Used with BallTree and KDTree. Affects the time and memory usage of the constructed tree."/>
    <!--param name="metric"-->
    <!--param name="p"-->
    <!--param name="metric_params"-->
  </section>
</xml>
508
<!-- "Advanced Options" section: yielded content first, then kernel, degree,
     coef0, shrinking and probability, followed by the shared tol, max_iter
     and random_state macros with section-specific defaults and help.
     The word "default" is corrected in two help strings (was "dafault"). -->
<xml name="svc_advanced_options">
  <section name="options" title="Advanced Options" expanded="False">
    <yield/>
    <param argument="kernel" type="select" optional="true" label="Kernel type" help="Kernel type to be used in the algorithm. If none is given, ‘rbf’ will be used.">
      <option value="rbf" selected="true">rbf</option>
      <option value="linear">linear</option>
      <option value="poly">poly</option>
      <option value="sigmoid">sigmoid</option>
      <option value="precomputed">precomputed</option>
    </param>
    <param argument="degree" type="integer" optional="true" value="3" label="Degree of the polynomial (polynomial kernel only)" help="Ignored by other kernels. default : 3 "/>
    <!--TODO: param argument="gamma" float, optional (default=’auto’) -->
    <param argument="coef0" type="float" optional="true" value="0.0" label="Zero coefficient (polynomial and sigmoid kernels only)"
           help="Independent term in kernel function. default: 0.0 "/>
    <param argument="shrinking" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolfalse" checked="true"
           label="Use the shrinking heuristic" help=" "/>
    <param argument="probability" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolfalse" checked="false"
           label="Enable probability estimates. " help="This must be enabled prior to calling fit, and will slow down that method."/>
    <!-- param argument="cache_size"-->
    <!--expand macro="class_weight"/-->
    <expand macro="tol" default_value="0.001" help_text="Tolerance for stopping criterion. "/>
    <expand macro="max_iter" default_value="-1" label="Solver maximum number of iterations" help_text="Hard limit on iterations within solver, or -1 for no limit."/>
    <!--param argument="decision_function_shape"-->
    <expand macro="random_state" help_text="Integer number. The seed of the pseudo random number generator to use when shuffling the data for probability estimation. A fixed seed allows reproducible results."/>
  </section>
</xml>
535
<!-- "Advanced Options" section combining the shared n_clusters, random_state
     and n_init macros with local eigen_solver, gamma, affinity, n_neighbors,
     assign_labels, degree and coef0 inputs.
     User-facing typos are corrected: "Nearset" to "Nearest" in the affinity
     option, and "dafault" to "default" in the degree and coef0 help. -->
<xml name="spectral_clustering_advanced_options">
  <section name="options" title="Advanced Options" expanded="False">
    <expand macro="n_clusters"/>
    <param argument="eigen_solver" type="select" value="" label="Eigen solver" help="The eigenvalue decomposition strategy to use.">
      <option value="arpack" selected="true">arpack</option>
      <option value="lobpcg">lobpcg</option>
      <option value="amg">amg</option>
      <!--None-->
    </param>
    <expand macro="random_state"/>
    <expand macro="n_init"/>
    <param argument="gamma" type="float" optional="true" value="1.0" label="Kernel scaling factor" help="Scaling factor of RBF, polynomial, exponential chi^2 and sigmoid affinity kernel. Ignored for affinity=''nearest_neighbors''."/>
    <param argument="affinity" type="select" label="Affinity" help="Affinity kernel to use. ">
      <option value="rbf" selected="true">RBF</option>
      <option value="precomputed">precomputed</option>
      <option value="nearest_neighbors">Nearest neighbors</option>
    </param>
    <param argument="n_neighbors" type="integer" optional="true" value="10" label="Number of neighbors" help="Number of neighbors to use when constructing the affinity matrix using the nearest neighbors method. Ignored for affinity=''rbf''"/>
    <!--param argument="eigen_tol"-->
    <param argument="assign_labels" type="select" label="Assign labels" help="The strategy to use to assign labels in the embedding space.">
      <option value="kmeans" selected="true">kmeans</option>
      <option value="discretize">discretize</option>
    </param>
    <param argument="degree" type="integer" optional="true" value="3"
           label="Degree of the polynomial (polynomial kernel only)" help="Ignored by other kernels. default : 3 "/>
    <param argument="coef0" type="integer" optional="true" value="1"
           label="Zero coefficient (polynomial and sigmoid kernels only)" help="Ignored by other kernels. default : 1 "/>
    <!--param argument="kernel_params"-->
  </section>
</xml>
566
<!-- "Advanced Options" section combining the shared n_clusters, init, n_init,
     max_iter, tol and random_state macros with local batch_size,
     max_no_improvement, init_size and reassignment_ratio inputs.
     The max_no_improvement help is now a single-line attribute value (it used
     to span three lines, which put layout whitespace into the help text) and
     its "doe not" typo is corrected to "does not". -->
<xml name="minibatch_kmeans_advanced_options">
  <section name="options" title="Advanced Options" expanded="False">
    <expand macro="n_clusters"/>
    <expand macro="init"/>
    <expand macro="n_init" default_value="3"/>
    <expand macro="max_iter" default_value="100"/>
    <expand macro="tol" help_text="Early stopping heuristics based on normalized center change. To disable set to 0.0 ."/>
    <expand macro="random_state"/>
    <param argument="batch_size" type="integer" optional="true" value="100" label="Batch size" help="Size of the mini batches."/>
    <!--param argument="compute_labels"-->
    <param argument="max_no_improvement" type="integer" optional="true" value="10" label="Maximum number of improvement attempts" help="Convergence detection based on inertia (the consecutive number of mini batches that does not yield an improvement on the smoothed inertia). To disable, set max_no_improvement to None. "/>
    <param argument="init_size" type="integer" optional="true" value="" label="Number of random initialization samples" help="Number of samples to randomly sample for speeding up the initialization . ( default: 3 * batch_size )"/>
    <param argument="reassignment_ratio" type="float" optional="true" value="0.01" label="Re-assignment ratio" help="Controls the fraction of the maximum number of counts for a center to be reassigned. Higher values yield better clustering results."/>
  </section>
</xml>
584
<!-- Collapsed "Advanced Options" section holding the KMeans settings.
     Everything except copy_x is pulled in from other macros via <expand>. -->
<xml name="kmeans_advanced_options">
    <section name="options" title="Advanced Options" expanded="False">
        <expand macro="n_clusters"/>
        <expand macro="init"/>
        <expand macro="n_init"/>
        <expand macro="max_iter"/>
        <expand macro="tol" default_value="0.0001" help_text="Relative tolerance with regards to inertia to declare convergence."/>
        <!--param argument="precompute_distances"/-->
        <expand macro="random_state"/>
        <param argument="copy_x" type="boolean" optional="true"
               truevalue="booltrue" falsevalue="boolfalse" checked="true"
               label="Use a copy of data for precomputing distances"
               help="Modifying the original data introduces small numerical differences caused by subtracting and then adding the data mean."/>
        <expand macro="kmeans_algorithm"/>
    </section>
</xml>
598
<!-- Select box for the K-means "algorithm" argument; "auto" is preselected. -->
<xml name="kmeans_algorithm">
    <param argument="algorithm"
           type="select"
           label="K-means algorithm to use:">
        <option value="auto" selected="true">auto</option>
        <option value="full">full</option>
        <option value="elkan">elkan</option>
    </param>
</xml>
606
<!-- Collapsed "Advanced Options" section holding the Birch settings:
     subcluster radius threshold, branching factor and the shared n_clusters
     macro (expanded here with default_value 3). -->
<xml name="birch_advanced_options">
    <section name="options" title="Advanced Options" expanded="False">
        <param argument="threshold"
               type="float"
               value="0.5"
               optional="true"
               label="Subcluster radius threshold"
               help="The radius of the subcluster obtained by merging a new sample; the closest subcluster should be less than the threshold to avoid a new subcluster."/>
        <param argument="branching_factor"
               type="integer"
               value="50"
               optional="true"
               label="Maximum number of subclusters per branch"
               help="Maximum number of CF subclusters in each node."/>
        <expand macro="n_clusters" default_value="3"/>
        <!--param argument="compute_labels"/-->
    </section>
</xml>
615
<!-- Collapsed "Advanced Options" section holding the DBSCAN settings:
     neighborhood radius, core-point density, distance metric, neighbor-search
     algorithm and tree leaf size. -->
<xml name="dbscan_advanced_options">
    <section name="options" title="Advanced Options" expanded="False">
        <param argument="eps" type="float" optional="true" value="0.5"
               label="Maximum neighborhood distance"
               help="The maximum distance between two samples for them to be considered as in the same neighborhood."/>
        <param argument="min_samples" type="integer" optional="true" value="5"
               label="Minimal core point density"
               help="The number of samples (or total weight) in a neighborhood for a point (including the point itself) to be considered as a core point."/>
        <param argument="metric" type="text" optional="true" value="euclidean"
               label="Metric"
               help="The metric to use when calculating distance between instances in a feature array."/>
        <param argument="algorithm" type="select"
               label="Pointwise distance computation algorithm"
               help="The algorithm to be used by the NearestNeighbors module to compute pointwise distances and find nearest neighbors.">
            <option value="auto" selected="true">auto</option>
            <option value="ball_tree">ball_tree</option>
            <option value="kd_tree">kd_tree</option>
            <option value="brute">brute</option>
        </param>
        <param argument="leaf_size" type="integer" optional="true" value="30"
               label="Leaf size"
               help="Leaf size passed to BallTree or cKDTree. Memory and time efficiency factor in tree construction and querying."/>
    </section>
</xml>
630
<!-- Conditional that lets the user choose a clustering algorithm (KMeans is
     preselected) and then expands the advanced-options macro that belongs to
     the chosen algorithm. -->
<xml name="clustering_algorithms_options">
    <conditional name="algorithm_options">
        <param name="selected_algorithm"
               type="select"
               label="Clustering Algorithm">
            <option value="KMeans" selected="true">KMeans</option>
            <option value="SpectralClustering">Spectral Clustering</option>
            <option value="MiniBatchKMeans">Mini Batch KMeans</option>
            <option value="DBSCAN">DBSCAN</option>
            <option value="Birch">Birch</option>
        </param>

        <!-- One <when> per option above, each delegating to its own macro. -->
        <when value="KMeans">
            <expand macro="kmeans_advanced_options"/>
        </when>
        <when value="DBSCAN">
            <expand macro="dbscan_advanced_options"/>
        </when>
        <when value="Birch">
            <expand macro="birch_advanced_options"/>
        </when>
        <when value="SpectralClustering">
            <expand macro="spectral_clustering_advanced_options"/>
        </when>
        <when value="MiniBatchKMeans">
            <expand macro="minibatch_kmeans_advanced_options"/>
        </when>
    </conditional>
</xml>
657
<!-- Select box for the "metric" argument with a base list of distance metrics
     ("euclidean" preselected). The trailing <yield/> lets the caller append
     further <option> elements. -->
<xml name="distance_metrics">
    <param argument="metric"
           type="select"
           label="Distance metric"
           help=" ">
        <option value="euclidean" selected="true">euclidean</option>
        <option value="cityblock">cityblock</option>
        <option value="cosine">cosine</option>
        <option value="l1">l1</option>
        <option value="l2">l2</option>
        <option value="manhattan">manhattan</option>
        <yield/>
    </param>
</xml>
669
<!-- Bare list of additional distance-metric <option> elements. The macro has
     no enclosing <param>, so it must be expanded inside a select parameter. -->
<xml name="distance_nonsparse_metrics">
    <option value="braycurtis">braycurtis</option>
    <option value="canberra">canberra</option>
    <option value="chebyshev">chebyshev</option>
    <option value="correlation">correlation</option>
    <option value="dice">dice</option>
    <option value="hamming">hamming</option>
    <option value="jaccard">jaccard</option>
    <option value="kulsinski">kulsinski</option>
    <option value="mahalanobis">mahalanobis</option>
    <option value="matching">matching</option>
    <option value="minkowski">minkowski</option>
    <option value="rogerstanimoto">rogerstanimoto</option>
    <option value="russellrao">russellrao</option>
    <option value="seuclidean">seuclidean</option>
    <option value="sokalmichener">sokalmichener</option>
    <option value="sokalsneath">sokalsneath</option>
    <option value="sqeuclidean">sqeuclidean</option>
    <option value="yule">yule</option>
</xml>
690
<!-- Select box for the pairwise-kernel "metric" argument.
     This is a single-choice select, so exactly one option may be marked as
     selected. The original marked both "rbf" and "linear"; "rbf" is kept
     because it is the first flagged option in document order.
     NOTE(review): confirm that "rbf" (rather than "linear") is the intended
     default. -->
<xml name="pairwise_kernel_metrics">
    <param argument="metric" type="select" label="Pairwise Kernel metric" help=" ">
        <option value="rbf" selected="true">rbf</option>
        <option value="sigmoid">sigmoid</option>
        <option value="polynomial">polynomial</option>
        <option value="linear">linear</option>
        <option value="chi2">chi2</option>
        <option value="additive_chi2">additive_chi2</option>
    </param>
</xml>
701
<!-- Select box listing three pairwise metric functions, with the Euclidean
     distance matrix preselected. The <yield/> lets the caller append more
     <option> elements. -->
<xml name="sparse_pairwise_metric_functions">
    <param name="selected_metric_function"
           type="select"
           label="Select the pairwise metric you want to compute:">
        <option value="euclidean_distances" selected="true">Euclidean distance matrix</option>
        <option value="pairwise_distances">Distance matrix</option>
        <option value="pairwise_distances_argmin">Minimum distances between one point and a set of points</option>
        <yield/>
    </param>
</xml>
710
<!-- Bare list of kernel and L1-distance <option> elements. The macro has no
     enclosing <param>, so it must be expanded inside a select parameter. -->
<xml name="pairwise_metric_functions">
    <option value="additive_chi2_kernel">Additive chi-squared kernel</option>
    <option value="chi2_kernel">Exponential chi-squared kernel</option>
    <option value="linear_kernel">Linear kernel</option>
    <option value="manhattan_distances">L1 distances</option>
    <option value="pairwise_kernels">Kernel</option>
    <option value="polynomial_kernel">Polynomial kernel</option>
    <option value="rbf_kernel">Gaussian (rbf) kernel</option>
    <option value="laplacian_kernel">Laplacian kernel</option>
</xml>
721
<!-- <when> branches for the "pairwise_distances" and "euclidean_distances"
     choices. The first offers the distance_metrics select (forwarding this
     macro's own <yield/> into it); the second offers a "squared" switch. -->
<xml name="sparse_pairwise_condition">
    <when value="pairwise_distances">
        <section name="options" title="Advanced Options" expanded="False">
            <expand macro="distance_metrics">
                <yield/>
            </expand>
        </section>
    </when>
    <when value="euclidean_distances">
        <section name="options" title="Advanced Options" expanded="False">
            <param argument="squared"
                   type="boolean"
                   checked="false"
                   truevalue="booltrue"
                   falsevalue="boolfalse"
                   optional="true"
                   label="Return squared Euclidean distances"
                   help=" "/>
        </section>
    </when>
</xml>
737
<!-- <when> branch for the "pairwise_distances_argmin" choice: axis, distance
     metric (this macro's <yield/> is forwarded into distance_metrics) and
     batch size. -->
<xml name="argmin_distance_condition">
    <when value="pairwise_distances_argmin">
        <section name="options" title="Advanced Options" expanded="False">
            <param argument="axis"
                   type="integer"
                   value="1"
                   optional="true"
                   label="Axis"
                   help="Axis along which the argmin and distances are to be computed."/>
            <expand macro="distance_metrics">
                <yield/>
            </expand>
            <param argument="batch_size"
                   type="integer"
                   value="500"
                   optional="true"
                   label="Batch size"
                   help="Number of rows to be processed in each batch run."/>
        </section>
    </when>
</xml>
749
<!-- Select box with the base list of preprocessors (StandardScaler is
     preselected). The <yield/> lets the caller append more <option> elements. -->
<xml name="sparse_preprocessors">
    <param name="selected_pre_processor"
           type="select"
           label="Select a preprocessor:">
        <option value="StandardScaler" selected="true">Standard Scaler (Standardizes features by removing the mean and scaling to unit variance)</option>
        <option value="Binarizer">Binarizer (Binarizes data)</option>
        <option value="MaxAbsScaler">Max Abs Scaler (Scales features by their maximum absolute value)</option>
        <option value="Normalizer">Normalizer (Normalizes samples individually to unit norm)</option>
        <yield/>
    </param>
</xml>
759
<!-- Extended preprocessor select: expands sparse_preprocessors and supplies
     four additional options for its <yield/>. -->
<xml name="sparse_preprocessors_ext">
    <expand macro="sparse_preprocessors">
        <option value="KernelCenterer">Kernel Centerer (Centers a kernel matrix)</option>
        <option value="MinMaxScaler">Minmax Scaler (Scales features to a range)</option>
        <option value="PolynomialFeatures">Polynomial Features (Generates polynomial and interaction features)</option>
        <option value="RobustScaler">Robust Scaler (Scales features using outlier-invariance statistics)</option>
    </expand>
</xml>
768
<!-- <when> branches with the advanced options of the four base preprocessors
     (Binarizer, StandardScaler, MaxAbsScaler, Normalizer). The closing
     <yield/> lets the caller add branches for further preprocessors. -->
<xml name="sparse_preprocessor_options">
    <when value="Binarizer">
        <section name="options" title="Advanced Options" expanded="False">
            <param argument="copy"
                   type="boolean"
                   checked="true"
                   truevalue="booltrue"
                   falsevalue="boolfalse"
                   optional="true"
                   label="Use a copy of data for precomputing binarization"
                   help=" "/>
            <param argument="threshold"
                   type="float"
                   value="0.0"
                   optional="true"
                   label="Threshold"
                   help="Feature values below or equal to this are replaced by 0, above it by 1. Threshold may not be less than 0 for operations on sparse matrices. "/>
        </section>
    </when>
    <when value="StandardScaler">
        <section name="options" title="Advanced Options" expanded="False">
            <param argument="copy"
                   type="boolean"
                   checked="true"
                   truevalue="booltrue"
                   falsevalue="boolfalse"
                   optional="true"
                   label="Use a copy of data for performing inplace scaling"
                   help=" "/>
            <param argument="with_mean"
                   type="boolean"
                   checked="true"
                   truevalue="booltrue"
                   falsevalue="boolfalse"
                   optional="true"
                   label="Center the data before scaling"
                   help=" "/>
            <param argument="with_std"
                   type="boolean"
                   checked="true"
                   truevalue="booltrue"
                   falsevalue="boolfalse"
                   optional="true"
                   label="Scale the data to unit variance (or unit standard deviation)"
                   help=" "/>
        </section>
    </when>
    <when value="MaxAbsScaler">
        <section name="options" title="Advanced Options" expanded="False">
            <param argument="copy"
                   type="boolean"
                   checked="true"
                   truevalue="booltrue"
                   falsevalue="boolfalse"
                   optional="true"
                   label="Use a copy of data for precomputing scaling"
                   help=" "/>
        </section>
    </when>
    <when value="Normalizer">
        <section name="options" title="Advanced Options" expanded="False">
            <param argument="norm"
                   type="select"
                   optional="true"
                   label="The norm to use to normalize non zero samples"
                   help=" ">
                <option value="l1" selected="true">l1</option>
                <option value="l2">l2</option>
                <option value="max">max</option>
            </param>
            <param argument="copy"
                   type="boolean"
                   checked="true"
                   truevalue="booltrue"
                   falsevalue="boolfalse"
                   optional="true"
                   label="Use a copy of data for precomputing row normalization"
                   help=" "/>
        </section>
    </when>
    <yield/>
</xml>
808
<!-- Extended preprocessor options: expands sparse_preprocessor_options and
     supplies <when> branches for KernelCenterer, MinMaxScaler,
     PolynomialFeatures and RobustScaler.
     Every boolean here uses falsevalue="boolfalse", the spelling used by the
     other boolean parameters in this file; the previous "boolflase" spelling
     was a typo that made these parameters emit a different false token. -->
<xml name="sparse_preprocessor_options_ext">
    <expand macro="sparse_preprocessor_options">
        <when value="KernelCenterer">
            <section name="options" title="Advanced Options" expanded="False">
            </section>
        </when>
        <when value="MinMaxScaler">
            <section name="options" title="Advanced Options" expanded="False">
                <param argument="feature_range" type="text" value="(0, 1)" optional="true"
                       help="Desired range of transformed data. None or tuple (min, max). None equals to (0, 1)"/>
                <param argument="copy" type="boolean" optional="true"
                       truevalue="booltrue" falsevalue="boolfalse" checked="true"
                       label="Use a copy of data for precomputing normalization" help=" "/>
            </section>
        </when>
        <when value="PolynomialFeatures">
            <section name="options" title="Advanced Options" expanded="False">
                <param argument="degree" type="integer" optional="true" value="2"
                       label="The degree of the polynomial features " help=""/>
                <param argument="interaction_only" type="boolean" optional="true"
                       truevalue="booltrue" falsevalue="boolfalse" checked="false"
                       label="Produce interaction features only"
                       help="(Features that are products of at most degree distinct input features) "/>
                <param argument="include_bias" type="boolean" optional="true"
                       truevalue="booltrue" falsevalue="boolfalse" checked="true"
                       label="Include a bias column"
                       help="Feature in which all polynomial powers are zero "/>
            </section>
        </when>
        <when value="RobustScaler">
            <section name="options" title="Advanced Options" expanded="False">
                <!-- All three switches below are checked by default. -->
                <param argument="with_centering" type="boolean" optional="true"
                       truevalue="booltrue" falsevalue="boolfalse" checked="true"
                       label="Center the data before scaling" help=" "/>
                <param argument="with_scaling" type="boolean" optional="true"
                       truevalue="booltrue" falsevalue="boolfalse" checked="true"
                       label="Scale the data to interquartile range" help=" "/>
                <param argument="copy" type="boolean" optional="true"
                       truevalue="booltrue" falsevalue="boolfalse" checked="true"
                       label="Use a copy of data for inplace scaling" help=" "/>
            </section>
        </when>
    </expand>
</xml>
842
<!-- Bare list of cross-validation splitter <option> elements ("default" is
     preselected), to be expanded inside a select parameter. The <yield/> lets
     the caller append further splitters. -->
<xml name="cv_splitter">
    <option value="default" selected="true">default splitter</option>
    <option value="KFold">KFold</option>
    <option value="StratifiedKFold">StratifiedKFold</option>
    <option value="LeaveOneOut">LeaveOneOut</option>
    <option value="LeavePOut">LeavePOut</option>
    <option value="RepeatedKFold">RepeatedKFold</option>
    <option value="RepeatedStratifiedKFold">RepeatedStratifiedKFold</option>
    <option value="ShuffleSplit">ShuffleSplit</option>
    <option value="StratifiedShuffleSplit">StratifiedShuffleSplit</option>
    <option value="TimeSeriesSplit">TimeSeriesSplit</option>
    <option value="PredefinedSplit">PredefinedSplit</option>
    <option value="OrderedKFold">OrderedKFold</option>
    <option value="RepeatedOrderedKFold">RepeatedOrderedKFold</option>
    <yield/>
</xml>
859
<!-- <when> branches holding the parameters of each splitter listed in the
     cv_splitter macro. The closing <yield/> lets the caller add branches for
     further splitters.
     The n_repeats parameter of RepeatedOrderedKFold carries the same label
     and help text as the two other n_repeats parameters in this macro. -->
<xml name="cv_splitter_options">
    <when value="default">
        <expand macro="cv_n_splits"/>
    </when>
    <when value="KFold">
        <expand macro="cv_n_splits"/>
        <expand macro="cv_shuffle"/>
        <expand macro="random_state"/>
    </when>
    <when value="StratifiedKFold">
        <expand macro="cv_n_splits"/>
        <expand macro="cv_shuffle"/>
        <expand macro="random_state"/>
    </when>
    <!-- LeaveOneOut exposes no parameters. -->
    <when value="LeaveOneOut">
    </when>
    <when value="LeavePOut">
        <param argument="p" type="integer" value="" label="p" help="Integer. Size of the test sets."/>
    </when>
    <when value="RepeatedKFold">
        <expand macro="cv_n_splits" value="5"/>
        <param argument="n_repeats" type="integer" value="10" label="n_repeats" help="Number of times cross-validator needs to be repeated."/>
        <expand macro="random_state"/>
    </when>
    <when value="RepeatedStratifiedKFold">
        <expand macro="cv_n_splits" value="5"/>
        <param argument="n_repeats" type="integer" value="10" label="n_repeats" help="Number of times cross-validator needs to be repeated."/>
        <expand macro="random_state"/>
    </when>
    <!-- For the shuffle-split variants n_splits counts iterations, not
         folds, hence the overridden help text. -->
    <when value="ShuffleSplit">
        <expand macro="cv_n_splits" value="10" help="Number of re-shuffling and splitting iterations."/>
        <expand macro="cv_test_size" value="0.1"/>
        <expand macro="random_state"/>
    </when>
    <when value="StratifiedShuffleSplit">
        <expand macro="cv_n_splits" value="10" help="Number of re-shuffling and splitting iterations."/>
        <expand macro="cv_test_size" value="0.1"/>
        <expand macro="random_state"/>
    </when>
    <when value="TimeSeriesSplit">
        <expand macro="cv_n_splits"/>
        <param argument="max_train_size" type="integer" value="" optional="true" label="Maximum size of the training set" help="Maximum size for a single training set."/>
    </when>
    <when value="PredefinedSplit">
        <param argument="test_fold" type="text" value="" area="true" label="test_fold" help="List, e.g., [0, 1, -1, 1], represents two test sets, [X[0]] and [X[1], X[3]], X[2] is excluded from any test set due to '-1'."/>
    </when>
    <when value="OrderedKFold">
        <expand macro="cv_n_splits"/>
        <expand macro="cv_shuffle"/>
        <expand macro="random_state"/>
    </when>
    <when value="RepeatedOrderedKFold">
        <expand macro="cv_n_splits"/>
        <param argument="n_repeats" type="integer" value="5" label="n_repeats" help="Number of times cross-validator needs to be repeated."/>
        <expand macro="random_state"/>
    </when>
    <yield/>
</xml>
918
<!-- Full cross-validation splitter chooser. It extends the cv_splitter option
     list with four group-based splitters and adds the matching <when>
     branches to cv_splitter_options. -->
<xml name="cv">
    <conditional name="cv_selector">
        <param name="selected_cv"
               type="select"
               label="Select the cv splitter:">
            <expand macro="cv_splitter">
                <option value="GroupKFold">GroupKFold</option>
                <option value="GroupShuffleSplit">GroupShuffleSplit</option>
                <option value="LeaveOneGroupOut">LeaveOneGroupOut</option>
                <option value="LeavePGroupsOut">LeavePGroupsOut</option>
            </expand>
        </param>
        <expand macro="cv_splitter_options">
            <!-- Each group-based branch ends with the cv_groups selector. -->
            <when value="GroupKFold">
                <expand macro="cv_n_splits"/>
                <expand macro="cv_groups"/>
            </when>
            <when value="GroupShuffleSplit">
                <expand macro="cv_n_splits" value="5"/>
                <expand macro="cv_test_size"/>
                <expand macro="random_state"/>
                <expand macro="cv_groups"/>
            </when>
            <when value="LeaveOneGroupOut">
                <expand macro="cv_groups"/>
            </when>
            <when value="LeavePGroupsOut">
                <param argument="n_groups"
                       type="integer"
                       value=""
                       label="n_groups"
                       help="Number of groups (p) to leave out in the test split."/>
                <expand macro="cv_groups"/>
            </when>
        </expand>
    </conditional>
</xml>
950
<!-- Reduced cross-validation splitter chooser: only the splitters from
     cv_splitter, without any additions. The select label is configurable
     through the "label" token. -->
<xml name="cv_reduced" token_label="Select the cv splitter">
    <conditional name="cv_selector">
        <param name="selected_cv"
               type="select"
               label="@LABEL@">
            <expand macro="cv_splitter"/>
        </param>
        <expand macro="cv_splitter_options"/>
    </conditional>
</xml>
959
<!-- Integer n_splits parameter. The default value (3) and the help text can
     be overridden by the caller through the "value" and "help" tokens. -->
<xml name="cv_n_splits"
     token_value="3"
     token_help="Number of folds. Must be at least 2.">
    <param argument="n_splits"
           type="integer"
           value="@VALUE@"
           min="1"
           label="n_splits"
           help="@HELP@"/>
</xml>
963
<!-- Boolean "shuffle" switch, unchecked by default. -->
<xml name="cv_shuffle">
    <param argument="shuffle"
           type="boolean"
           checked="false"
           truevalue="booltrue"
           falsevalue="boolfalse"
           optional="true"
           label="Whether to shuffle data before splitting"/>
</xml>
967
<!-- Float test_size parameter. The default value (0.2) can be overridden by
     the caller through the "value" token. -->
<xml name="cv_test_size" token_value="0.2">
    <param argument="test_size"
           type="float"
           value="@VALUE@"
           min="0.0"
           label="Portion or number of the test set"
           help="0.0-1.0, proportion of the dataset to include in the test split; >1, integer only, the absolute number of test samples "/>
</xml>
971
<!-- Expanded section for choosing the groups input: a tabular dataset, a
     header switch, and a single-column selector built by expanding
     samples_column_selector_options with "_g"-suffixed names. -->
<xml name="cv_groups">
    <section name="groups_selector" title="Groups column selector" expanded="true">
        <param name="infile_g"
               type="data"
               format="tabular"
               label="Choose dataset containing groups info:"/>
        <param name="header_g"
               type="boolean"
               checked="False"
               truevalue="booltrue"
               falsevalue="boolfalse"
               optional="true"
               label="Does the dataset contain header:"/>
        <conditional name="column_selector_options_g">
            <expand macro="samples_column_selector_options"
                    column_option="selected_column_selector_option_g"
                    col_name="col_g"
                    multiple="False"
                    infile="infile_g"/>
        </conditional>
    </section>
</xml>
981
<!-- Conditional for choosing how to split data into train and test sets.
     Every branch offers the holdout size; the shuffling branches add
     random_state; the group branch makes the holdout size optional, accepts
     explicit group names and forwards <yield/> for caller-supplied content. -->
<xml name="train_test_split_params">
    <conditional name="split_algos">
        <param name="shuffle"
               type="select"
               label="Select the splitting method">
            <option value="None">No shuffle</option>
            <option value="simple" selected="true">ShuffleSplit</option>
            <option value="stratified">StratifiedShuffleSplit -- target values serve as class labels</option>
            <option value="group">GroupShuffleSplit or split by group names</option>
        </param>
        <when value="None">
            <expand macro="train_test_split_test_size"/>
        </when>
        <when value="simple">
            <expand macro="train_test_split_test_size"/>
            <expand macro="random_state"/>
        </when>
        <when value="stratified">
            <expand macro="train_test_split_test_size"/>
            <expand macro="random_state"/>
        </when>
        <when value="group">
            <expand macro="train_test_split_test_size" optional="true"/>
            <expand macro="random_state"/>
            <param argument="group_names"
                   type="text"
                   value=""
                   optional="true"
                   label="Type in group names instead"
                   help="For example: chr6, chr7. This parameter is optional. If used, it will override the holdout size and random seed."/>
            <yield/>
        </when>
    </conditional>
    <!--param argument="train_size" type="float" optional="True" value="" label="Train size:"/>-->
</xml>
1011
<!-- Float "Holdout size" parameter (default 0.2). Whether it is optional is
     controlled by the caller through the "optional" token, which defaults to
     false. -->
<xml name="train_test_split_test_size" token_optional="false">
    <param name="test_size" type="float" value="0.2" optional="@OPTIONAL@"
           label="Holdout size"
           help="Less than 1, for proportion; greater than 1 (integer), for number of samples."/>
</xml>
1015
<!-- Bare list of feature-selection algorithm <option> elements (SelectKBest
     is preselected), to be expanded inside a select parameter. The <yield/>
     lets the caller append further algorithms. -->
<xml name="feature_selection_algorithms">
    <option value="SelectKBest" selected="true">SelectKBest - Select features according to the k highest scores</option>
    <option value="GenericUnivariateSelect">GenericUnivariateSelect - Univariate feature selector with configurable strategy</option>
    <option value="SelectPercentile">SelectPercentile - Select features according to a percentile of the highest scores</option>
    <option value="SelectFpr">SelectFpr - Filter: Select the p-values below alpha based on a FPR test</option>
    <option value="SelectFdr">SelectFdr - Filter: Select the p-values for an estimated false discovery rate</option>
    <option value="SelectFwe">SelectFwe - Filter: Select the p-values corresponding to Family-wise error rate</option>
    <option value="VarianceThreshold">VarianceThreshold - Feature selector that removes all low-variance features</option>
    <option value="SelectFromModel">SelectFromModel - Meta-transformer for selecting features based on importance weights</option>
    <option value="RFE">RFE - Feature ranking with recursive feature elimination</option>
    <option value="RFECV">RFECV - Feature ranking with recursive feature elimination and cross-validated selection of the best number of features</option>
    <yield/>
</xml>
1029
<!-- <when> branches for the univariate selectors and VarianceThreshold.
     All branches except VarianceThreshold start with the shared score-function
     select, followed by a collapsed options section. -->
<xml name="feature_selection_algorithm_details">
    <when value="GenericUnivariateSelect">
        <expand macro="feature_selection_score_function"/>
        <section name="options" title="Advanced Options" expanded="False">
            <param argument="mode"
                   type="select"
                   label="Feature selection mode">
                <option value="percentile">percentile</option>
                <option value="k_best">k_best</option>
                <option value="fpr">fpr</option>
                <option value="fdr">fdr</option>
                <option value="fwe">fwe</option>
            </param>
            <param argument="param"
                   type="float"
                   value=""
                   optional="true"
                   label="Parameter of the corresponding mode"
                   help="float or int depending on the feature selection mode"/>
        </section>
    </when>
    <when value="SelectPercentile">
        <expand macro="feature_selection_score_function"/>
        <section name="options" title="Advanced Options" expanded="False">
            <param argument="percentile"
                   type="integer"
                   value="10"
                   optional="True"
                   label="Percent of features to keep"/>
        </section>
    </when>
    <when value="SelectKBest">
        <expand macro="feature_selection_score_function"/>
        <section name="options" title="Advanced Options" expanded="False">
            <param argument="k"
                   type="integer"
                   value="10"
                   optional="True"
                   label="Number of top features to select"
                   help="No 'all' option is supported."/>
        </section>
    </when>
    <when value="SelectFpr">
        <expand macro="feature_selection_score_function"/>
        <section name="options" title="Advanced Options" expanded="False">
            <param argument="alpha"
                   type="float"
                   value=""
                   optional="True"
                   label="Alpha"
                   help="The highest p-value for features to be kept."/>
        </section>
    </when>
    <when value="SelectFdr">
        <expand macro="feature_selection_score_function"/>
        <section name="options" title="Advanced Options" expanded="False">
            <param argument="alpha"
                   type="float"
                   value=""
                   optional="True"
                   label="Alpha"
                   help="The highest uncorrected p-value for features to keep."/>
        </section>
    </when>
    <when value="SelectFwe">
        <expand macro="feature_selection_score_function"/>
        <section name="options" title="Advanced Options" expanded="False">
            <param argument="alpha"
                   type="float"
                   value=""
                   optional="True"
                   label="Alpha"
                   help="The highest uncorrected p-value for features to keep."/>
        </section>
    </when>
    <when value="VarianceThreshold">
        <section name="options" title="Options" expanded="False">
            <param argument="threshold"
                   type="float"
                   value="0.0"
                   optional="True"
                   label="Threshold"
                   help="Features with a training-set variance lower than this threshold will be removed."/>
        </section>
    </when>
</xml>
1080
<!-- <when> branch for SelectFromModel. The estimator is either built from the
     estimator_selector_fs macro or loaded from a prefitted zip dataset; the
     shared SelectFromModel options follow. -->
<xml name="feature_selection_SelectFromModel">
    <when value="SelectFromModel">
        <conditional name="model_inputter">
            <param name="input_mode"
                   type="select"
                   label="Construct a new estimator from a selection list?">
                <option value="new" selected="true">Yes</option>
                <option value="prefitted">No. Load a prefitted estimator</option>
            </param>
            <when value="new">
                <expand macro="estimator_selector_fs"/>
            </when>
            <when value="prefitted">
                <param name="fitted_estimator"
                       type="data"
                       format="zip"
                       label="Load a prefitted estimator"/>
            </when>
        </conditional>
        <expand macro="feature_selection_SelectFromModel_options"/>
    </when>
</xml>
1098
<!-- <when> branch for SelectFromModel without the prefitted choice: the
     estimator is always built from the estimator_selector_all macro. -->
<xml name="feature_selection_SelectFromModel_no_prefitted">
    <when value="SelectFromModel">
        <conditional name="model_inputter">
            <param name="input_mode"
                   type="select"
                   label="Construct a new estimator from a selection list?">
                <option value="new" selected="true">Yes</option>
            </param>
            <when value="new">
                <expand macro="estimator_selector_all"/>
            </when>
        </conditional>
        <expand macro="feature_selection_SelectFromModel_options"/>
    </when>
</xml>
1112
<!-- Collapsed "Advanced Options" section shared by both SelectFromModel
     branches: threshold, norm_order and max_features. -->
<xml name="feature_selection_SelectFromModel_options">
    <section name="options" title="Advanced Options" expanded="False">
        <param argument="threshold"
               type="text"
               value=""
               optional="true"
               label="threshold"
               help="The threshold value to use for feature selection. e.g. 'mean', 'median', '1.25*mean'."/>
        <param argument="norm_order"
               type="integer"
               value="1"
               label="norm_order"
               help="Order of the norm used to filter the vectors of coefficients below threshold in the case where the coef_ attribute of the estimator is of dimension 2. "/>
        <param argument="max_features"
               type="integer"
               value=""
               optional="true"
               label="The maximum number of features selected scoring above threshold"
               help="To disable threshold and only select based on max_features, set threshold=-np.inf."/>
    </section>
</xml>
1120
<!-- <when> branch for RFE. Caller-supplied content is inserted at <yield/>,
     ahead of the collapsed options section. -->
<xml name="feature_selection_RFE">
    <when value="RFE">
        <yield/>
        <section name="options" title="Advanced Options" expanded="False">
            <param argument="n_features_to_select"
                   type="integer"
                   value=""
                   optional="true"
                   label="n_features_to_select"
                   help="The number of features to select. If None, half of the features are selected."/>
            <param argument="step"
                   type="float"
                   value="1"
                   optional="true"
                   label="step"
                   help="Default = 1. "/>
            <param argument="verbose"
                   type="integer"
                   value="0"
                   label="verbose"
                   help="Controls verbosity of output."/>
        </section>
    </when>
</xml>
1131
<!-- <when> branch for RFECV that uses the full "cv" chooser. Caller-supplied
     content is inserted at <yield/>, ahead of the options section. -->
<xml name="feature_selection_RFECV_fs">
    <when value="RFECV">
        <yield/>
        <section name="options" title="Advanced Options" expanded="False">
            <param argument="step"
                   type="float"
                   value="1"
                   optional="true"
                   label="step"
                   help="Default = 1. "/>
            <param argument="min_features_to_select"
                   type="integer"
                   value="1"
                   optional="true"
                   label="The minimum number of features to be selected"/>
            <expand macro="cv"/>
            <expand macro="scoring_selection"/>
            <param argument="verbose"
                   type="integer"
                   value="0"
                   label="verbose"
                   help="Controls verbosity of output."/>
        </section>
    </when>
</xml>
1144
<!-- <when> branch for RFECV that uses the reduced "cv_reduced" chooser.
     Caller-supplied content is inserted at <yield/>, ahead of the options
     section. -->
<xml name="feature_selection_RFECV_pipeline">
    <when value="RFECV">
        <yield/>
        <section name="options" title="Advanced Options" expanded="False">
            <param argument="step"
                   type="float"
                   value="1"
                   optional="true"
                   label="step"
                   help="Default = 1. "/>
            <param argument="min_features_to_select"
                   type="integer"
                   value="1"
                   optional="true"
                   label="The minimum number of features to be selected"/>
            <expand macro="cv_reduced"/>
            <!-- TODO: group splitter support-->
            <expand macro="scoring_selection"/>
            <param argument="verbose"
                   type="integer"
                   value="0"
                   label="verbose"
                   help="Controls verbosity of output."/>
        </section>
    </when>
</xml>
1158
<!-- <when> branch for DyRFECV. Unlike the RFECV branches, "step" is a text
     field whose sanitizer additionally allows square brackets, matching the
     help text that mentions list input. -->
<xml name="feature_selection_DyRFECV_fs">
    <when value="DyRFECV">
        <yield/>
        <section name="options" title="Advanced Options" expanded="False">
            <param argument="step"
                   type="text"
                   size="30"
                   value="1"
                   optional="true"
                   label="step"
                   help="Default = 1. Support float, int and list.">
                <sanitizer>
                    <valid initial="default">
                        <add value="["/>
                        <add value="]"/>
                    </valid>
                </sanitizer>
            </param>
            <param argument="min_features_to_select"
                   type="integer"
                   value="1"
                   optional="true"
                   label="The minimum number of features to be selected"/>
            <expand macro="cv"/>
            <expand macro="scoring_selection"/>
            <param argument="verbose"
                   type="integer"
                   value="0"
                   label="verbose"
                   help="Controls verbosity of output."/>
        </section>
    </when>
</xml>
1178
<!-- Feature-selection chooser in its pipeline variant: SelectFromModel
     without the prefitted choice, and RFE / RFECV fed from
     estimator_selector_all. -->
<xml name="feature_selection_pipeline">
    <!--compare to `feature_selection_fs`, no fitted estimator for SelectFromModel and no custom estimator for RFE and RFECV-->
    <conditional name="fs_algorithm_selector">
        <param name="selected_algorithm"
               type="select"
               label="Select a feature selection algorithm">
            <expand macro="feature_selection_algorithms"/>
        </param>
        <expand macro="feature_selection_algorithm_details"/>
        <expand macro="feature_selection_SelectFromModel_no_prefitted"/>
        <expand macro="feature_selection_RFE">
            <expand macro="estimator_selector_all"/>
        </expand>
        <expand macro="feature_selection_RFECV_pipeline">
            <expand macro="estimator_selector_all"/>
        </expand>
        <!-- TODO: add DyRFECV to pipeline-->
    </conditional>
</xml>
1196
<!-- Feature-selection chooser for the standalone tool: same `fs_algorithm_selector` conditional as the pipeline variant, plus an extra DyRFECV option passed into `feature_selection_algorithms`. RFE, RFECV and DyRFECV are each given `estimator_selector_fs`, the estimator selector that also offers a custom estimator. -->
1197 <xml name="feature_selection_fs">
1198 <conditional name="fs_algorithm_selector">
1199 <param name="selected_algorithm" type="select" label="Select a feature selection algorithm">
1200 <expand macro="feature_selection_algorithms">
1201 <option value="DyRFECV">DyRFECV - Extended RFECV with changeable steps</option>
1202 </expand>
1203 </param>
1204 <expand macro="feature_selection_algorithm_details"/>
1205 <expand macro="feature_selection_SelectFromModel"/>
1206 <expand macro="feature_selection_RFE">
1207 <expand macro="estimator_selector_fs"/>
1208 </expand>
1209 <expand macro="feature_selection_RFECV_fs">
1210 <expand macro="estimator_selector_fs"/>
1211 </expand>
1212 <expand macro="feature_selection_DyRFECV_fs">
1213 <expand macro="estimator_selector_fs"/>
1214 </expand>
1215 </conditional>
1216 </xml>
1217
<!-- Single select for the `score_func` argument, listing five score functions (chi2, f_classif, f_regression, mutual_info_classif, mutual_info_regression). No option is marked selected. -->
1218 <xml name="feature_selection_score_function">
1219 <param argument="score_func" type="select" label="Select a score function">
1220 <option value="chi2">chi2 - Compute chi-squared stats between each non-negative feature and class</option>
1221 <option value="f_classif">f_classif - Compute the ANOVA F-value for the provided sample</option>
1222 <option value="f_regression">f_regression - Univariate linear regression tests</option>
1223 <option value="mutual_info_classif">mutual_info_classif - Estimate mutual information for a discrete target variable</option>
1224 <option value="mutual_info_regression">mutual_info_regression - Estimate mutual information for a continuous target variable</option>
1225 </param>
1226 </xml>
1227
<!-- Options shared by the model-validation tools: the `cv` and `verbose` macros, then whatever the caller nests inside the expand (inserted at the yield). -->
1228 <xml name="model_validation_common_options">
1229 <expand macro="cv"/>
1230 <expand macro="verbose"/>
1231 <yield/>
1232 </xml>
1233
<!-- Primary-metric chooser. `default` has an empty branch; every other choice opens the secondary (multi-metric) select of its own family: classification, regression or anomaly detection. The <when> values mirror the option values one-to-one. -->
<!-- NOTE(review): the option values are presumably looked up as scorer names by the tool script, so they must match the registered names exactly; the weighted variants are spelled `precision_weighted` / `recall_weighted`. -->
1234 <xml name="scoring_selection">
1235 <conditional name="scoring">
1236 <param name="primary_scoring" type="select" multiple="false" label="Select the primary metric (scoring):" help="Metric to refit the best estimator.">
1237 <option value="default" selected="true">default with estimator</option>
1238 <option value="accuracy">Classification -- 'accuracy'</option>
1239 <option value="balanced_accuracy">Classification -- 'balanced_accuracy'</option>
1240 <option value="average_precision">Classification -- 'average_precision'</option>
1241 <option value="f1">Classification -- 'f1'</option>
1242 <option value="f1_micro">Classification -- 'f1_micro'</option>
1243 <option value="f1_macro">Classification -- 'f1_macro'</option>
1244 <option value="f1_weighted">Classification -- 'f1_weighted'</option>
1245 <option value="f1_samples">Classification -- 'f1_samples'</option>
1246 <option value="neg_log_loss">Classification -- 'neg_log_loss'</option>
1247 <option value="precision">Classification -- 'precision'</option>
1248 <option value="precision_micro">Classification -- 'precision_micro'</option>
1249 <option value="precision_macro">Classification -- 'precision_macro'</option>
1250 <option value="precision_weighted">Classification -- 'precision_weighted'</option>
1251 <option value="precision_samples">Classification -- 'precision_samples'</option>
1252 <option value="recall">Classification -- 'recall'</option>
1253 <option value="recall_micro">Classification -- 'recall_micro'</option>
1254 <option value="recall_macro">Classification -- 'recall_macro'</option>
1255 <option value="recall_weighted">Classification -- 'recall_weighted'</option>
1256 <option value="recall_samples">Classification -- 'recall_samples'</option>
1257 <option value="roc_auc">Classification -- 'roc_auc'</option>
1258 <option value="explained_variance">Regression -- 'explained_variance'</option>
1259 <option value="neg_mean_absolute_error">Regression -- 'neg_mean_absolute_error'</option>
1260 <option value="neg_mean_squared_error">Regression -- 'neg_mean_squared_error'</option>
1261 <option value="neg_mean_squared_log_error">Regression -- 'neg_mean_squared_log_error'</option>
1262 <option value="neg_median_absolute_error">Regression -- 'neg_median_absolute_error'</option>
1263 <option value="r2">Regression -- 'r2'</option>
1264 <option value="binarize_auc_scorer">anomaly detection -- binarize_auc_scorer</option>
1265 <option value="binarize_average_precision_scorer">anomaly detection -- binarize_average_precision_scorer</option>
1266 </param>
1267 <when value="default"/>
1268 <when value="accuracy"><expand macro="secondary_scoring_selection_classification"/></when>
1269 <when value="balanced_accuracy"><expand macro="secondary_scoring_selection_classification"/></when>
1270 <when value="average_precision"><expand macro="secondary_scoring_selection_classification"/></when>
1271 <when value="f1"><expand macro="secondary_scoring_selection_classification"/></when>
1272 <when value="f1_micro"><expand macro="secondary_scoring_selection_classification"/></when>
1273 <when value="f1_macro"><expand macro="secondary_scoring_selection_classification"/></when>
1274 <when value="f1_weighted"><expand macro="secondary_scoring_selection_classification"/></when>
1275 <when value="f1_samples"><expand macro="secondary_scoring_selection_classification"/></when>
1276 <when value="neg_log_loss"><expand macro="secondary_scoring_selection_classification"/></when>
1277 <when value="precision"><expand macro="secondary_scoring_selection_classification"/></when>
1278 <when value="precision_micro"><expand macro="secondary_scoring_selection_classification"/></when>
1279 <when value="precision_macro"><expand macro="secondary_scoring_selection_classification"/></when>
1280 <when value="precision_weighted"><expand macro="secondary_scoring_selection_classification"/></when>
1281 <when value="precision_samples"><expand macro="secondary_scoring_selection_classification"/></when>
1282 <when value="recall"><expand macro="secondary_scoring_selection_classification"/></when>
1283 <when value="recall_micro"><expand macro="secondary_scoring_selection_classification"/></when>
1284 <when value="recall_macro"><expand macro="secondary_scoring_selection_classification"/></when>
1285 <when value="recall_weighted"><expand macro="secondary_scoring_selection_classification"/></when>
1286 <when value="recall_samples"><expand macro="secondary_scoring_selection_classification"/></when>
1287 <when value="roc_auc"><expand macro="secondary_scoring_selection_classification"/></when>
1288 <when value="explained_variance"><expand macro="secondary_scoring_selection_regression"/></when>
1289 <when value="neg_mean_absolute_error"><expand macro="secondary_scoring_selection_regression"/></when>
1290 <when value="neg_mean_squared_error"><expand macro="secondary_scoring_selection_regression"/></when>
1291 <when value="neg_mean_squared_log_error"><expand macro="secondary_scoring_selection_regression"/></when>
1292 <when value="neg_median_absolute_error"><expand macro="secondary_scoring_selection_regression"/></when>
1293 <when value="r2"><expand macro="secondary_scoring_selection_regression"/></when>
1294 <when value="binarize_auc_scorer"><expand macro="secondary_scoring_selection_anormaly"/></when>
1295 <when value="binarize_average_precision_scorer"><expand macro="secondary_scoring_selection_anormaly"/></when>
1296 </conditional>
1297 </xml>
1298
<!-- Multi-select of additional classification metrics for multi-metric mode; per the help text, a metric equal to the primary one is ignored. -->
<!-- NOTE(review): values are presumably looked up as scorer names, so the weighted variants are spelled `precision_weighted` / `recall_weighted`. -->
1299 <xml name="secondary_scoring_selection_classification">
1300 <param name="secondary_scoring" type="select" multiple="true" label="Additional scoring used in multi-metric mode:" help="If the same metric with the primary is chosen, the metric will be ignored.">
1301 <option value="accuracy">Classification -- 'accuracy'</option>
1302 <option value="balanced_accuracy">Classification -- 'balanced_accuracy'</option>
1303 <option value="average_precision">Classification -- 'average_precision'</option>
1304 <option value="f1">Classification -- 'f1'</option>
1305 <option value="f1_micro">Classification -- 'f1_micro'</option>
1306 <option value="f1_macro">Classification -- 'f1_macro'</option>
1307 <option value="f1_weighted">Classification -- 'f1_weighted'</option>
1308 <option value="f1_samples">Classification -- 'f1_samples'</option>
1309 <option value="neg_log_loss">Classification -- 'neg_log_loss'</option>
1310 <option value="precision">Classification -- 'precision'</option>
1311 <option value="precision_micro">Classification -- 'precision_micro'</option>
1312 <option value="precision_macro">Classification -- 'precision_macro'</option>
1313 <option value="precision_weighted">Classification -- 'precision_weighted'</option>
1314 <option value="precision_samples">Classification -- 'precision_samples'</option>
1315 <option value="recall">Classification -- 'recall'</option>
1316 <option value="recall_micro">Classification -- 'recall_micro'</option>
1317 <option value="recall_macro">Classification -- 'recall_macro'</option>
1318 <option value="recall_weighted">Classification -- 'recall_weighted'</option>
1319 <option value="recall_samples">Classification -- 'recall_samples'</option>
1320 <option value="roc_auc">Classification -- 'roc_auc'</option>
1321 </param>
1322 </xml>
1323
<!-- Multi-select of additional regression metrics for multi-metric mode; expanded by the regression branches of `scoring_selection`. -->
1324 <xml name="secondary_scoring_selection_regression">
1325 <param name="secondary_scoring" type="select" multiple="true" label="Additional scoring used in multi-metric mode:" help="If the same metric with the primary is chosen, the metric will be ignored.">
1326 <option value="explained_variance">Regression -- 'explained_variance'</option>
1327 <option value="neg_mean_absolute_error">Regression -- 'neg_mean_absolute_error'</option>
1328 <option value="neg_mean_squared_error">Regression -- 'neg_mean_squared_error'</option>
1329 <option value="neg_mean_squared_log_error">Regression -- 'neg_mean_squared_log_error'</option>
1330 <option value="neg_median_absolute_error">Regression -- 'neg_median_absolute_error'</option>
1331 <option value="r2">Regression -- 'r2'</option>
1332 </param>
1333 </xml>
1334
<!-- Multi-select of additional anomaly-detection metrics for multi-metric mode. The macro name is spelled "anormaly"; `scoring_selection` expands it under exactly that name, so any rename has to change both places together. -->
1335 <xml name="secondary_scoring_selection_anormaly">
1336 <param name="secondary_scoring" type="select" multiple="true" label="Additional scoring used in multi-metric mode:" help="If the same metric with the primary is chosen, the metric will be ignored.">
1337 <option value="binarize_auc_scorer">anomaly detection -- binarize_auc_scorer</option>
1338 <option value="binarize_average_precision_scorer">anomaly detection -- binarize_average_precision_scorer</option>
1339 </param>
1340 </xml>
1341
<!-- `pre_dispatch` parameter whose type, default value and help text come from macro tokens; unless the caller overrides them it is a hidden param with value "all". -->
1342 <xml name="pre_dispatch" token_help="Number of predispatched jobs for parallel execution" token_default_value="all" token_type="hidden">
1343 <param type="@TYPE@" argument="pre_dispatch" label="pre_dispatch" value="@DEFAULT_VALUE@" optional="true" help="@HELP@"/>
1344 </xml>
1345
<!-- Inputs for a parameter search: the zipped estimator/pipeline dataset plus a builder section with 1 to 30 repeated (parameter name, search list) pairs. -->
1346 <xml name="search_cv_estimator">
1347 <param type="data" name="infile_estimator" format="zip" label="Choose the dataset containing pipeline/estimator object"/>
1348 <section title="Search parameters Builder" name="search_params_builder" expanded="true">
1349 <param type="data" name="infile_params" format="tabular" optional="true" label="Choose the dataset containing parameter names" help="This dataset could be the output of `get_params` in the `Estimator Attributes` tool."/>
1350 <repeat title="Parameter settings for search:" name="param_set" min="1" max="30">
<!-- Names are read from the `infile_params` dataset chosen above. -->
1351 <param type="select" name="sp_name" optional="true" label="Choose a parameter name (with current value)">
1352 <options startswith="@" from_dataset="infile_params">
1353 <column index="2" name="name"/>
1354 <column index="1" name="value"/>
1355 <filter name="unique_param" type="unique_value" column="1"/>
1356 </options>
1357 </param>
<!-- The search list is free text; quotes and square brackets are added to the default set of allowed characters. -->
1358 <param type="text" name="sp_list" value="" optional="true" label="Search list" help="list or array-like, for example: [1, 10, 100, 1000], [True, False] and ['auto', 'sqrt', None]. See `help` section for more examples">
1359 <sanitizer>
1360 <valid initial="default">
1361 <add value="&apos;"/>
1362 <add value="&quot;"/>
1363 <add value="["/>
1364 <add value="]"/>
1365 </valid>
1366 </sanitizer>
1367 </param>
1368 </repeat>
1369 </section>
1370 </xml>
1371
<!-- Estimator input plus a collapsed "Hyperparameter Swapping" section with 1 to 30 repeated (parameter name, new value) pairs. -->
1372 <xml name="estimator_and_hyperparameter">
1373 <param type="data" name="infile_estimator" format="zip" label="Choose the dataset containing pipeline/estimator object"/>
1374 <section title="Hyperparameter Swapping" name="hyperparams_swapping" expanded="false">
1375 <param type="data" name="infile_params" format="tabular" optional="true" label="Choose the dataset containing hyperparameters for the pipeline/estimator above" help="This dataset could be the output of `get_params` in the `Estimator Attributes` tool."/>
1376 <repeat title="New hyperparameter setting" name="param_set" min="1" max="30">
<!-- Names are read from the `infile_params` dataset chosen above. -->
1377 <param type="select" name="sp_name" optional="true" label="Choose a parameter name (with current value)">
1378 <options startswith="@" from_dataset="infile_params">
1379 <column index="2" name="name"/>
1380 <column index="1" name="value"/>
1381 <filter name="unique_param" type="unique_value" column="1"/>
1382 </options>
1383 </param>
<!-- The new value is free text; only the two quote characters are added to the default allowed set (no square brackets here). -->
1384 <param type="text" name="sp_value" value="" optional="true" label="New value" help="Supports int, float, boolean, single quoted string, and selected object constructor. Similar to the `Parameter settings for search` section in `searchcv` tool except that only single value is expected here.">
1385 <sanitizer>
1386 <valid initial="default">
1387 <add value="&apos;"/>
1388 <add value="&quot;"/>
1389 </valid>
1390 </sanitizer>
1391 </param>
1392 </repeat>
1393 </section>
1394 </xml>
1395
<!-- Options block for the search tools: metric selection, the shared validation options, then four boolean switches (iid, refit, error_score, return_train_score). Booleans are emitted as the strings "booltrue" / "boolfalse". -->
1396 <xml name="search_cv_options">
1397 <expand macro="scoring_selection"/>
1398 <expand macro="model_validation_common_options"/>
1399 <!--expand macro="pre_dispatch" default_value="2*n_jobs" help="Controls the number of jobs that get dispatched during parallel execution"/-->
1400 <param type="boolean" argument="iid" label="iid" checked="true" truevalue="booltrue" falsevalue="boolfalse" help="If True, data is identically distributed across the folds"/>
1401 <param type="boolean" argument="refit" label="refit" checked="true" truevalue="booltrue" falsevalue="boolfalse" help="Refit an estimator using the best found parameters on the whole dataset. Be aware that `refit=True` invokes extra computation, but it's REQUIRED for outputting the best estimator!"/>
1402 <param type="boolean" argument="error_score" label="Raise fit error:" checked="true" truevalue="booltrue" falsevalue="boolfalse" help="If false, the metric score is assigned to NaN if an error occurs in estimator fitting and FitFailedWarning is raised."/>
1403 <param type="boolean" argument="return_train_score" label="return_train_score" checked="false" truevalue="booltrue" falsevalue="boolfalse" help=""/>
1404 </xml>
1405
<!-- Option list for the estimator-module select: six sklearn modules plus xgboost, with svm preselected. The trailing yield lets a caller append further options (`estimator_selector_fs` adds `custom_estimator`). -->
1406 <xml name="estimator_module_options">
1407 <option value="svm" selected="true">sklearn.svm</option>
1408 <option value="linear_model">sklearn.linear_model</option>
1409 <option value="ensemble">sklearn.ensemble</option>
1410 <option value="naive_bayes">sklearn.naive_bayes</option>
1411 <option value="tree">sklearn.tree</option>
1412 <option value="neighbors">sklearn.neighbors</option>
1413 <option value="xgboost">xgboost</option>
1414 <yield/>
1415 </xml>
1416
<!-- One <when> branch per module value offered by `estimator_module_options` (svm, linear_model, ensemble, naive_bayes, tree, neighbors, xgboost). Each branch holds a `selected_estimator` select of class names followed by the free-text parameter box from `estimator_params_text`. The trailing yield lets a caller append further branches (`estimator_selector_fs` adds the `custom_estimator` branch). -->
1417 <xml name="estimator_suboptions">
1418 <when value="svm">
1419 <param name="selected_estimator" type="select" label="Choose estimator class:">
1420 <option value="LinearSVC" selected="true">LinearSVC</option>
1421 <option value="LinearSVR">LinearSVR</option>
1422 <option value="NuSVC">NuSVC</option>
1423 <option value="NuSVR">NuSVR</option>
1424 <option value="OneClassSVM">OneClassSVM</option>
1425 <option value="SVC">SVC</option>
1426 <option value="SVR">SVR</option>
1427 </param>
1428 <expand macro="estimator_params_text"/>
1429 </when>
1430 <when value="linear_model">
1431 <param name="selected_estimator" type="select" label="Choose estimator class:">
1432 <option value="ARDRegression" selected="true">ARDRegression</option>
1433 <option value="BayesianRidge">BayesianRidge</option>
1434 <option value="ElasticNet">ElasticNet</option>
1435 <option value="ElasticNetCV">ElasticNetCV</option>
1436 <option value="HuberRegressor">HuberRegressor</option>
1437 <option value="Lars">Lars</option>
1438 <option value="LarsCV">LarsCV</option>
1439 <option value="Lasso">Lasso</option>
1440 <option value="LassoCV">LassoCV</option>
1441 <option value="LassoLars">LassoLars</option>
1442 <option value="LassoLarsCV">LassoLarsCV</option>
1443 <option value="LassoLarsIC">LassoLarsIC</option>
1444 <option value="LinearRegression">LinearRegression</option>
1445 <option value="LogisticRegression">LogisticRegression</option>
1446 <option value="LogisticRegressionCV">LogisticRegressionCV</option>
1447 <option value="MultiTaskLasso">MultiTaskLasso</option>
1448 <option value="MultiTaskElasticNet">MultiTaskElasticNet</option>
1449 <option value="MultiTaskLassoCV">MultiTaskLassoCV</option>
1450 <option value="MultiTaskElasticNetCV">MultiTaskElasticNetCV</option>
1451 <option value="OrthogonalMatchingPursuit">OrthogonalMatchingPursuit</option>
1452 <option value="OrthogonalMatchingPursuitCV">OrthogonalMatchingPursuitCV</option>
1453 <option value="PassiveAggressiveClassifier">PassiveAggressiveClassifier</option>
1454 <option value="PassiveAggressiveRegressor">PassiveAggressiveRegressor</option>
1455 <option value="Perceptron">Perceptron</option>
1456 <option value="RANSACRegressor">RANSACRegressor</option>
1457 <option value="Ridge">Ridge</option>
1458 <option value="RidgeClassifier">RidgeClassifier</option>
1459 <option value="RidgeClassifierCV">RidgeClassifierCV</option>
1460 <option value="RidgeCV">RidgeCV</option>
1461 <option value="SGDClassifier">SGDClassifier</option>
1462 <option value="SGDRegressor">SGDRegressor</option>
1463 <option value="TheilSenRegressor">TheilSenRegressor</option>
1464 </param>
1465 <expand macro="estimator_params_text"/>
1466 </when>
1467 <when value="ensemble">
1468 <param name="selected_estimator" type="select" label="Choose estimator class:">
1469 <option value="AdaBoostClassifier" selected="true">AdaBoostClassifier</option>
1470 <option value="AdaBoostRegressor">AdaBoostRegressor</option>
1471 <option value="BaggingClassifier">BaggingClassifier</option>
1472 <option value="BaggingRegressor">BaggingRegressor</option>
1473 <option value="ExtraTreesClassifier">ExtraTreesClassifier</option>
1474 <option value="ExtraTreesRegressor">ExtraTreesRegressor</option>
1475 <option value="GradientBoostingClassifier">GradientBoostingClassifier</option>
1476 <option value="GradientBoostingRegressor">GradientBoostingRegressor</option>
1477 <option value="IsolationForest">IsolationForest</option>
1478 <option value="RandomForestClassifier">RandomForestClassifier</option>
1479 <option value="RandomForestRegressor">RandomForestRegressor</option>
1480 <option value="RandomTreesEmbedding">RandomTreesEmbedding</option>
1481 <!--option value="VotingClassifier">VotingClassifier</option-->
1482 </param>
1483 <expand macro="estimator_params_text"/>
1484 </when>
1485 <when value="naive_bayes">
1486 <param name="selected_estimator" type="select" label="Choose estimator class:">
1487 <option value="BernoulliNB" selected="true">BernoulliNB</option>
1488 <option value="GaussianNB">GaussianNB</option>
1489 <option value="MultinomialNB">MultinomialNB</option>
1490 </param>
1491 <expand macro="estimator_params_text"/>
1492 </when>
1493 <when value="tree">
1494 <param name="selected_estimator" type="select" label="Choose estimator class:">
1495 <option value="DecisionTreeClassifier" selected="true">DecisionTreeClassifier</option>
1496 <option value="DecisionTreeRegressor">DecisionTreeRegressor</option>
1497 <option value="ExtraTreeClassifier">ExtraTreeClassifier</option>
1498 <option value="ExtraTreeRegressor">ExtraTreeRegressor</option>
1499 </param>
1500 <expand macro="estimator_params_text"/>
1501 </when>
1502 <when value="neighbors">
1503 <param name="selected_estimator" type="select" label="Choose estimator class:">
1504 <option value="KNeighborsClassifier" selected="true">KNeighborsClassifier</option>
1505 <option value="KNeighborsRegressor">KNeighborsRegressor</option>
1506 <!--option value="BallTree">BallTree</option-->
1507 <!--option value="KDTree">KDTree</option-->
1508 <option value="KernelDensity">KernelDensity</option>
1509 <option value="LocalOutlierFactor">LocalOutlierFactor</option>
1510 <option value="RadiusNeighborsClassifier">RadiusNeighborsClassifier</option>
1511 <option value="RadiusNeighborsRegressor">RadiusNeighborsRegressor</option>
1512 <option value="NearestCentroid">NearestCentroid</option>
1513 <option value="NearestNeighbors">NearestNeighbors</option>
1514 </param>
1515 <expand macro="estimator_params_text"/>
1516 </when>
1517 <when value="xgboost">
1518 <param name="selected_estimator" type="select" label="Choose estimator class:">
1519 <option value="XGBRegressor" selected="true">XGBRegressor</option>
1520 <option value="XGBClassifier">XGBClassifier</option>
1521 </param>
1522 <expand macro="estimator_params_text"/>
1523 </when>
1524 <yield/>
1525 </xml>
1526
<!-- Estimator chooser limited to the built-in modules: a module select filled from `estimator_module_options`, then the per-module branches from `estimator_suboptions`. Nothing is passed into either macro's yield. -->
1527 <xml name="estimator_selector_all">
1528 <conditional name="estimator_selector">
1529 <param type="select" name="selected_module" label="Choose the module that contains target estimator:">
1530 <expand macro="estimator_module_options"/>
1531 </param>
1532 <expand macro="estimator_suboptions"/>
1533 </conditional>
1534 </xml>
1535
<!-- Estimator chooser that also accepts a user-supplied estimator: it passes an extra `custom_estimator` option into the module list and a matching <when> branch, holding a zip dataset input, into the sub-options. -->
1536 <xml name="estimator_selector_fs">
1537 <conditional name="estimator_selector">
1538 <param type="select" name="selected_module" label="Choose the module that contains target estimator:">
1539 <expand macro="estimator_module_options">
1540 <option value="custom_estimator">Load a custom estimator</option>
1541 </expand>
1542 </param>
1543 <expand macro="estimator_suboptions">
1544 <when value="custom_estimator">
1545 <param type="data" name="c_estimator" format="zip" label="Choose the dataset containing the custom estimator or pipeline:"/>
1546 </when>
1547 </expand>
1548 </conditional>
1549 </xml>
1550
<!-- Optional free-text box `text_params` for keyword settings. Label, default value and help text are macro tokens that callers may override; the sanitizer adds the single quote to the default set of allowed characters. -->
1551 <xml name="estimator_params_text" token_default_value="" token_label="Type in parameter settings if different from default:"
1552 token_help="Dictionary-capable, e.g., C=1, kernel='linear'. No double quotes. Leave this box blank for default estimator.">
1553 <param type="text" name="text_params" label="@LABEL@" value="@DEFAULT_VALUE@" optional="true" help="@HELP@">
1554 <sanitizer>
1555 <valid initial="default">
1556 <add value="&apos;"/>
1557 </valid>
1558 </sanitizer>
1559 </param>
1560 </xml>
1561
<!-- Kernel-approximation chooser: a select of four algorithms (Nystroem preselected). Each branch reuses the `estimator_params_text` box, overriding only its help token with that algorithm's default settings. -->
1562 <xml name="kernel_approximation_all">
1563 <conditional name="kernel_approximation_selector">
1564 <param name="select_algorithm" type="select" label="Choose a kernel approximation algorithm:">
1565 <option value="Nystroem" selected="true">Nystroem</option>
1566 <option value="RBFSampler">RBFSampler</option>
1567 <option value="AdditiveChi2Sampler">AdditiveChi2Sampler</option>
1568 <option value="SkewedChi2Sampler">SkewedChi2Sampler</option>
1569 </param>
1570 <when value="Nystroem">
1571 <expand macro="estimator_params_text"
1572 help="Default(=blank): coef0=None, degree=None, gamma=None, kernel='rbf', kernel_params=None, n_components=100, random_state=None. No double quotes"/>
1573 </when>
1574 <when value="RBFSampler">
1575 <expand macro="estimator_params_text"
1576 help="Default(=blank): gamma=1.0, n_components=100, random_state=None."/>
1577 </when>
1578 <when value="AdditiveChi2Sampler">
1579 <expand macro="estimator_params_text"
1580 help="Default(=blank): sample_interval=None, sample_steps=2."/>
1581 </when>
1582 <when value="SkewedChi2Sampler">
1583 <expand macro="estimator_params_text"
1584 help="Default(=blank): n_components=100, random_state=None, skewedness=1.0."/>
1585 </when>
1586 </conditional>
1587 </xml>
1588
<!-- Matrix-decomposition chooser: a select of twelve algorithms (DictionaryLearning preselected; SparseCoder is commented out). Each branch reuses the `estimator_params_text` box, overriding only its help token with that algorithm's default settings. -->
<!-- NOTE(review): the default listings in the help strings are hand-maintained text; confirm them against the pinned library version before relying on them. -->
1589 <xml name="matrix_decomposition_all">
1590 <conditional name="matrix_decomposition_selector">
1591 <param name="select_algorithm" type="select" label="Choose a matrix decomposition algorithm:">
1592 <option value="DictionaryLearning" selected="true">DictionaryLearning</option>
1593 <option value="FactorAnalysis">FactorAnalysis</option>
1594 <option value="FastICA">FastICA</option>
1595 <option value="IncrementalPCA">IncrementalPCA</option>
1596 <option value="KernelPCA">KernelPCA</option>
1597 <option value="LatentDirichletAllocation">LatentDirichletAllocation</option>
1598 <option value="MiniBatchDictionaryLearning">MiniBatchDictionaryLearning</option>
1599 <option value="MiniBatchSparsePCA">MiniBatchSparsePCA</option>
1600 <option value="NMF">NMF</option>
1601 <option value="PCA">PCA</option>
1602 <option value="SparsePCA">SparsePCA</option>
1603 <!--option value="SparseCoder">SparseCoder</option-->
1604 <option value="TruncatedSVD">TruncatedSVD</option>
1605 </param>
1606 <when value="DictionaryLearning">
1607 <expand macro="estimator_params_text"
1608 help="Default(=blank): alpha=1, code_init=None, dict_init=None, fit_algorithm='lars', max_iter=1000, n_components=None, random_state=None, split_sign=False, tol=1e-08, transform_algorithm='omp', transform_alpha=None, transform_n_nonzero_coefs=None, verbose=False."/>
1609 </when>
1610 <when value="FactorAnalysis">
1611 <expand macro="estimator_params_text"
1612 help="Default(=blank): copy=True, iterated_power=3, max_iter=1000, n_components=None, noise_variance_init=None, random_state=0, svd_method='randomized', tol=0.01."/>
1613 </when>
1614 <when value="FastICA">
1615 <expand macro="estimator_params_text"
1616 help="Default(=blank): algorithm='parallel', fun='logcosh', fun_args=None, max_iter=200, n_components=None, random_state=None, tol=0.0001, w_init=None, whiten=True. No double quotes."/>
1617 </when>
1618 <when value="IncrementalPCA">
1619 <expand macro="estimator_params_text"
1620 help="Default(=blank): batch_size=None, copy=True, n_components=None, whiten=False."/>
1621 </when>
1622 <when value="KernelPCA">
1623 <expand macro="estimator_params_text"
1624 help="Default(=blank): alpha=1.0, coef0=1, copy_X=True, degree=3, eigen_solver='auto', fit_inverse_transform=False, gamma=None, kernel='linear', kernel_params=None, max_iter=None, n_components=None, random_state=None, remove_zero_eig=False, tol=0. No double quotes."/>
1625 </when>
1626 <when value="LatentDirichletAllocation">
1627 <expand macro="estimator_params_text"
1628 help="Default(=blank): batch_size=128, doc_topic_prior=None, evaluate_every=-1, learning_decay=0.7, learning_method=None, learning_offset=10.0, max_doc_update_iter=100, max_iter=10, mean_change_tol=0.001, n_components=10, n_topics=None, perp_tol=0.1, random_state=None, topic_word_prior=None, total_samples=1000000.0, verbose=0."/>
1629 </when>
1630 <when value="MiniBatchDictionaryLearning">
1631 <expand macro="estimator_params_text"
1632 help="Default(=blank): alpha=1, batch_size=3, dict_init=None, fit_algorithm='lars', n_components=None, n_iter=1000, random_state=None, shuffle=True, split_sign=False, transform_algorithm='omp', transform_alpha=None, transform_n_nonzero_coefs=None, verbose=False."/>
1633 </when>
1634 <when value="MiniBatchSparsePCA">
1635 <expand macro="estimator_params_text"
1636 help="Default(=blank): alpha=1, batch_size=3, callback=None, method='lars', n_components=None, n_iter=100, random_state=None, ridge_alpha=0.01, shuffle=True, verbose=False."/>
1637 </when>
1638 <when value="NMF">
1639 <expand macro="estimator_params_text"
1640 help="Default(=blank): alpha=0.0, beta_loss='frobenius', init=None, l1_ratio=0.0, max_iter=200, n_components=None, random_state=None, shuffle=False, solver='cd', tol=0.0001, verbose=0."/>
1641 </when>
1642 <when value="PCA">
1643 <expand macro="estimator_params_text"
1644 help="Default(=blank): copy=True, iterated_power='auto', n_components=None, random_state=None, svd_solver='auto', tol=0.0, whiten=False."/>
1645 </when>
1646 <when value="SparsePCA">
1647 <expand macro="estimator_params_text"
1648 help="Default(=blank): U_init=None, V_init=None, alpha=1, max_iter=1000, method='lars', n_components=None, random_state=None, ridge_alpha=0.01, tol=1e-08, verbose=False."/>
1649 </when>
1650 <when value="TruncatedSVD">
1651 <expand macro="estimator_params_text"
1652 help="Default(=blank): algorithm='randomized', n_components=2, n_iter=5, random_state=None, tol=0.0."/>
1653 </when>
1654 </conditional>
1655 </xml>
1656
<!-- Single-choice conditional for FeatureAgglomeration: the select has one preselected option, and its branch shows the `estimator_params_text` box with the algorithm's default settings as help text. -->
1657 <xml name="FeatureAgglomeration">
1658 <conditional name="FeatureAgglomeration_selector">
1659 <param name="select_algorithm" type="select" label="Choose the algorithm:">
1660 <option value="FeatureAgglomeration" selected="true">FeatureAgglomeration</option>
1661 </param>
1662 <when value="FeatureAgglomeration">
1663 <expand macro="estimator_params_text"
1664 help="Default(=blank): affinity='euclidean', compute_full_tree='auto', connectivity=None, linkage='ward', memory=None, n_clusters=2, pooling_func=np.mean."/>
1665 </when>
1666 </conditional>
1667 </xml>
1668
<!-- Chooser for five Relief-family algorithms (ReliefF, SURF, SURFstar, MultiSURF, MultiSURFstar); no option is marked selected. Each branch shows the `estimator_params_text` box with that algorithm's defaults as help text. TuRF is disabled in both the option list and the branches. -->
1669 <xml name="skrebate">
1670 <conditional name="skrebate_selector">
1671 <param name="select_algorithm" type="select" label="Choose the algorithm:">
1672 <option value="ReliefF">ReliefF</option>
1673 <option value="SURF">SURF</option>
1674 <option value="SURFstar">SURFstar</option>
1675 <option value="MultiSURF">MultiSURF</option>
1676 <option value="MultiSURFstar">MultiSURFstar</option>
1677 <!--option value="TuRF">TuRF</option> -->
1678 </param>
1679 <when value="ReliefF">
1680 <expand macro="estimator_params_text"
1681 help="Default(=blank): discrete_threshold=10, n_features_to_select=10, n_neighbors=100, verbose=False."/>
1682 </when>
1683 <when value="SURF">
1684 <expand macro="estimator_params_text"
1685 help="Default(=blank): discrete_threshold=10, n_features_to_select=10, verbose=False."/>
1686 </when>
1687 <when value="SURFstar">
1688 <expand macro="estimator_params_text"
1689 help="Default(=blank): discrete_threshold=10, n_features_to_select=10, verbose=False."/>
1690 </when>
1691 <when value="MultiSURF">
1692 <expand macro="estimator_params_text"
1693 help="Default(=blank): discrete_threshold=10, n_features_to_select=10, verbose=False."/>
1694 </when>
1695 <when value="MultiSURFstar">
1696 <expand macro="estimator_params_text"
1697 help="Default(=blank): discrete_threshold=10, n_features_to_select=10, verbose=False."/>
1698 </when>
1699 <!--when value="TuRF">
1700 <expand macro="estimator_params_text"
1701 help="Default(=blank): core_algorithm='ReliefF', discrete_threshold=10, n_features_to_select=10, n_neighbors=100, pct=0.5, verbose=False."/>
1702 </when> -->
1703 </conditional>
1704 </xml>
1705
<!--
    imbalanced_learn_sampling: selector for a resampling algorithm.

    Renders a conditional named "imblearn_selector". Its select parameter
    "select_algorithm" lists the under_sampling.*, over_sampling.* and
    combine.* samplers plus "Z_RandomOverSampler" (labelled "for regression").
    Every <when> branch expands the "estimator_params_text" macro (defined
    elsewhere in this file) and passes only a help string listing the
    defaults that apply when the field is left blank.
-->
<xml name="imbalanced_learn_sampling">
    <conditional name="imblearn_selector">
        <param name="select_algorithm" type="select" label="Choose the algorithm:">
            <option value="under_sampling.ClusterCentroids" selected="true">under_sampling.ClusterCentroids</option>
            <option value="under_sampling.CondensedNearestNeighbour">under_sampling.CondensedNearestNeighbour</option>
            <option value="under_sampling.EditedNearestNeighbours">under_sampling.EditedNearestNeighbours</option>
            <option value="under_sampling.RepeatedEditedNearestNeighbours">under_sampling.RepeatedEditedNearestNeighbours</option>
            <option value="under_sampling.AllKNN">under_sampling.AllKNN</option>
            <option value="under_sampling.InstanceHardnessThreshold">under_sampling.InstanceHardnessThreshold</option>
            <option value="under_sampling.NearMiss">under_sampling.NearMiss</option>
            <option value="under_sampling.NeighbourhoodCleaningRule">under_sampling.NeighbourhoodCleaningRule</option>
            <option value="under_sampling.OneSidedSelection">under_sampling.OneSidedSelection</option>
            <option value="under_sampling.RandomUnderSampler">under_sampling.RandomUnderSampler</option>
            <option value="under_sampling.TomekLinks">under_sampling.TomekLinks</option>
            <option value="over_sampling.ADASYN">over_sampling.ADASYN</option>
            <option value="over_sampling.RandomOverSampler">over_sampling.RandomOverSampler</option>
            <option value="over_sampling.SMOTE">over_sampling.SMOTE</option>
            <option value="over_sampling.SVMSMOTE">over_sampling.SVMSMOTE</option>
            <option value="over_sampling.BorderlineSMOTE">over_sampling.BorderlineSMOTE</option>
            <option value="over_sampling.SMOTENC">over_sampling.SMOTENC</option>
            <option value="combine.SMOTEENN">combine.SMOTEENN</option>
            <option value="combine.SMOTETomek">combine.SMOTETomek</option>
            <option value="Z_RandomOverSampler">Z_RandomOverSampler - for regression</option>
        </param>
        <when value="under_sampling.ClusterCentroids">
            <expand macro="estimator_params_text"
                    help="Default(=blank): sampling_strategy='auto', random_state=None, estimator=None, voting='auto'."/>
        </when>
        <when value="under_sampling.CondensedNearestNeighbour">
            <expand macro="estimator_params_text"
                    help="Default(=blank): sampling_strategy='auto', random_state=None, n_neighbors=None, n_seeds_S=1."/>
        </when>
        <!-- max_iter is only a parameter of the Repeated variant below, so it is not advertised here. -->
        <when value="under_sampling.EditedNearestNeighbours">
            <expand macro="estimator_params_text"
                    help="Default(=blank): sampling_strategy='auto', random_state=None, n_neighbors=3, kind_sel='all'."/>
        </when>
        <when value="under_sampling.RepeatedEditedNearestNeighbours">
            <expand macro="estimator_params_text"
                    help="Default(=blank): sampling_strategy='auto', random_state=None, n_neighbors=3, max_iter=100, kind_sel='all'."/>
        </when>
        <when value="under_sampling.AllKNN">
            <expand macro="estimator_params_text"
                    help="Default(=blank): sampling_strategy='auto', random_state=None, n_neighbors=3, kind_sel='all', allow_minority=False."/>
        </when>
        <when value="under_sampling.InstanceHardnessThreshold">
            <expand macro="estimator_params_text"
                    help="Default(=blank): estimator=None, sampling_strategy='auto', random_state=None, cv=5."/>
        </when>
        <when value="under_sampling.NearMiss">
            <expand macro="estimator_params_text"
                    help="Default(=blank): sampling_strategy='auto', random_state=None, version=1, n_neighbors=3, n_neighbors_ver3=3."/>
        </when>
        <when value="under_sampling.NeighbourhoodCleaningRule">
            <expand macro="estimator_params_text"
                    help="Default(=blank): sampling_strategy='auto', random_state=None, n_neighbors=3, kind_sel='all', threshold_cleaning=0.5."/>
        </when>
        <when value="under_sampling.OneSidedSelection">
            <expand macro="estimator_params_text"
                    help="Default(=blank): sampling_strategy='auto', random_state=None, n_neighbors=None, n_seeds_S=1."/>
        </when>
        <when value="under_sampling.RandomUnderSampler">
            <expand macro="estimator_params_text"
                    help="Default(=blank): sampling_strategy='auto', random_state=None, replacement=False."/>
        </when>
        <when value="under_sampling.TomekLinks">
            <expand macro="estimator_params_text"
                    help="Default(=blank): sampling_strategy='auto', random_state=None."/>
        </when>
        <when value="over_sampling.ADASYN">
            <expand macro="estimator_params_text"
                    help="Default(=blank): sampling_strategy='auto', random_state=None, n_neighbors=5."/>
        </when>
        <when value="over_sampling.RandomOverSampler">
            <expand macro="estimator_params_text"
                    help="Default(=blank): sampling_strategy='auto', random_state=None."/>
        </when>
        <when value="over_sampling.SMOTE">
            <expand macro="estimator_params_text"
                    help="Default(=blank): sampling_strategy='auto', random_state=None, k_neighbors=5."/>
        </when>
        <when value="over_sampling.SVMSMOTE">
            <expand macro="estimator_params_text"
                    help="Default(=blank): sampling_strategy='auto', k_neighbors=5, m_neighbors=10, out_step=0.5, random_state=None, svm_estimator=None."/>
        </when>
        <when value="over_sampling.BorderlineSMOTE">
            <expand macro="estimator_params_text"
                    help="Default(=blank): sampling_strategy='auto', k_neighbors=5, kind='borderline-1', m_neighbors=10, random_state=None."/>
        </when>
        <!-- Unlike its siblings, this help string reads "Default:" rather than "Default(=blank):". -->
        <when value="over_sampling.SMOTENC">
            <expand macro="estimator_params_text"
                    help="Default: categorical_features=[], sampling_strategy='auto', random_state=None, k_neighbors=5."/>
        </when>
        <when value="combine.SMOTEENN">
            <expand macro="estimator_params_text"
                    help="Default(=blank): sampling_strategy='auto', random_state=None, smote=None, enn=None."/>
        </when>
        <when value="combine.SMOTETomek">
            <expand macro="estimator_params_text"
                    help="Default(=blank): sampling_strategy='auto', random_state=None, smote=None, tomek=None."/>
        </when>
        <when value="Z_RandomOverSampler">
            <expand macro="estimator_params_text"
                    help="Default(=blank): sampling_strategy='auto', random_state=None, negative_thres=0, positive_thres=-1."/>
        </when>
    </conditional>
</xml>
1812
<!--
    stacking_ensemble_inputs: collapsed "Advanced Options" section.

    Content supplied by the expanding tool is inserted first (at <yield/>),
    followed by two boolean flags that are unchecked by default and emit the
    literal values "booltrue" / "boolfalse".
-->
<xml name="stacking_ensemble_inputs">
    <section name="options" title="Advanced Options" expanded="false">
        <yield/>
        <param argument="use_features_in_secondary"
               type="boolean"
               checked="false"
               truevalue="booltrue"
               falsevalue="boolfalse"/>
        <param argument="store_train_meta_features"
               type="boolean"
               checked="false"
               truevalue="booltrue"
               falsevalue="boolfalse"/>
    </section>
</xml>
1820
<!--
    stacking_base_estimator: estimator chooser with an extra "custom" entry.

    Wraps the "estimator_module_options" and "estimator_suboptions" macros
    (both defined elsewhere in this file). It passes each of them one extra
    child: an additional <option> "custom_estimator" and the matching <when>
    branch, which asks for a zip dataset holding the custom estimator or
    pipeline.
-->
<xml name="stacking_base_estimator">
    <conditional name="estimator_selector">
        <param name="selected_module"
               type="select"
               label="Choose the module that contains target estimator:">
            <expand macro="estimator_module_options">
                <option value="custom_estimator">Load a custom estimator</option>
            </expand>
        </param>
        <expand macro="estimator_suboptions">
            <when value="custom_estimator">
                <param name="c_estimator"
                       type="data"
                       format="zip"
                       label="Choose the dataset containing the custom estimator or pipeline"/>
            </when>
        </expand>
    </conditional>
</xml>
1835
<!--
    stacking_voting_weights: collapsed "Advanced Options" section that opens
    with an optional free-text "weights" parameter (initial value "[]").
    The sanitizer starts from the default set of valid characters and
    additionally allows the square brackets, so a list literal is accepted.
    Content supplied by the expanding tool is appended after the parameter
    (at <yield/>).
-->
<xml name="stacking_voting_weights">
    <section name="options" title="Advanced Options" expanded="false">
        <param argument="weights"
               type="text"
               value="[]"
               optional="true"
               help="Sequence of weights (float or int). Uses uniform weights if None (`[]`).">
            <sanitizer>
                <valid initial="default">
                    <add value="["/>
                    <add value="]"/>
                </valid>
            </sanitizer>
        </param>
        <yield/>
    </section>
</xml>
1849
<!--
    preprocessors_sequence_encoders: chooser for the sequence encoder class.

    Both choices (GenomeOneHotEncoder, ProteinOneHotEncoder) expose the same
    arguments by expanding "preprocessors_sequence_encoder_arguments".
    Neither option is marked selected.
-->
<xml name="preprocessors_sequence_encoders">
    <conditional name="encoder_selection">
        <param name="encoder_type"
               type="select"
               label="Choose the sequence encoder class">
            <option value="GenomeOneHotEncoder">GenomeOneHotEncoder</option>
            <option value="ProteinOneHotEncoder">ProteinOneHotEncoder</option>
        </param>
        <when value="GenomeOneHotEncoder">
            <expand macro="preprocessors_sequence_encoder_arguments"/>
        </when>
        <when value="ProteinOneHotEncoder">
            <expand macro="preprocessors_sequence_encoder_arguments"/>
        </when>
    </conditional>
</xml>
1864
<!--
    preprocessors_sequence_encoder_arguments: the two arguments shared by the
    sequence encoder choices: an optional, non-negative integer "seq_length"
    (empty by default) and a boolean "padding" that is checked by default.
-->
<xml name="preprocessors_sequence_encoder_arguments">
    <param argument="seq_length"
           type="integer"
           value=""
           min="0"
           optional="true"
           help="Integer. Sequence length"/>
    <param argument="padding"
           type="boolean"
           checked="true"
           truevalue="booltrue"
           falsevalue="boolfalse"
           help="Whether to pad or truncate sequence to meet the sequence length."/>
</xml>
1869
1870 <!-- Outputs -->
1871
<!--
    output: the two mutually exclusive outputs of a train/predict tool.

    The filters read selected_tasks['selected_task']: "load" yields the
    tabular prediction file, "train" yields the zipped fitted model. The
    model's label is built from the tool name and the selected algorithm.
-->
<xml name="output">
    <outputs>
        <data name="outfile_predict" format="tabular">
            <filter>selected_tasks['selected_task'] == 'load'</filter>
        </data>
        <data name="outfile_fit"
              format="zip"
              label="${tool.name}.${selected_tasks.selected_algorithms.selected_algorithm}">
            <filter>selected_tasks['selected_task'] == 'train'</filter>
        </data>
    </outputs>
</xml>
1882
1883 <!--Citations-->
<!-- eden_citation: complete <citations> block holding a single DOI citation. -->
<xml name="eden_citation">
    <citations>
        <citation type="doi">10.5281/zenodo.15094</citation>
    </citations>
</xml>
1889
<!--
    sklearn_citation: <citations> block with the scikit-learn JMLR article.
    The trailing <yield/> lets the expanding tool append further <citation>
    elements inside the same block.
-->
<xml name="sklearn_citation">
    <citations>
        <citation type="bibtex">
            @article{scikit-learn,
                title={Scikit-learn: Machine Learning in {P}ython},
                author={Pedregosa, F. and Varoquaux, G. and Gramfort, A. and Michel, V.
                        and Thirion, B. and Grisel, O. and Blondel, M. and Prettenhofer, P.
                        and Weiss, R. and Dubourg, V. and Vanderplas, J. and Passos, A. and
                        Cournapeau, D. and Brucher, M. and Perrot, M. and Duchesnay, E.},
                journal={Journal of Machine Learning Research},
                volume={12},
                pages={2825--2830},
                year={2011}
            }
        </citation>
        <yield/>
    </citations>
</xml>
1908
<!--
    scipy_citation: complete <citations> block with the SciPy reference.
    The BibTeX entry carries an explicit citation key ("scipy"); an entry
    with an empty key is rejected or flagged by strict BibTeX parsers.
-->
<xml name="scipy_citation">
    <citations>
        <citation type="bibtex">
            @Misc{scipy,
                author = {Eric Jones and Travis Oliphant and Pearu Peterson and others},
                title = {{SciPy}: Open source scientific tools for {Python}},
                year = {2001--},
                url = "http://www.scipy.org/",
                note = {[Online; accessed 2016-04-09]}
            }
        </citation>
    </citations>
</xml>
1922
<!--
    skrebate_citation: a bare <citation> element without a <citations>
    wrapper. Presumably meant to be expanded inside a macro that provides
    the wrapper; confirm against the callers.
-->
<xml name="skrebate_citation">
    <citation type="bibtex">
        @article{DBLP:journals/corr/abs-1711-08477,
            author = {Ryan J. Urbanowicz and
                      Randal S. Olson and
                      Peter Schmitt and
                      Melissa Meeker and
                      Jason H. Moore},
            title = {Benchmarking Relief-Based Feature Selection Methods},
            journal = {CoRR},
            volume = {abs/1711.08477},
            year = {2017},
            url = {http://arxiv.org/abs/1711.08477},
            archivePrefix = {arXiv},
            eprint = {1711.08477},
            timestamp = {Mon, 13 Aug 2018 16:46:04 +0200},
            biburl = {https://dblp.org/rec/bib/journals/corr/abs-1711-08477},
            bibsource = {dblp computer science bibliography, https://dblp.org}
        }
    </citation>
</xml>
1944
<!--
    xgboost_citation: a bare <citation> element (no <citations> wrapper)
    with the XGBoost KDD '16 paper.
-->
<xml name="xgboost_citation">
    <citation type="bibtex">
        @inproceedings{Chen:2016:XST:2939672.2939785,
            author = {Chen, Tianqi and Guestrin, Carlos},
            title = {{XGBoost}: A Scalable Tree Boosting System},
            booktitle = {Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining},
            series = {KDD '16},
            year = {2016},
            isbn = {978-1-4503-4232-2},
            location = {San Francisco, California, USA},
            pages = {785--794},
            numpages = {10},
            url = {http://doi.acm.org/10.1145/2939672.2939785},
            doi = {10.1145/2939672.2939785},
            acmid = {2939785},
            publisher = {ACM},
            address = {New York, NY, USA},
            keywords = {large-scale machine learning},
        }
    </citation>
</xml>
1966
<!--
    imblearn_citation: a bare <citation> element (no <citations> wrapper)
    with the imbalanced-learn JMLR article. The page range uses the BibTeX
    double-hyphen form, matching the other entries in this file.
-->
<xml name="imblearn_citation">
    <citation type="bibtex">
        @article{JMLR:v18:16-365,
            author = {Guillaume Lema{{\^i}}tre and Fernando Nogueira and Christos K. Aridas},
            title = {Imbalanced-learn: A Python Toolbox to Tackle the Curse of Imbalanced Datasets in Machine Learning},
            journal = {Journal of Machine Learning Research},
            year = {2017},
            volume = {18},
            number = {17},
            pages = {1--5},
            url = {http://jmlr.org/papers/v18/16-365.html}
        }
    </citation>
</xml>
1981
<!--
    selene_citation: a bare <citation> element (no <citations> wrapper)
    with the Selene article.
    NOTE(review): "pages" holds a single number (315); confirm whether a
    full page range was intended.
-->
<xml name="selene_citation">
    <citation type="bibtex">
        @article{chen2019selene,
            title={Selene: a PyTorch-based deep learning library for sequence data},
            author={Chen, Kathleen M and Cofer, Evan M and Zhou, Jian and Troyanskaya, Olga G},
            journal={Nature methods},
            volume={16},
            number={4},
            pages={315},
            year={2019},
            publisher={Nature Publishing Group}
        }
    </citation>
</xml>
1996
1997 </macros>