Mercurial > repos > bgruening > svm_classifier
comparison main_macros.xml @ 2:48ac998ec1b9 draft
planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
author | bgruening |
---|---|
date | Tue, 31 May 2016 16:51:42 -0400 |
parents | a43963a460fb |
children | dac91f401f4b |
comparison
equal
deleted
inserted
replaced
1:a43963a460fb | 2:48ac998ec1b9 |
---|---|
12 <stdio> | 12 <stdio> |
13 <exit_code range="1:" level="fatal" description="Error occurred. Please check Tool Standard Error" /> | 13 <exit_code range="1:" level="fatal" description="Error occurred. Please check Tool Standard Error" /> |
14 </stdio> | 14 </stdio> |
15 </xml> | 15 </xml> |
16 | 16 |
17 | |
18 <!--Generic interface--> | |
17 <xml name="train_loadConditional" token_train="tabular" token_data="tabular" token_model="txt"> | 19 <xml name="train_loadConditional" token_train="tabular" token_data="tabular" token_model="txt"> |
18 <conditional name="selected_tasks"> | 20 <conditional name="selected_tasks"> |
19 <param name="selected_task" type="select" label="Select a Classification Task"> | 21 <param name="selected_task" type="select" label="Select a Classification Task"> |
22 <option value="train" selected="true">Train a model</option> | |
20 <option value="load">Load a model and predict</option> | 23 <option value="load">Load a model and predict</option> |
21 <option value="train" selected="true">Train a model</option> | |
22 </param> | 24 </param> |
23 <when value="load"> | 25 <when value="load"> |
24 <param name="infile_model" type="data" format="@MODEL@" label="Models" help="Select a model file." /> | 26 <param name="infile_model" type="data" format="@MODEL@" label="Models" help="Select a model file." /> |
25 <param name="infile_data" type="data" format="@DATA@" label="Data (tabular)" help="Select the dataset you want to classify."/> | 27 <param name="infile_data" type="data" format="@DATA@" label="Data (tabular)" help="Select the dataset you want to classify."/> |
26 <conditional name="prediction_options"> | 28 <conditional name="prediction_options"> |
41 </conditional> | 43 </conditional> |
42 </when> | 44 </when> |
43 </conditional> | 45 </conditional> |
44 </xml> | 46 </xml> |
45 | 47 |
48 <xml name="sl_Conditional" token_train="tabular" token_data="tabular" token_model="txt"> | |
49 <conditional name="selected_tasks"> | |
50 <param name="selected_task" type="select" label="Select a Classification Task"> | |
51 <option value="train" selected="true">Train a model</option> | |
52 <option value="load">Load a model and predict</option> | |
53 </param> | |
54 <when value="load"> | |
55 <param name="infile_model" type="data" format="@MODEL@" label="Models" help="Select a model file." /> | |
56 <param name="infile_data" type="data" format="@DATA@" label="Data (tabular)" help="Select the dataset you want to classify."/> | |
57 <conditional name="prediction_options"> | |
58 <param name="prediction_option" type="select" label="Select the type of prediction"> | |
59 <option value="predict">Predict class labels</option> | |
60 <option value="advanced">Include advanced options</option> | |
61 </param> | |
62 <when value="predict"> | |
63 </when> | |
64 <when value="advanced"> | |
65 </when> | |
66 </conditional> | |
67 </when> | |
68 <when value="train"> | |
69 <conditional name="selected_algorithms"> | |
70 <yield /> | |
71 </conditional> | |
72 </when> | |
73 </conditional> | |
74 </xml> | |
75 | |
46 <xml name="advanced_section"> | 76 <xml name="advanced_section"> |
47 <section name="options" title="Advanced Options" expanded="False"> | 77 <section name="options" title="Advanced Options" expanded="False"> |
48 <yield /> | 78 <yield /> |
49 </section> | 79 </section> |
50 </xml> | 80 </xml> |
51 | 81 |
52 <xml name="tabular_input"> | 82 |
53 <param name="infile" type="data" format="tabular" label="Data file with numeric values"/> | 83 <!--Ensemble methods--> |
54 <param name="start_column" type="data_column" data_ref="infile" optional="True" label="Select a subset of data. Start column:" /> | 84 <xml name="n_estimators" token_default_value="10" token_help=" "> |
55 <param name="end_column" type="data_column" data_ref="infile" optional="True" label="End column:" /> | 85 <param argument="n_estimators" type="integer" optional="true" value="@DEFAULT_VALUE@" label="Number of trees in the forest" help="@HELP@"/> |
56 </xml> | 86 </xml> |
57 | 87 |
88 <xml name="max_depth" token_default_value="" token_help=" "> | |
89 <param argument="max_depth" type="integer" optional="true" value="@DEFAULT_VALUE@" label="Maximum depth of the tree" help="@HELP@"/> | |
90 </xml> | |
91 | |
92 <xml name="min_samples_split" token_default_value="2" token_help=" "> | |
93 <param argument="min_samples_split" type="integer" optional="true" value="@DEFAULT_VALUE@" label="Maximum depth of the tree" help="@HELP@"/> | |
94 </xml> | |
95 | |
96 <xml name="min_samples_leaf" token_default_value="1" token_help=" "> | |
97 <param argument="min_samples_leaf" type="integer" optional="true" value="@DEFAULT_VALUE@" label="Minimum number of samples in newly created leaves" help="@HELP@"/> | |
98 </xml> | |
99 | |
100 <xml name="min_weight_fraction_leaf" token_default_value="0.0" token_help=" "> | |
101 <param argument="min_weight_fraction_leaf" type="float" optional="true" value="@DEFAULT_VALUE@" label="Minimum weighted fraction of the input samples required to be at a leaf node" help="@HELP@"/> | |
102 </xml> | |
103 | |
104 <xml name="max_leaf_nodes" token_default_value="" token_help=" "> | |
105 <param argument="max_leaf_nodes" type="integer" optional="true" value="@DEFAULT_VALUE@" label="Maximum number of leaf nodes in best-first method" help="@HELP@"/> | |
106 </xml> | |
107 | |
108 <xml name="bootstrap" token_checked="true" token_help=" "> | |
109 <param argument="bootstrap" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolflase" checked="@CHECKED@" label="Use bootstrap samples for building trees." help="@HELP@"/> | |
110 </xml> | |
111 | |
112 <xml name="criterion" token_help=" "> | |
113 <param argument="criterion" type="select" label="Function to measure the quality of a split" help=" "> | |
114 <option value="gini" selected="true">Gini impurity</option> | |
115 <option value="entropy">Information gain</option> | |
116 <yield/> | |
117 </param> | |
118 </xml> | |
119 | |
120 <xml name="oob_score" token_checked="flase" token_help=" "> | |
121 <param argument="oob_score" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolflase" checked="@CHECKED@" label="Use out-of-bag samples to estimate the generalization error" help="@HELP@"/> | |
122 </xml> | |
123 | |
124 <xml name="max_features" token_default_value="auto" token_help="This could be an integer, float, string, or None. For more information please refer to help. "> | |
125 <param argument="max_features" type="text" optional="true" value="@DEFAULT_VALUE@" label="Number of features for finding the best split" help="@HELP@"/> | |
126 </xml> | |
127 | |
128 <xml name="learning_rate" token_default_value="1.0" token_help=" "> | |
129 <param argument="learning_rate" type="float" optional="true" value="@DEFAULT_VALUE@" label="Learning rate" help="@HELP@"/> | |
130 </xml> | |
131 | |
132 | |
133 <!--Parameters--> | |
58 <xml name="tol" token_default_value="0.0" token_help_text="Early stopping heuristics based on the relative center changes. Set to default (0.0) to disable this convergence detection."> | 134 <xml name="tol" token_default_value="0.0" token_help_text="Early stopping heuristics based on the relative center changes. Set to default (0.0) to disable this convergence detection."> |
59 <param argument="tol" type="float" optional="true" value="@DEFAULT_VALUE@" label="Tolerance" help="@HELP_TEXT@"/> | 135 <param argument="tol" type="float" optional="true" value="@DEFAULT_VALUE@" label="Tolerance" help="@HELP_TEXT@"/> |
60 </xml> | 136 </xml> |
61 | 137 |
62 <xml name="n_clusters" token_default_value="8"> | 138 <xml name="n_clusters" token_default_value="8"> |
134 <param argument="degree" type="integer" optional="true" value="@DEFAULT_VALUE@" label="@LABEL@" help="@HELP_TEXT@"/> | 210 <param argument="degree" type="integer" optional="true" value="@DEFAULT_VALUE@" label="@LABEL@" help="@HELP_TEXT@"/> |
135 </xml> | 211 </xml> |
136 | 212 |
137 <xml name="coef0" token_default_value="1" token_label="Zero coefficient" token_help_text=" "> | 213 <xml name="coef0" token_default_value="1" token_label="Zero coefficient" token_help_text=" "> |
138 <param argument="coef0" type="integer" optional="true" value="@DEFAULT_VALUE@" label="@LABEL@" help="@HELP_TEXT@"/> | 214 <param argument="coef0" type="integer" optional="true" value="@DEFAULT_VALUE@" label="@LABEL@" help="@HELP_TEXT@"/> |
139 </xml> | 215 </xml> |
216 | |
217 <xml name="pos_label" token_default_value=""> | |
218 <param argument="pos_label" type="integer" optional="true" value="@DEFAULT_VALUE@" label="Label of the positive class" help=" "/> | |
219 </xml> | |
220 | |
221 <xml name="average"> | |
222 <param argument="average" type="select" optional="True" label="Averaging type" help=" "> | |
223 <option value="binary" selected="true" help="Only report results for the class specified by pos_label. Applicable only on binary classification.">binary</option> | |
224 <option value="micro" help="Calculate metrics globally by counting the total true positives, false negatives and false positives.">micro</option> | |
225 <option value="samples" help="Calculate metrics for each instance, and find their average (only meaningful for multilabel).">samples</option> | |
226 <!--option value="macro" help=""></option--> | |
227 <!--option value="weighted" help=""></option--> | |
228 </param> | |
229 </xml> | |
230 | |
231 <xml name="beta"> | |
232 <param argument="beta" type="float" value="1.0" label="The strength of recall versus precision in the F-score" help=" "/> | |
233 </xml> | |
234 | |
235 | |
236 <!--Data interface--> | |
237 <xml name="tabular_input"> | |
238 <param name="infile" type="data" format="tabular" label="Data file with numeric values"/> | |
239 <param name="start_column" type="data_column" data_ref="infile" optional="True" label="Select a subset of data. Start column:" /> | |
240 <param name="end_column" type="data_column" data_ref="infile" optional="True" label="End column:" /> | |
241 </xml> | |
242 | |
243 <xml name="sample_cols" token_label1="File containing true class labels:" token_label2="File containing predicted class labels:" token_multiple1="False" token_multiple2="False" token_format1="tabular" token_format2="tabular" token_help1="" token_help2=""> | |
244 <param name="infile1" type="data" format="@FORMAT1@" label="@LABEL1@" help="@HELP1@"/> | |
245 <param name="col1" multiple="@MULTIPLE1@" type="data_column" data_ref="infile1" label="Select target column(s):"/> | |
246 <param name="infile2" type="data" format="@FORMAT2@" label="@LABEL2@" help="@HELP2@"/> | |
247 <param name="col2" multiple="@MULTIPLE2@" type="data_column" data_ref="infile2" label="Select target column(s):"/> | |
248 <yield/> | |
249 </xml> | |
140 | 250 |
141 <xml name="multiple_input" token_name="input_files" token_max_num="10" token_format="txt" token_label="Sparse matrix file (.mtx, .txt)" token_help_text="Specify a sparse matrix file in .txt format."> | 251 <xml name="multiple_input" token_name="input_files" token_max_num="10" token_format="txt" token_label="Sparse matrix file (.mtx, .txt)" token_help_text="Specify a sparse matrix file in .txt format."> |
142 <repeat name="@NAME@" min="1" max="@MAX_NUM@" title="Select input file(s):"> | 252 <repeat name="@NAME@" min="1" max="@MAX_NUM@" title="Select input file(s):"> |
143 <param name="input" type="data" format="@FORMAT@" label="@LABEL@" help="@HELP_TEXT@"/> | 253 <param name="input" type="data" format="@FORMAT@" label="@LABEL@" help="@HELP_TEXT@"/> |
144 </repeat> | 254 </repeat> |
145 </xml> | 255 </xml> |
146 | 256 |
147 <xml name="eden_citation"> | 257 <xml name="sparse_target" token_label1="Select a sparse matrix:" token_label2="Select the tabular containing true labels:" token_multiple="False" token_format1="txt" token_format2="tabular" token_help1="" token_help2=""> |
148 <citations> | 258 <param name="infile1" type="data" format="@FORMAT1@" label="@LABEL1@" help="@HELP1@"/> |
149 <citation type="bibtex"> | 259 <param name="infile2" type="data" format="@FORMAT2@" label="@LABEL2@" help="@HELP2@"/> |
150 @misc{fabrizio_costa_2015_15094, | 260 <param name="col2" multiple="@MULTIPLE@" type="data_column" data_ref="infile2" label="Select target column(s):"/> |
151 author = {Fabrizio Costa and | 261 </xml> |
152 Björn Grüning and | 262 |
153 gigolo}, | 263 <xml name="sl_mixed_input"> |
154 title = {EDeN: EDeN - Graph Vectorizer}, | 264 <conditional name="input_options"> |
155 month = feb, | 265 <param name="selected_input" type="select" label="Select input type:"> |
156 year = 2015, | 266 <option value="tabular" selected="true">tabular data</option> |
157 doi = {10.5281/zenodo.15094}, | 267 <option value="sparse">sparse matrix</option> |
158 url = {http://dx.doi.org/10.5281/zenodo.15094} | 268 </param> |
159 } | 269 <when value="tabular"> |
160 } | 270 <expand macro="sample_cols" multiple1="true"/> |
161 </citation> | 271 </when> |
162 </citations> | 272 <when value="sparse"> |
163 </xml> | 273 <expand macro="sparse_target"/> |
164 | 274 </when> |
165 <xml name="sklearn_citation"> | 275 </conditional> |
166 <citations> | 276 </xml> |
167 <citation type="bibtex"> | 277 |
168 @article{scikit-learn, | 278 |
169 title={Scikit-learn: Machine Learning in {P}ython}, | 279 <!--Advanced options--> |
170 author={Pedregosa, F. and Varoquaux, G. and Gramfort, A. and Michel, V. | |
171 and Thirion, B. and Grisel, O. and Blondel, M. and Prettenhofer, P. | |
172 and Weiss, R. and Dubourg, V. and Vanderplas, J. and Passos, A. and | |
173 Cournapeau, D. and Brucher, M. and Perrot, M. and Duchesnay, E.}, | |
174 journal={Journal of Machine Learning Research}, | |
175 volume={12}, | |
176 pages={2825--2830}, | |
177 year={2011} | |
178 url = {https://github.com/scikit-learn/scikit-learn} | |
179 } | |
180 </citation> | |
181 </citations> | |
182 </xml> | |
183 | |
184 <xml name="scipy_citation"> | |
185 <citations> | |
186 <citation type="bibtex"> | |
187 @Misc{, | |
188 author = {Eric Jones and Travis Oliphant and Pearu Peterson and others}, | |
189 title = {{SciPy}: Open source scientific tools for {Python}}, | |
190 year = {2001--}, | |
191 url = "http://www.scipy.org/", | |
192 note = {[Online; accessed 2016-04-09]} | |
193 } | |
194 </citation> | |
195 </citations> | |
196 </xml> | |
197 | |
198 | |
199 <xml name="nn_advanced_options"> | 280 <xml name="nn_advanced_options"> |
200 <section name="options" title="Advanced Options" expanded="False"> | 281 <section name="options" title="Advanced Options" expanded="False"> |
201 <yield/> | 282 <yield/> |
202 <param argument="weights" type="select" label="Weight function" help="Used in prediction."> | 283 <param argument="weights" type="select" label="Weight function" help="Used in prediction."> |
203 <option value="uniform" selected="true" help="Uniform weights. All points in each neighborhood are weighted equally.">Uniform</option> | 284 <option value="uniform" selected="true" help="Uniform weights. All points in each neighborhood are weighted equally.">Uniform</option> |
440 <param argument="batch_size" type="integer" optional="true" value="500" label="Batch size" help="Number of rows to be processed in each batch run."/> | 521 <param argument="batch_size" type="integer" optional="true" value="500" label="Batch size" help="Number of rows to be processed in each batch run."/> |
441 </section> | 522 </section> |
442 </when> | 523 </when> |
443 </xml> | 524 </xml> |
444 | 525 |
526 <xml name="sparse_preprocessors"> | |
527 <param name="selected_pre_processor" type="select" label="Select a preprocessor:"> | |
528 <option value="StandardScaler" selected="true">Standardize features by removing the mean and scaling to unit variance</option> | |
529 <option value="Binarizer">Binarize data</option> | |
530 <option value="Imputer">Complete missing values</option> | |
531 <option value="MaxAbsScaler">Scale features by their maximum absolute value</option> | |
532 <option value="Normalizer">Normalize samples individually to unit norm</option> | |
533 <yield/> | |
534 </param> | |
535 </xml> | |
536 | |
537 <xml name="sparse_preprocessor_options"> | |
538 <when value="Binarizer"> | |
539 <section name="options" title="Advanced Options" expanded="False"> | |
540 <param argument="copy" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolflase" checked="true" label="Use a copy of data for precomputing binarization" help=" "/> | |
541 <param argument="threshold" type="float" optional="true" value="0.0" label="Threshold" help="Feature values below or equal to this are replaced by 0, above it by 1. Threshold may not be less than 0 for operations on sparse matrices. "/> | |
542 </section> | |
543 </when> | |
544 <when value="Imputer"> | |
545 <section name="options" title="Advanced Options" expanded="False"> | |
546 <param argument="copy" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolflase" checked="true" label="Use a copy of data for precomputing imputation" help=" "/> | |
547 <param argument="strategy" type="select" optional="true" label="Imputation strategy" help=" "> | |
548 <option value="mean" selected="true">Replace missing values using the mean along the axis</option> | |
549 <option value="median">Replace missing values using the median along the axis</option> | |
550 <option value="most_frequent">Replace missing using the most frequent value along the axis</option> | |
551 </param> | |
552 <param argument="missing_values" type="text" optional="true" value="NaN" label="Placeholder for missing values" help="For missing values encoded as numpy.nan, use the string value “NaN”"/> | |
553 <param argument="axis" type="select" optional="true" label="The axis along which to impute" help=" "> | |
554 <option value="0" selected="true">Impute along columns</option> | |
555 <option value="1">Impute along rows</option> | |
556 </param> | |
557 </section> | |
558 </when> | |
559 <when value="StandardScaler"> | |
560 <section name="options" title="Advanced Options" expanded="False"> | |
561 <param argument="copy" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolflase" checked="true" label="Use a copy of data for performing inplace scaling" help=" "/> | |
562 <param argument="with_mean" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolflase" checked="true" label="Center the data before scaling" help=" "/> | |
563 <param argument="with_std" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolflase" checked="true" label="Scale the data to unit variance (or unit standard deviation)" help=" "/> | |
564 </section> | |
565 </when> | |
566 <when value="MaxAbsScaler"> | |
567 <section name="options" title="Advanced Options" expanded="False"> | |
568 <param argument="copy" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolflase" checked="true" label="Use a copy of data for precomputing scaling" help=" "/> | |
569 </section> | |
570 </when> | |
571 <when value="Normalizer"> | |
572 <section name="options" title="Advanced Options" expanded="False"> | |
573 <param argument="norm" type="select" optional="true" label="The norm to use to normalize non zero samples" help=" "> | |
574 <option value="l1" selected="true">l1</option> | |
575 <option value="l2">l2</option> | |
576 <option value="max">max</option> | |
577 <param argument="copy" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolflase" checked="true" label="Use a copy of data for precomputing row normalization" help=" "/> | |
578 </param> | |
579 </section> | |
580 </when> | |
581 <yield/> | |
582 </xml> | |
583 | |
584 | |
585 <!--Citations--> | |
586 <xml name="eden_citation"> | |
587 <citations> | |
588 <citation type="bibtex"> | |
589 @misc{fabrizio_costa_2015_15094, | |
590 author = {Fabrizio Costa and | |
591 Björn Grüning and | |
592 gigolo}, | |
593 title = {EDeN: EDeN - Graph Vectorizer}, | |
594 month = feb, | |
595 year = 2015, | |
596 doi = {10.5281/zenodo.15094}, | |
597 url = {http://dx.doi.org/10.5281/zenodo.15094} | |
598 } | |
599 } | |
600 </citation> | |
601 </citations> | |
602 </xml> | |
603 | |
604 <xml name="sklearn_citation"> | |
605 <citations> | |
606 <citation type="bibtex"> | |
607 @article{scikit-learn, | |
608 title={Scikit-learn: Machine Learning in {P}ython}, | |
609 author={Pedregosa, F. and Varoquaux, G. and Gramfort, A. and Michel, V. | |
610 and Thirion, B. and Grisel, O. and Blondel, M. and Prettenhofer, P. | |
611 and Weiss, R. and Dubourg, V. and Vanderplas, J. and Passos, A. and | |
612 Cournapeau, D. and Brucher, M. and Perrot, M. and Duchesnay, E.}, | |
613 journal={Journal of Machine Learning Research}, | |
614 volume={12}, | |
615 pages={2825--2830}, | |
616 year={2011} | |
617 url = {https://github.com/scikit-learn/scikit-learn} | |
618 } | |
619 </citation> | |
620 </citations> | |
621 </xml> | |
622 | |
623 <xml name="scipy_citation"> | |
624 <citations> | |
625 <citation type="bibtex"> | |
626 @Misc{, | |
627 author = {Eric Jones and Travis Oliphant and Pearu Peterson and others}, | |
628 title = {{SciPy}: Open source scientific tools for {Python}}, | |
629 year = {2001--}, | |
630 url = "http://www.scipy.org/", | |
631 note = {[Online; accessed 2016-04-09]} | |
632 } | |
633 </citation> | |
634 </citations> | |
635 </xml> | |
636 | |
445 </macros> | 637 </macros> |