annotate ensemble.xml @ 26:8d0d31567045 draft

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
author bgruening
date Thu, 11 Oct 2018 03:22:26 -0400
parents 18e29854c803
children 5af731ab6995
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
1 <tool id="sklearn_ensemble" name="Ensemble methods" version="@VERSION@">
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
2 <description>for classification and regression</description>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
3 <macros>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
4 <import>main_macros.xml</import>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
5 </macros>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
6 <expand macro="python_requirements"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
7 <expand macro="macro_stdio"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
8 <version_command>echo "@VERSION@"</version_command>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
9 <command><![CDATA[
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
10 python "$ensemble_script" '$inputs'
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
11 ]]>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
12 </command>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
13 <configfiles>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
14 <inputs name="inputs"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
15 <configfile name="ensemble_script">
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
16 <![CDATA[
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
17 import sys
23
090cb13556f1 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit d00173591e4a783a4c1cb2664e4bb192ab5414f7
bgruening
parents: 19
diff changeset
18 import os
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
19 import json
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
20 import numpy as np
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
21 import sklearn.ensemble
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
22 import pandas
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
23 from scipy.io import mmread
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
24
25
18e29854c803 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 2a058459e6daf0486871f93845f00fdb4a4eaca1
bgruening
parents: 24
diff changeset
25 with open("$__tool_directory__/sk_whitelist.json", "r") as f:
18e29854c803 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 2a058459e6daf0486871f93845f00fdb4a4eaca1
bgruening
parents: 24
diff changeset
26 sk_whitelist = json.load(f)
18e29854c803 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 2a058459e6daf0486871f93845f00fdb4a4eaca1
bgruening
parents: 24
diff changeset
27 exec(open("$__tool_directory__/utils.py").read(), globals())
8
ea8b1c89c20b planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit cea052cf3b8dd4f3620253bd222e126de32e7466
bgruening
parents: 6
diff changeset
28
18
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
29 # Get inputs, outputs.
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
30 input_json_path = sys.argv[1]
19
128bd4ab2b82 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit f54ff2ba2f8e7542d68966ce5a6b17d7f624ac48
bgruening
parents: 18
diff changeset
31 with open(input_json_path, "r") as param_handler:
128bd4ab2b82 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit f54ff2ba2f8e7542d68966ce5a6b17d7f624ac48
bgruening
parents: 18
diff changeset
32 params = json.load(param_handler)
128bd4ab2b82 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit f54ff2ba2f8e7542d68966ce5a6b17d7f624ac48
bgruening
parents: 18
diff changeset
33 print(params)
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
34
18
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
35 # Put all cheetah up here to avoid confusion.
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
36 #if $selected_tasks.selected_task == "train":
18
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
37 infile1 = "$selected_tasks.selected_algorithms.input_options.infile1"
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
38 infile2 = "$selected_tasks.selected_algorithms.input_options.infile2"
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
39 #else:
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
40 infile_model = "$selected_tasks.infile_model"
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
41 infile_data = "$selected_tasks.infile_data"
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
42 #end if
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
43 outfile_fit = "$outfile_fit"
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
44 outfile_predict = "$outfile_predict"
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
45
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
46 # All Python from here on out:
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
47
18
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
48 if params["selected_tasks"]["selected_task"] == "train":
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
49 algorithm = params["selected_tasks"]["selected_algorithms"]["selected_algorithm"]
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
50 options = params["selected_tasks"]["selected_algorithms"]["options"]
23
090cb13556f1 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit d00173591e4a783a4c1cb2664e4bb192ab5414f7
bgruening
parents: 19
diff changeset
51 if algorithm in ['RandomForestClassifier', 'RandomForestRegressor']:
090cb13556f1 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit d00173591e4a783a4c1cb2664e4bb192ab5414f7
bgruening
parents: 19
diff changeset
52 options['n_jobs'] = N_JOBS
18
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
53 if "select_max_features" in options:
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
54 if options["select_max_features"]["max_features"] == "number_input":
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
55 options["select_max_features"]["max_features"] = options["select_max_features"]["num_max_features"]
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
56 options["select_max_features"].pop("num_max_features")
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
57 options["max_features"] = options["select_max_features"]["max_features"]
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
58 options.pop("select_max_features")
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
59 if "presort" in options:
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
60 if options["presort"] == "true":
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
61 options["presort"] = True
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
62 if options["presort"] == "false":
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
63 options["presort"] = False
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
64 if "min_samples_leaf" in options and options["min_samples_leaf"] == 1.0:
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
65 options["min_samples_leaf"] = 1
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
66 if "min_samples_split" in options and options["min_samples_split"] > 1.0:
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
67 options["min_samples_split"] = int(options["min_samples_split"])
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
68
18
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
69 X, y = get_X_y(params, infile1, infile2)
19
128bd4ab2b82 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit f54ff2ba2f8e7542d68966ce5a6b17d7f624ac48
bgruening
parents: 18
diff changeset
70
18
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
71 my_class = getattr(sklearn.ensemble, algorithm)
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
72 estimator = my_class(**options)
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
73 estimator.fit(X,y)
19
128bd4ab2b82 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit f54ff2ba2f8e7542d68966ce5a6b17d7f624ac48
bgruening
parents: 18
diff changeset
74 with open(outfile_fit, 'wb') as out_handler:
128bd4ab2b82 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit f54ff2ba2f8e7542d68966ce5a6b17d7f624ac48
bgruening
parents: 18
diff changeset
75 pickle.dump(estimator, out_handler, pickle.HIGHEST_PROTOCOL)
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
76
18
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
77 else:
19
128bd4ab2b82 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit f54ff2ba2f8e7542d68966ce5a6b17d7f624ac48
bgruening
parents: 18
diff changeset
78 with open(infile_model, 'rb') as model_handler:
25
18e29854c803 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 2a058459e6daf0486871f93845f00fdb4a4eaca1
bgruening
parents: 24
diff changeset
79 classifier_object = load_model(model_handler)
18
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
80 header = 'infer' if params["selected_tasks"]["header"] else None
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
81 data = pandas.read_csv(infile_data, sep='\t', header=header, index_col=None, parse_dates=True, encoding=None, tupleize_cols=False)
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
82 prediction = classifier_object.predict(data)
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
83 prediction_df = pandas.DataFrame(prediction, columns=["predicted"])
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
84 res = pandas.concat([data, prediction_df], axis=1)
0070e491573f planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 7c2fd140e89605fe689c39e21d70a400545e38cf
bgruening
parents: 17
diff changeset
85 res.to_csv(path_or_buf = outfile_predict, sep="\t", index=False)
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
86
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
87 ]]>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
88 </configfile>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
89 </configfiles>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
90 <inputs>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
91 <expand macro="sl_Conditional" model="zip">
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
92 <param name="selected_algorithm" type="select" label="Select an ensemble method:">
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
93 <option value="RandomForestClassifier" selected="true">Random forest classifier</option>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
94 <option value="AdaBoostClassifier">Ada boost classifier</option>
9
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
95 <option value="GradientBoostingClassifier">Gradient Boosting Classifier</option>
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
96 <option value="RandomForestRegressor">Random forest regressor</option>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
97 <option value="AdaBoostRegressor">Ada boost regressor</option>
9
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
98 <option value="GradientBoostingRegressor">Gradient Boosting Regressor</option>
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
99 </param>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
100 <when value="RandomForestClassifier">
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
101 <expand macro="sl_mixed_input"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
102 <section name="options" title="Advanced Options" expanded="False">
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
103 <expand macro="n_estimators"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
104 <expand macro="criterion"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
105 <expand macro="max_features"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
106 <expand macro="max_depth"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
107 <expand macro="min_samples_split"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
108 <expand macro="min_samples_leaf"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
109 <expand macro="min_weight_fraction_leaf"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
110 <expand macro="max_leaf_nodes"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
111 <expand macro="bootstrap"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
112 <expand macro="warm_start" checked="false"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
113 <expand macro="random_state"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
114 <expand macro="oob_score"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
115 <!--class_weight=None-->
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
116 </section>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
117 </when>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
118 <when value="AdaBoostClassifier">
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
119 <expand macro="sl_mixed_input"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
120 <section name="options" title="Advanced Options" expanded="False">
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
121 <!--base_estimator=None-->
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
122 <expand macro="n_estimators" default_value="50"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
123 <expand macro="learning_rate"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
124 <param argument="algorithm" type="select" label="Boosting algorithm" help=" ">
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
125 <option value="SAMME.R" selected="true">SAMME.R</option>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
126 <option value="SAMME">SAMME</option>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
127 </param>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
128 <expand macro="random_state"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
129 </section>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
130 </when>
9
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
131 <when value="GradientBoostingClassifier">
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
132 <expand macro="sl_mixed_input"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
133 <section name="options" title="Advanced Options" expanded="False">
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
134 <!--base_estimator=None-->
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
135 <param argument="loss" type="select" label="Loss function">
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
136 <option value="deviance" selected="true">deviance - logistic regression with probabilistic outputs</option>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
137 <option value="exponential">exponential - gradient boosting recovers the AdaBoost algorithm</option>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
138 </param>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
139 <expand macro="learning_rate" default_value='0.1'/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
140 <expand macro="n_estimators" default_value="100" help="The number of boosting stages to perform"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
141 <expand macro="max_depth" default_value="3" help="Maximum depth of the individual regression estimators"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
142 <expand macro="criterion2">
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
143 <option value="friedman_mse" selected="true">friedman_mse - mean squared error with improvement score by Friedman</option>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
144 </expand>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
145 <expand macro="min_samples_split" type="float"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
146 <expand macro="min_samples_leaf" type="float" label="The minimum number of samples required to be at a leaf node"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
147 <expand macro="min_weight_fraction_leaf"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
148 <expand macro="subsample"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
149 <expand macro="max_features"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
150 <expand macro="max_leaf_nodes"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
151 <expand macro="min_impurity_decrease"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
152 <expand macro="verbose"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
153 <expand macro="warm_start" checked="false"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
154 <expand macro="random_state"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
155 <expand macro="presort"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
156 </section>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
157 </when>
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
158 <when value="RandomForestRegressor">
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
159 <expand macro="sl_mixed_input"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
160 <section name="options" title="Advanced Options" expanded="False">
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
161 <expand macro="n_estimators"/>
9
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
162 <expand macro="criterion2"/>
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
163 <expand macro="max_features"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
164 <expand macro="max_depth"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
165 <expand macro="min_samples_split"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
166 <expand macro="min_samples_leaf"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
167 <expand macro="min_weight_fraction_leaf"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
168 <expand macro="max_leaf_nodes"/>
9
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
169 <expand macro="min_impurity_decrease"/>
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
170 <expand macro="bootstrap"/>
9
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
171 <expand macro="oob_score"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
172 <expand macro="random_state"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
173 <expand macro="verbose"/>
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
174 <expand macro="warm_start" checked="false"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
175 </section>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
176 </when>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
177 <when value="AdaBoostRegressor">
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
178 <expand macro="sl_mixed_input"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
179 <section name="options" title="Advanced Options" expanded="False">
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
180 <!--base_estimator=None-->
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
181 <expand macro="n_estimators" default_value="50"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
182 <expand macro="learning_rate"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
183 <param argument="loss" type="select" label="Loss function" optional="true" help="Used when updating the weights after each boosting iteration.">
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
184 <option value="linear" selected="true">linear</option>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
185 <option value="square">square</option>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
186 <option value="exponential">exponential</option>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
187 </param>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
188 <expand macro="random_state"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
189 </section>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
190 </when>
9
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
191 <when value="GradientBoostingRegressor">
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
192 <expand macro="sl_mixed_input"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
193 <section name="options" title="Advanced Options" expanded="False">
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
194 <param argument="loss" type="select" label="Loss function">
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
195 <option value="ls" selected="true">ls - least squares regression</option>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
196 <option value="lad">lad - least absolute deviation</option>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
197 <option value="huber">huber - combination of least squares regression and least absolute deviation</option>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
198 <option value="quantile">quantile - use alpha to specify the quantile</option>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
199 </param>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
200 <expand macro="learning_rate" default_value="0.1"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
201 <expand macro="n_estimators" default_value="100" help="The number of boosting stages to perform"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
202 <expand macro="max_depth" default_value="3" help="Maximum depth of the individual regression estimators"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
203 <expand macro="criterion2">
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
204 <option value="friedman_mse" selected="true">friedman_mse - mean squared error with improvement score by Friedman</option>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
205 </expand>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
206 <expand macro="min_samples_split" type="float"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
207 <expand macro="min_samples_leaf" type="float" label="The minimum number of samples required to be at a leaf node"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
208 <expand macro="min_weight_fraction_leaf"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
209 <expand macro="subsample"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
210 <expand macro="max_features"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
211 <expand macro="max_leaf_nodes"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
212 <expand macro="min_impurity_decrease"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
213 <param argument="alpha" type="float" value="0.9" label="alpha" help="The alpha-quantile of the Huber loss function and the quantile loss function. Only used if loss is 'huber' or 'quantile'." />
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
214 <!--base_estimator=None-->
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
215 <expand macro="verbose"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
216 <expand macro="warm_start" checked="false"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
217 <expand macro="random_state"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
218 <expand macro="presort"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
219 </section>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
220 </when>
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
221 </expand>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
222 </inputs>
4
3bc536788043 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents: 2
diff changeset
223
3bc536788043 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents: 2
diff changeset
224 <expand macro="output"/>
3bc536788043 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents: 2
diff changeset
225
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
226 <tests>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
227 <test>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
228 <param name="infile1" value="train.tabular" ftype="tabular"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
229 <param name="infile2" value="train.tabular" ftype="tabular"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
230 <param name="col1" value="1,2,3,4"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
231 <param name="col2" value="5"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
232 <param name="selected_task" value="train"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
233 <param name="selected_algorithm" value="RandomForestClassifier"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
234 <param name="random_state" value="10"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
235 <output name="outfile_fit" file="rfc_model01" compare="sim_size" delta="500"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
236 </test>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
237 <test>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
238 <param name="infile_model" value="rfc_model01" ftype="zip"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
239 <param name="infile_data" value="test.tabular" ftype="tabular"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
240 <param name="selected_task" value="load"/>
4
3bc536788043 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents: 2
diff changeset
241 <output name="outfile_predict" file="rfc_result01" compare="sim_size" delta="500"/>
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
242 </test>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
243 <test>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
244 <param name="infile1" value="regression_train.tabular" ftype="tabular"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
245 <param name="infile2" value="regression_train.tabular" ftype="tabular"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
246 <param name="col1" value="1,2,3,4,5"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
247 <param name="col2" value="6"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
248 <param name="selected_task" value="train"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
249 <param name="selected_algorithm" value="RandomForestRegressor"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
250 <param name="random_state" value="10"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
251 <output name="outfile_fit" file="rfr_model01" compare="sim_size" delta="500"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
252 </test>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
253 <test>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
254 <param name="infile_model" value="rfr_model01" ftype="zip"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
255 <param name="infile_data" value="regression_test.tabular" ftype="tabular"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
256 <param name="selected_task" value="load"/>
4
3bc536788043 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents: 2
diff changeset
257 <output name="outfile_predict" file="rfr_result01" compare="sim_size" delta="500"/>
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
258 </test>
9
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
259 <test>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
260 <param name="infile1" value="regression_X.tabular" ftype="tabular"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
261 <param name="infile2" value="regression_y.tabular" ftype="tabular"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
262 <param name="header1" value="True"/>
14
923ecece9e9c planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 97c4f22cdcfa6cddeeffc7b102c418a7ff12a888
bgruening
parents: 9
diff changeset
263 <param name="selected_column_selector_option" value="all_columns"/>
9
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
264 <param name="header2" value="True"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
265 <param name="col2" value="1"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
266 <param name="selected_task" value="train"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
267 <param name="selected_algorithm" value="GradientBoostingRegressor"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
268 <param name="max_features" value="number_input"/>
25
18e29854c803 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 2a058459e6daf0486871f93845f00fdb4a4eaca1
bgruening
parents: 24
diff changeset
269 <param name="num_max_features" value="0.5"/>
9
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
270 <param name="random_state" value="42"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
271 <output name="outfile_fit" file="gbr_model01" compare="sim_size" delta="500"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
272 </test>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
273 <test>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
274 <param name="infile_model" value="gbr_model01" ftype="zip"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
275 <param name="infile_data" value="regression_test_X.tabular" ftype="tabular"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
276 <param name="selected_task" value="load"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
277 <param name="header" value="True"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
278 <output name="outfile_predict" file="gbr_prediction_result01.tabular" compare="sim_size" delta="500"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
279 </test>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
280 <test>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
281 <param name="infile1" value="train.tabular" ftype="tabular"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
282 <param name="infile2" value="train.tabular" ftype="tabular"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
283 <param name="col1" value="1,2,3,4"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
284 <param name="col2" value="5"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
285 <param name="selected_task" value="train"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
286 <param name="selected_algorithm" value="GradientBoostingClassifier"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
287 <output name="outfile_fit" file="gbc_model01" compare="sim_size" delta="500"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
288 </test>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
289 <test>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
290 <param name="infile_model" value="gbc_model01" ftype="zip"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
291 <param name="infile_data" value="test.tabular" ftype="tabular"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
292 <param name="selected_task" value="load"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
293 <output name="outfile_predict" file="gbc_result01" compare="sim_size" delta="500"/>
e4fcbbc81083 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 35fa73d6e9ba8f0789ddfb743d893d950a68af02
bgruening
parents: 8
diff changeset
294 </test>
26
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
295 <test>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
296 <param name="infile1" value="train.tabular" ftype="tabular"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
297 <param name="infile2" value="train.tabular" ftype="tabular"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
298 <param name="col1" value="1,2,3,4"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
299 <param name="col2" value="5"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
300 <param name="selected_task" value="train"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
301 <param name="selected_algorithm" value="AdaBoostClassifier"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
302 <param name="random_state" value="10"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
303 <output name="outfile_fit" file="abc_model01" compare="sim_size" delta="500"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
304 </test>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
305 <test>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
306 <param name="infile_model" value="abc_model01" ftype="zip"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
307 <param name="infile_data" value="test.tabular" ftype="tabular"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
308 <param name="selected_task" value="load"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
309 <output name="outfile_predict" file="abc_result01" compare="sim_size" delta="500"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
310 </test>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
311 <test>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
312 <param name="infile1" value="regression_train.tabular" ftype="tabular"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
313 <param name="infile2" value="regression_train.tabular" ftype="tabular"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
314 <param name="col1" value="1,2,3,4,5"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
315 <param name="col2" value="6"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
316 <param name="selected_task" value="train"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
317 <param name="selected_algorithm" value="AdaBoostRegressor"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
318 <param name="random_state" value="10"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
319 <output name="outfile_fit" file="abr_model01" compare="sim_size" delta="500"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
320 </test>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
321 <test>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
322 <param name="infile_model" value="abr_model01" ftype="zip"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
323 <param name="infile_data" value="regression_test.tabular" ftype="tabular"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
324 <param name="selected_task" value="load"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
325 <output name="outfile_predict" file="abr_result01" compare="sim_size" delta="500"/>
8d0d31567045 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit c64ccc5850c8e061a95fb64e07ed388384e82393
bgruening
parents: 25
diff changeset
326 </test>
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
327 </tests>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
328 <help><![CDATA[
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
329 ***What it does***
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
330 The goal of ensemble methods is to combine the predictions of several base estimators built with a given learning algorithm in order to improve generalizability / robustness over a single estimator. This tool offers several families of ensemble algorithms for classification and regression: random forests, AdaBoost and gradient boosting, all based on the sklearn.ensemble module of Scikit-learn. Here you can find out about the input, output and methods presented in the tool. For information about ensemble methods and parameter settings please refer to `Scikit-learn ensemble`_.
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
331
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
332 .. _`Scikit-learn ensemble`: http://scikit-learn.org/stable/modules/ensemble.html
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
333
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
334 **1 - Methods**
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
335 There are two groups of operations available:
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
336
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
337 1 - Train a model : A training set containing samples and their respective labels (or target values) is provided as input. Based on the selected algorithm and options, an estimator object is fit to the data and returned.
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
338
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
339 2 - Load a model and predict : An existing model predicts the class labels (or regression values) for a new dataset.
4
3bc536788043 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents: 2
diff changeset
340
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
341 **2 - Training input**
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
342 When you choose to train a model, you need a features dataset X and a labels set y. This tool expects tabular or sparse data for X and a single column for y (tabular). You can select a subset of columns in a tabular dataset as your features dataset or labels column. Below you find some examples:
4
3bc536788043 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents: 2
diff changeset
343
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
344 **Sample tabular features dataset**
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
345 The following training dataset contains 3 feature columns and a column containing class labels. You can simply select the first 3 columns as features and the last column as labels:
4
3bc536788043 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents: 2
diff changeset
346
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
347 ::
4
3bc536788043 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents: 2
diff changeset
348
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
349 4.01163365529 -6.10797684314 8.29829894763 1
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
350 10.0788438916 1.59539821454 10.0684278289 0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
351 -5.17607775503 -0.878286135332 6.92941850665 2
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
352 4.00975406235 -7.11847496542 9.3802423585 1
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
353 4.61204065139 -5.71217537352 9.12509610964 1
4
3bc536788043 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents: 2
diff changeset
354
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
355
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
356 **Sample sparse features dataset**
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
357 In this case you cannot specify a column range.
4
3bc536788043 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents: 2
diff changeset
358
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
359 ::
4
3bc536788043 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents: 2
diff changeset
360
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
361 4 1048577 8738
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
362 1 271 0.02083333333333341
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
363 1 1038 0.02461995616119806
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
364 2 829017 0.01629088031127686
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
365 2 829437 0.01209127083516686
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
366 2 830752 0.02535100632816968
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
367 3 1047487 0.01485722929945572
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
368 3 1047980 0.02640566620767753
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
369 3 1048475 0.01665869913262564
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
370 4 608 0.01662975263094352
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
371 4 1651 0.02519674277562741
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
372 4 4053 0.04223659971350601
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
373
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
374
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
375 **2 - Training output**
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
376 The trained model is generated and output in the form of a binary file.
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
377
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
378
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
379 **3 - Prediction input**
4
3bc536788043 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents: 2
diff changeset
380
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
381 When you choose to load a model and do prediction, the tool expects an already trained estimator and a tabular dataset as input. The dataset contains new samples which you want to classify or predict regression values for.
4
3bc536788043 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents: 2
diff changeset
382
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
383
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
384 .. class:: warningmark
4
3bc536788043 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents: 2
diff changeset
385
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
386 The number of feature columns must be the same in training and prediction datasets!
4
3bc536788043 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents: 2
diff changeset
387
3bc536788043 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents: 2
diff changeset
388
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
389 **3 - Prediction output**
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
390 The tool predicts the class labels (or regression values) for new samples and adds them as the last column to the prediction dataset. The new dataset is then output as a tabular file. The prediction output format should look like the training dataset.
4
3bc536788043 planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 0e582cf1f3134c777cce3aa57d71b80ed95e6ba9
bgruening
parents: 2
diff changeset
391
0
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
392 ]]></help>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
393 <expand macro="sklearn_citation"/>
31fd07e0acdb planemo upload for repository https://github.com/bgruening/galaxytools/tools/sklearn commit 6c002ea2995c85f5f16adb2ef1c6be82dfbc5417
bgruening
parents:
diff changeset
394 </tool>