Mercurial > repos > bgruening > sklearn_data_preprocess
comparison pre_process.xml @ 36:ff2a7f89069e draft
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/sklearn commit 208a8d348e7c7a182cfbe1b6f17868146428a7e2"
| author | bgruening |
|---|---|
| date | Tue, 13 Apr 2021 21:03:03 +0000 |
| parents | e270c53b5df6 |
| children | 6c23a44a3c4f |
Comparison legend: equal · deleted · inserted · replaced
| 35:f40b6759fc1d | 36:ff2a7f89069e |
|---|---|
| 1 <tool id="sklearn_data_preprocess" name="Preprocess" version="@VERSION@"> | 1 <tool id="sklearn_data_preprocess" name="Preprocess" version="@VERSION@" profile="20.05"> |
| 2 <description>raw feature vectors into standardized datasets</description> | 2 <description>raw feature vectors into standardized datasets</description> |
| 3 <macros> | 3 <macros> |
| 4 <import>main_macros.xml</import> | 4 <import>main_macros.xml</import> |
| 5 </macros> | 5 </macros> |
| 6 <expand macro="python_requirements"/> | 6 <expand macro="python_requirements" /> |
| 7 <expand macro="macro_stdio"/> | 7 <expand macro="macro_stdio" /> |
| 8 <version_command>echo "@VERSION@"</version_command> | 8 <version_command>echo "@VERSION@"</version_command> |
| 9 <command> | 9 <command> |
| 10 <![CDATA[ | 10 <![CDATA[ |
| 11 python "$pre_processor_script" '$inputs' | 11 python "$pre_processor_script" '$inputs' |
| 12 ]]> | 12 ]]> |
| 95 </param> | 95 </param> |
| 96 <when value="tabular"> | 96 <when value="tabular"> |
| 97 <param name="infile" type="data" format="tabular" label="Select a tabular file you want to train your preprocessor on its data:" /> | 97 <param name="infile" type="data" format="tabular" label="Select a tabular file you want to train your preprocessor on its data:" /> |
| 98 <param name="header1" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolfalse" checked="false" label="Does the dataset contain header:" /> | 98 <param name="header1" type="boolean" optional="true" truevalue="booltrue" falsevalue="boolfalse" checked="false" label="Does the dataset contain header:" /> |
| 99 <conditional name="column_selector_options_1"> | 99 <conditional name="column_selector_options_1"> |
| 100 <expand macro="samples_column_selector_options" multiple="true" column_option="selected_column_selector_option" col_name="col1" infile="infile"/> | 100 <expand macro="samples_column_selector_options" multiple="true" column_option="selected_column_selector_option" col_name="col1" infile="infile" /> |
| 101 </conditional> | 101 </conditional> |
| 102 <conditional name="pre_processors"> | 102 <conditional name="pre_processors"> |
| 103 <expand macro="sparse_preprocessors_ext" /> | 103 <expand macro="sparse_preprocessors_ext" /> |
| 104 <expand macro="sparse_preprocessor_options_ext" /> | 104 <expand macro="sparse_preprocessor_options_ext" /> |
| 105 </conditional> | 105 </conditional> |
| 106 </when> | 106 </when> |
| 107 <when value="sparse"> | 107 <when value="sparse"> |
| 108 <param name="infile" type="data" format="txt" label="Select a sparse representation you want to train your preprocessor on its data:"/> | 108 <param name="infile" type="data" format="txt" label="Select a sparse representation you want to train your preprocessor on its data:" /> |
| 109 <conditional name="pre_processors"> | 109 <conditional name="pre_processors"> |
| 110 <expand macro="sparse_preprocessors"/> | 110 <expand macro="sparse_preprocessors" /> |
| 111 <expand macro="sparse_preprocessor_options"/> | 111 <expand macro="sparse_preprocessor_options" /> |
| 112 </conditional> | 112 </conditional> |
| 113 </when> | 113 </when> |
| 114 </conditional> | 114 </conditional> |
| 115 <param name="save" type="boolean" truevalue="booltrue" falsevalue="boolflase" checked="false" | 115 <param name="save" type="boolean" truevalue="booltrue" falsevalue="boolflase" checked="false" label="Save the preprocessor" help="Saves the preprocessor after fitting to the data. The preprocessor can then be passed to other tools and used in later operations." /> |
| 116 label="Save the preprocessor" | |
| 117 help="Saves the preprocessor after fitting to the data. The preprocessor can then be passed to other tools and used in later operations."/> | |
| 118 </inputs> | 116 </inputs> |
| 119 <outputs> | 117 <outputs> |
| 120 <data format="tabular" name="outfile_transform" from_work_dir="./output"/> | 118 <data format="tabular" name="outfile_transform" from_work_dir="./output" /> |
| 121 <data format="zip" name="outfile_fit"> | 119 <data format="zip" name="outfile_fit"> |
| 122 <filter>save</filter> | 120 <filter>save</filter> |
| 123 </data> | 121 </data> |
| 124 </outputs> | 122 </outputs> |
| 125 <tests> | 123 <tests> |
| 126 <test> | 124 <test> |
| 127 <param name="infile" value="train.tabular" ftype="tabular"/> | 125 <param name="infile" value="train.tabular" ftype="tabular" /> |
| 128 <param name="selected_column_selector_option" value="all_columns"/> | 126 <param name="selected_column_selector_option" value="all_columns" /> |
| 129 <param name="selected_input_type" value="tabular"/> | 127 <param name="selected_input_type" value="tabular" /> |
| 130 <param name="selected_pre_processor" value="KernelCenterer"/> | 128 <param name="selected_pre_processor" value="KernelCenterer" /> |
| 131 <param name="save" value="true"/> | 129 <param name="save" value="true" /> |
| 132 <output name="outfile_transform" file="prp_result01" ftype="tabular"/> | 130 <output name="outfile_transform" file="prp_result01" ftype="tabular" /> |
| 133 <output name="outfile_fit" file="prp_model01" ftype="zip" compare="sim_size" delta="5"/> | 131 <output name="outfile_fit" file="prp_model01" ftype="zip" compare="sim_size" delta="5" /> |
| 134 </test> | 132 </test> |
| 135 <test> | 133 <test> |
| 136 <param name="infile" value="train.tabular" ftype="tabular"/> | 134 <param name="infile" value="train.tabular" ftype="tabular" /> |
| 137 <param name="selected_column_selector_option" value="all_columns"/> | 135 <param name="selected_column_selector_option" value="all_columns" /> |
| 138 <param name="selected_input_type" value="tabular"/> | 136 <param name="selected_input_type" value="tabular" /> |
| 139 <param name="selected_pre_processor" value="MinMaxScaler"/> | 137 <param name="selected_pre_processor" value="MinMaxScaler" /> |
| 140 <param name="save" value="true"/> | 138 <param name="save" value="true" /> |
| 141 <output name="outfile_transform" file="prp_result02" ftype="tabular"/> | 139 <output name="outfile_transform" file="prp_result02" ftype="tabular" /> |
| 142 <output name="outfile_fit" file="prp_model02" ftype="zip" compare="sim_size" delta="5"/> | 140 <output name="outfile_fit" file="prp_model02" ftype="zip" compare="sim_size" delta="5" /> |
| 143 </test> | 141 </test> |
| 144 <test> | 142 <test> |
| 145 <param name="infile" value="train.tabular" ftype="tabular"/> | 143 <param name="infile" value="train.tabular" ftype="tabular" /> |
| 146 <param name="selected_column_selector_option" value="all_columns"/> | 144 <param name="selected_column_selector_option" value="all_columns" /> |
| 147 <param name="selected_input_type" value="tabular"/> | 145 <param name="selected_input_type" value="tabular" /> |
| 148 <param name="selected_pre_processor" value="PolynomialFeatures"/> | 146 <param name="selected_pre_processor" value="PolynomialFeatures" /> |
| 149 <param name="save" value="true"/> | 147 <param name="save" value="true" /> |
| 150 <output name="outfile_transform" file="prp_result03" ftype="tabular"/> | 148 <output name="outfile_transform" file="prp_result03" ftype="tabular" /> |
| 151 <output name="outfile_fit" file="prp_model03" ftype="zip" compare="sim_size" delta="5"/> | 149 <output name="outfile_fit" file="prp_model03" ftype="zip" compare="sim_size" delta="5" /> |
| 152 </test> | 150 </test> |
| 153 <test> | 151 <test> |
| 154 <param name="infile" value="train.tabular" ftype="tabular"/> | 152 <param name="infile" value="train.tabular" ftype="tabular" /> |
| 155 <param name="selected_column_selector_option" value="all_columns"/> | 153 <param name="selected_column_selector_option" value="all_columns" /> |
| 156 <param name="selected_input_type" value="tabular"/> | 154 <param name="selected_input_type" value="tabular" /> |
| 157 <param name="selected_pre_processor" value="RobustScaler"/> | 155 <param name="selected_pre_processor" value="RobustScaler" /> |
| 158 <param name="save" value="true"/> | 156 <param name="save" value="true" /> |
| 159 <output name="outfile_transform" file="prp_result04" ftype="tabular"/> | 157 <output name="outfile_transform" file="prp_result04" ftype="tabular" /> |
| 160 <output name="outfile_fit" file="prp_model04" ftype="zip" compare="sim_size" delta="5"/> | 158 <output name="outfile_fit" file="prp_model04" ftype="zip" compare="sim_size" delta="5" /> |
| 161 </test> | 159 </test> |
| 162 <test> | 160 <test> |
| 163 <param name="infile" value="csr_sparse2.mtx" ftype="txt"/> | 161 <param name="infile" value="csr_sparse2.mtx" ftype="txt" /> |
| 164 <param name="selected_input_type" value="sparse"/> | 162 <param name="selected_input_type" value="sparse" /> |
| 165 <param name="selected_pre_processor" value="Binarizer"/> | 163 <param name="selected_pre_processor" value="Binarizer" /> |
| 166 <param name="save" value="true"/> | 164 <param name="save" value="true" /> |
| 167 <output name="outfile_transform" file="prp_result05" ftype="tabular"/> | 165 <output name="outfile_transform" file="prp_result05" ftype="tabular" /> |
| 168 <output name="outfile_fit" file="prp_model05" ftype="zip" compare="sim_size" delta="5"/> | 166 <output name="outfile_fit" file="prp_model05" ftype="zip" compare="sim_size" delta="5" /> |
| 169 </test> | 167 </test> |
| 170 <test> | 168 <test> |
| 171 <param name="infile" value="train.tabular" ftype="tabular"/> | 169 <param name="infile" value="train.tabular" ftype="tabular" /> |
| 172 <param name="selected_input_type" value="tabular"/> | 170 <param name="selected_input_type" value="tabular" /> |
| 173 <param name="selected_column_selector_option" value="all_columns"/> | 171 <param name="selected_column_selector_option" value="all_columns" /> |
| 174 <param name="selected_pre_processor" value="StandardScaler"/> | 172 <param name="selected_pre_processor" value="StandardScaler" /> |
| 175 <param name="save" value="true"/> | 173 <param name="save" value="true" /> |
| 176 <output name="outfile_transform" file="prp_result07" ftype="tabular"/> | 174 <output name="outfile_transform" file="prp_result07" ftype="tabular" /> |
| 177 <output name="outfile_fit" file="prp_model07" ftype="zip" compare="sim_size" delta="5"/> | 175 <output name="outfile_fit" file="prp_model07" ftype="zip" compare="sim_size" delta="5" /> |
| 178 </test> | 176 </test> |
| 179 <test> | 177 <test> |
| 180 <param name="infile" value="csr_sparse2.mtx" ftype="txt"/> | 178 <param name="infile" value="csr_sparse2.mtx" ftype="txt" /> |
| 181 <param name="selected_input_type" value="sparse"/> | 179 <param name="selected_input_type" value="sparse" /> |
| 182 <param name="selected_pre_processor" value="MaxAbsScaler"/> | 180 <param name="selected_pre_processor" value="MaxAbsScaler" /> |
| 183 <param name="save" value="true"/> | 181 <param name="save" value="true" /> |
| 184 <output name="outfile_transform" file="prp_result08" ftype="tabular"/> | 182 <output name="outfile_transform" file="prp_result08" ftype="tabular" /> |
| 185 <output name="outfile_fit" file="prp_model08" ftype="zip" compare="sim_size" delta="5"/> | 183 <output name="outfile_fit" file="prp_model08" ftype="zip" compare="sim_size" delta="5" /> |
| 186 </test> | 184 </test> |
| 187 <test> | 185 <test> |
| 188 <param name="infile" value="csr_sparse2.mtx" ftype="txt"/> | 186 <param name="infile" value="csr_sparse2.mtx" ftype="txt" /> |
| 189 <param name="selected_input_type" value="sparse"/> | 187 <param name="selected_input_type" value="sparse" /> |
| 190 <param name="selected_pre_processor" value="Normalizer"/> | 188 <param name="selected_pre_processor" value="Normalizer" /> |
| 191 <param name="save" value="true"/> | 189 <param name="save" value="true" /> |
| 192 <output name="outfile_transform" file="prp_result09" ftype="tabular"/> | 190 <output name="outfile_transform" file="prp_result09" ftype="tabular" /> |
| 193 <output name="outfile_fit" file="prp_model09" ftype="zip" compare="sim_size" delta="5"/> | 191 <output name="outfile_fit" file="prp_model09" ftype="zip" compare="sim_size" delta="5" /> |
| 194 </test> | 192 </test> |
| 195 <test> | 193 <test> |
| 196 <param name="infile" value="regression_X.tabular" ftype="tabular"/> | 194 <param name="infile" value="regression_X.tabular" ftype="tabular" /> |
| 197 <param name="header1" value="true"/> | 195 <param name="header1" value="true" /> |
| 198 <param name="selected_column_selector_option" value="all_columns"/> | 196 <param name="selected_column_selector_option" value="all_columns" /> |
| 199 <param name="selected_input_type" value="tabular"/> | 197 <param name="selected_input_type" value="tabular" /> |
| 200 <param name="selected_pre_processor" value="MinMaxScaler"/> | 198 <param name="selected_pre_processor" value="MinMaxScaler" /> |
| 201 <param name="feature_range" value="(-1, 1)"/> | 199 <param name="feature_range" value="(-1, 1)" /> |
| 202 <param name="save" value="false"/> | 200 <param name="save" value="false" /> |
| 203 <output name="outfile_transform" file="prp_result10" ftype="tabular"/> | 201 <output name="outfile_transform" file="prp_result10" ftype="tabular" /> |
| 204 </test> | 202 </test> |
| 205 </tests> | 203 </tests> |
| 206 <help> | 204 <help> |
| 207 <![CDATA[ | 205 <![CDATA[ |
| 208 **What it does** | 206 **What it does** |
| 212 For information about preprocessing classes and parameter settings please refer to `Scikit-learn preprocessing`_. | 210 For information about preprocessing classes and parameter settings please refer to `Scikit-learn preprocessing`_. |
| 213 | 211 |
| 214 .. _`Scikit-learn preprocessing`: http://scikit-learn.org/stable/modules/preprocessing.html | 212 .. _`Scikit-learn preprocessing`: http://scikit-learn.org/stable/modules/preprocessing.html |
| 215 ]]> | 213 ]]> |
| 216 </help> | 214 </help> |
| 217 <expand macro="sklearn_citation"/> | 215 <expand macro="sklearn_citation" /> |
| 218 </tool> | 216 </tool> |
