Skip to content

Commit 315f8d8

Browse files
anuprulez and Anup Kumar
authored
Fix linting and tool tests for scikit-learn tool suite (bgruening#1817)
* fix clf_metrics tool * fix linting errors and tests * add conditional tags * update tests * update discriminant tool * add pairwise tool * update sparse tool * update tests for ensemble * update tests for feature selection * update tests for model_prediction, pairwise_metrics, regression_metrics, model_fit * update tests for sklearn_fitted_model_eval and sklearn_generalized_linear * update tests for lightgbm.xml ml_visualization_ex.xml model_validation.xml nn_classifier.xml numeric_clustering.xml * svm search model validation * update tests for keras_batch_models.xml keras_model_builder.xml pca.xml pipeline.xml sample_generator.xml train_test_eval.xml * update test for keras_train_eval.xml * update tests and test data for sparse.xml * fix tests for preprocessing tool * update test data for preprocessing tools * bump suite version * update tool version * remove unique_param * update suite name * Keras>=2.10 and <2.11 work with Python=3.10 or maybe Python=3.11 * Change python=3.10 * revert the Python=3.9 version * update test files E format --------- Co-authored-by: Anup Kumar <anuprulez@gmail.com>
1 parent 12b8a7f commit 315f8d8

28 files changed

+3145
-1621
lines changed

tools/sklearn/.shed.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -20,7 +20,7 @@ auto_tool_repositories:
2020
name_template: "{{ tool_id }}"
2121
description_template: "Wrapper for scikit learn tool: {{ tool_name }}"
2222
suite:
23-
name: "sklearn_suite"
23+
name: "suite_sklearn"
2424
description: "A suite of Galaxy tools for Machine Learning algorithms such as classification, regression, and clustering"
2525

2626
long_description: |

tools/sklearn/clf_metrics.xml

Lines changed: 253 additions & 108 deletions
Large diffs are not rendered by default.

tools/sklearn/discriminant.xml

Lines changed: 76 additions & 36 deletions
Original file line numberDiff line numberDiff line change
@@ -92,52 +92,92 @@ dump_model_to_h5(classifier_object, '$outfile_fit')
9292
</inputs>
9393
<expand macro="output" />
9494
<tests>
95-
<test>
96-
<param name="infile1" value="train.tabular" ftype="tabular" />
97-
<param name="infile2" value="train.tabular" ftype="tabular" />
98-
<param name="col1" value="1,2,3,4" />
99-
<param name="col2" value="5" />
100-
<param name="selected_task" value="train" />
101-
<param name="selected_algorithm" value="LinearDiscriminantAnalysis" />
102-
<param name="solver" value="svd" />
103-
<param name="store_covariance" value="True" />
95+
<test expect_num_outputs="1">
96+
<conditional name="selected_tasks">
97+
<param name="selected_task" value="train" />
98+
<conditional name="selected_algorithms">
99+
<param name="selected_algorithm" value="LinearDiscriminantAnalysis" />
100+
<conditional name="input_options">
101+
<param name="infile1" value="train.tabular" ftype="tabular" />
102+
<param name="infile2" value="train.tabular" ftype="tabular" />
103+
<conditional name="column_selector_options_1">
104+
<param name="col1" value="1,2,3,4" />
105+
</conditional>
106+
<conditional name="column_selector_options_2">
107+
<param name="col2" value="5" />
108+
</conditional>
109+
</conditional>
110+
<section name="options">
111+
<param name="solver" value="svd" />
112+
<param name="store_covariance" value="True" />
113+
</section>
114+
</conditional>
115+
</conditional>
104116
<output name="outfile_fit" file="lda_model01" compare="sim_size" delta="1" />
105117
</test>
106-
<test>
107-
<param name="infile1" value="train.tabular" ftype="tabular" />
108-
<param name="infile2" value="train.tabular" ftype="tabular" />
109-
<param name="col1" value="1,2,3,4" />
110-
<param name="col2" value="5" />
111-
<param name="selected_task" value="train" />
112-
<param name="selected_algorithm" value="LinearDiscriminantAnalysis" />
113-
<param name="solver" value="lsqr" />
118+
<test expect_num_outputs="1">
119+
<conditional name="selected_tasks">
120+
<param name="selected_task" value="train" />
121+
<conditional name="selected_algorithms">
122+
<param name="selected_algorithm" value="LinearDiscriminantAnalysis" />
123+
<conditional name="input_options">
124+
<param name="infile1" value="train.tabular" ftype="tabular" />
125+
<param name="infile2" value="train.tabular" ftype="tabular" />
126+
<conditional name="column_selector_options_1">
127+
<param name="col1" value="1,2,3,4" />
128+
</conditional>
129+
<conditional name="column_selector_options_2">
130+
<param name="col2" value="5" />
131+
</conditional>
132+
</conditional>
133+
<section name="options">
134+
<param name="solver" value="lsqr" />
135+
</section>
136+
</conditional>
137+
</conditional>
114138
<output name="outfile_fit" file="lda_model02" compare="sim_size" delta="1" />
115139
</test>
116-
<test>
117-
<param name="infile1" value="train.tabular" ftype="tabular" />
118-
<param name="infile2" value="train.tabular" ftype="tabular" />
119-
<param name="col1" value="1,2,3,4" />
120-
<param name="col2" value="5" />
121-
<param name="selected_task" value="train" />
122-
<param name="selected_algorithm" value="QuadraticDiscriminantAnalysis" />
140+
<test expect_num_outputs="1">
141+
<conditional name="selected_tasks">
142+
<param name="selected_task" value="train" />
143+
<conditional name="selected_algorithms">
144+
<param name="selected_algorithm" value="QuadraticDiscriminantAnalysis" />
145+
<conditional name="input_options">
146+
<param name="infile1" value="train.tabular" ftype="tabular" />
147+
<param name="infile2" value="train.tabular" ftype="tabular" />
148+
<conditional name="column_selector_options_1">
149+
<param name="col1" value="1,2,3,4" />
150+
</conditional>
151+
<conditional name="column_selector_options_2">
152+
<param name="col2" value="5" />
153+
</conditional>
154+
</conditional>
155+
</conditional>
156+
</conditional>
123157
<output name="outfile_fit" file="qda_model01" compare="sim_size" delta="1" />
124158
</test>
125-
<test>
126-
<param name="infile_model" value="lda_model01" ftype="h5mlm" />
127-
<param name="infile_data" value="test.tabular" ftype="tabular" />
128-
<param name="selected_task" value="load" />
159+
<test expect_num_outputs="1">
160+
<conditional name="selected_tasks">
161+
<param name="selected_task" value="load" />
162+
<param name="infile_model" value="lda_model01" ftype="h5mlm" />
163+
<param name="infile_data" value="test.tabular" ftype="tabular" />
164+
</conditional>
129165
<output name="outfile_predict" file="lda_prediction_result01.tabular" />
130166
</test>
131-
<test>
132-
<param name="infile_model" value="lda_model02" ftype="h5mlm" />
133-
<param name="infile_data" value="test.tabular" ftype="tabular" />
134-
<param name="selected_task" value="load" />
167+
<test expect_num_outputs="1">
168+
<conditional name="selected_tasks">
169+
<param name="selected_task" value="load" />
170+
<param name="infile_model" value="lda_model02" ftype="h5mlm" />
171+
<param name="infile_data" value="test.tabular" ftype="tabular" />
172+
</conditional>
135173
<output name="outfile_predict" file="lda_prediction_result02.tabular" />
136174
</test>
137-
<test>
138-
<param name="infile_model" value="qda_model01" ftype="h5mlm" />
139-
<param name="infile_data" value="test.tabular" ftype="tabular" />
140-
<param name="selected_task" value="load" />
175+
<test expect_num_outputs="1">
176+
<conditional name="selected_tasks">
177+
<param name="selected_task" value="load" />
178+
<param name="infile_model" value="qda_model01" ftype="h5mlm" />
179+
<param name="infile_data" value="test.tabular" ftype="tabular" />
180+
</conditional>
141181
<output name="outfile_predict" file="qda_prediction_result01.tabular" />
142182
</test>
143183
</tests>

0 commit comments

Comments
 (0)