diff --git a/sklbench/datasets/loaders.py b/sklbench/datasets/loaders.py index 668ed3a7..eb3e3b6b 100644 --- a/sklbench/datasets/loaders.py +++ b/sklbench/datasets/loaders.py @@ -42,8 +42,8 @@ def load_openml_data( ) -> Tuple[Dict, Dict]: x, y = load_openml(openml_id, raw_data_cache) data_desc = dict() - unique_labels = dict(pd.value_counts(y)) - if len(unique_labels) < 32 and all(map(lambda x: x > 4, unique_labels.values())): + unique_labels = pd.Series(y).value_counts() + if len(unique_labels) < 32 and (unique_labels > 4).all(): data_desc["n_classes"] = len(unique_labels) return {"x": x, "y": y}, data_desc diff --git a/sklbench/utils/special_params.py b/sklbench/utils/special_params.py index 42a8ce32..80812012 100644 --- a/sklbench/utils/special_params.py +++ b/sklbench/utils/special_params.py @@ -214,7 +214,7 @@ def assign_case_special_values_on_run( and estimator.endswith("Classifier") ): y_train = convert_to_numpy(data[1]) - value_counts = pd.value_counts(y_train).sort_index() + value_counts = pd.Series(y_train).value_counts().sort_index() if len(value_counts) != 2: logger.info( f"Number of classes ({len(value_counts)}) != 2 "