From 112f757b7399cf63e0056bbd95fd302f9bb900ce Mon Sep 17 00:00:00 2001 From: Yohei Kishimoto Date: Sun, 31 Mar 2024 14:19:59 +0900 Subject: [PATCH] add regression test for #6273 --- tests/python_package_test/test_basic.py | 10 ++++++++++ 1 file changed, 10 insertions(+) diff --git a/tests/python_package_test/test_basic.py b/tests/python_package_test/test_basic.py index 7177623be02d..92f5593ef7c1 100644 --- a/tests/python_package_test/test_basic.py +++ b/tests/python_package_test/test_basic.py @@ -573,6 +573,16 @@ def test_dataset_construction_overwrites_user_provided_metadata_fields(): np_assert_array_equal(dtrain.get_field("weight"), expected_weight, strict=True) +def test_dataset_construction_with_high_cardinality_categorical_succeeds(): + pd = pytest.importorskip("pandas") + X = pd.DataFrame({"x1": np.random.randint(0, 5_000, 10_000)}) + y = np.random.rand(10_000) + ds = lgb.Dataset(X, y, categorical_feature=["x1"]) + ds.construct() + assert ds.num_data() == 10_000 + assert ds.num_feature() == 1 + + def test_choose_param_value(): original_params = { "local_listen_port": 1234,