From f8e108ed675b73bf72989a74ba757cd1483d221b Mon Sep 17 00:00:00 2001 From: Ibraheem Alyan <35265448+ibraheemalayan@users.noreply.github.com> Date: Sat, 4 May 2024 15:43:24 +0300 Subject: [PATCH] Fix issue #1226 Since the dataset contains many null values, Int32 (nullable integer) should be used instead of int32. --- merlin/datasets/ecommerce/aliccp/dataset.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/merlin/datasets/ecommerce/aliccp/dataset.py b/merlin/datasets/ecommerce/aliccp/dataset.py index 09f5c4fe61..c894dca86a 100644 --- a/merlin/datasets/ecommerce/aliccp/dataset.py +++ b/merlin/datasets/ecommerce/aliccp/dataset.py @@ -445,6 +445,6 @@ def _convert_data( current = [] tmp_files = glob(os.path.join(tmp_dir, f"{data_type}_*.parquet")) - dtypes = {f.name: "int32" for f in _Features().features} + dtypes = {f.name: "Int32" for f in _Features().features} merlin.io.Dataset(tmp_files, dtypes=dtypes).to_parquet(out_dir) shutil.rmtree(tmp_dir)