From 88e125aa05efe47d30c10a958267f632b9630eca Mon Sep 17 00:00:00 2001
From: Nikhil Raverkar
Date: Thu, 14 Jul 2022 19:07:54 -0400
Subject: [PATCH] reverting numpy to 1.19.2 to solve pyarrow integration issue, changes to resolve numpy related build issues and adding regression test

---
Review notes (this section is ignored when the patch is applied):
 * The stale numpy-1.21.2.dist-info is removed with `rm -rf` because a
   dist-info entry is a directory and plain `rm` would abort the RUN chain.
 * The new cleanup step targets python3.8 while the existing one targets
   python3.7; TODO confirm which interpreter the base image ships.
 * The regression test writes its parquet file under pytest's tmp_path so
   no artifact is left in the working directory.

 docker/0.23-1/final/Dockerfile.cpu | 3 ++-
 requirements.txt                   | 2 +-
 test/unit/test_modules.py          | 8 ++++++++
 3 files changed, 11 insertions(+), 2 deletions(-)

diff --git a/docker/0.23-1/final/Dockerfile.cpu b/docker/0.23-1/final/Dockerfile.cpu
index bfc91a3..d597bc2 100644
--- a/docker/0.23-1/final/Dockerfile.cpu
+++ b/docker/0.23-1/final/Dockerfile.cpu
@@ -11,7 +11,8 @@ COPY dist/sagemaker_sklearn_container-2.0-py3-none-any.whl /sagemaker_sklearn_co
 # https://github.com/googleapis/google-cloud-python/issues/6647
 RUN rm -rf /miniconda3/lib/python3.7/site-packages/numpy-1.19.4.dist-info && \
     pip install --no-cache /sagemaker_sklearn_container-2.0-py3-none-any.whl && \
-    rm /sagemaker_sklearn_container-2.0-py3-none-any.whl
+    rm /sagemaker_sklearn_container-2.0-py3-none-any.whl && \
+    rm -rf /miniconda3/lib/python3.8/site-packages/numpy-1.21.2.dist-info
 
 ENV SAGEMAKER_TRAINING_MODULE sagemaker_sklearn_container.training:main
 ENV SAGEMAKER_SERVING_MODULE sagemaker_sklearn_container.serving:main
diff --git a/requirements.txt b/requirements.txt
index cbb1251..bc5eadb 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -6,7 +6,7 @@ itsdangerous==2.0.1
 gunicorn==20.0.4
 model-archiver==1.0.3
 multi-model-server==1.1.1
-numpy==1.21.0
+numpy==1.19.2
 pandas==1.1.3
 psutil==5.7.2
 python-dateutil==2.8.1
diff --git a/test/unit/test_modules.py b/test/unit/test_modules.py
index 1277993..d4e957e 100644
--- a/test/unit/test_modules.py
+++ b/test/unit/test_modules.py
@@ -1,4 +1,12 @@
+import pandas as pd
+
+
 def test_pandas_version():
     import pandas as pd
     major, minor, patch = pd.__version__.split('.')
     assert major == '1'
+
+
+def test_pyarrow_to_parquet_conversion_regression_issue_106(tmp_path):
+    df = pd.DataFrame({'x': [1, 2]})
+    df.to_parquet(str(tmp_path / 'test.parquet'), engine='pyarrow')