From 76bdb82a12440beda0d256bc92d12d59e668e939 Mon Sep 17 00:00:00 2001 From: "Richard (Rick) Zamora" Date: Wed, 25 Oct 2023 16:32:10 -0500 Subject: [PATCH] Run IO tests for Dask-cuDF (#14327) We are not currently running any IO tests for `dask_cudf` in CI. This PR should correct this. It also modifies a test that *would* be failing due to https://github.com/rapidsai/cudf/issues/14326 Authors: - Richard (Rick) Zamora (https://github.com/rjzamora) - GALI PREM SAGAR (https://github.com/galipremsagar) Approvers: - GALI PREM SAGAR (https://github.com/galipremsagar) - Ray Douglass (https://github.com/raydouglass) URL: https://github.com/rapidsai/cudf/pull/14327 --- ci/test_wheel_dask_cudf.sh | 3 ++- python/dask_cudf/dask_cudf/io/tests/test_parquet.py | 4 +++- 2 files changed, 5 insertions(+), 2 deletions(-) diff --git a/ci/test_wheel_dask_cudf.sh b/ci/test_wheel_dask_cudf.sh index 01019bb7598..8c4ab696249 100755 --- a/ci/test_wheel_dask_cudf.sh +++ b/ci/test_wheel_dask_cudf.sh @@ -16,4 +16,5 @@ python -m pip install git+https://github.com/dask/dask.git@2023.9.2 git+https:// # echo to expand wildcard before adding `[extra]` requires for pip python -m pip install $(echo ./dist/dask_cudf*.whl)[test] -python -m pytest -n 8 ./python/dask_cudf/dask_cudf/tests +# Run tests in dask_cudf/tests and dask_cudf/io/tests +python -m pytest -n 8 ./python/dask_cudf/dask_cudf/ diff --git a/python/dask_cudf/dask_cudf/io/tests/test_parquet.py b/python/dask_cudf/dask_cudf/io/tests/test_parquet.py index 85ec36cf2c5..234b8fc5212 100644 --- a/python/dask_cudf/dask_cudf/io/tests/test_parquet.py +++ b/python/dask_cudf/dask_cudf/io/tests/test_parquet.py @@ -481,7 +481,9 @@ def test_create_metadata_file_inconsistent_schema(tmpdir): # call `compute` on `ddf1`, because the dtype of # the inconsistent column ("a") may be "object" # before computing, and "int" after - dd.assert_eq(ddf1.compute(), ddf2) + # TODO: Uncomment after cudf#14326 is closed + # (See: https://github.com/rapidsai/cudf/issues/14326) + # dd.assert_eq(ddf1.compute(), ddf2) dd.assert_eq(ddf1.compute(), ddf2.compute())