From 707a99419710a3a890754855c62668f5d64744d5 Mon Sep 17 00:00:00 2001 From: ion-elgreco <15728914+ion-elgreco@users.noreply.github.com> Date: Thu, 1 Aug 2024 23:48:05 +0200 Subject: [PATCH] pyarrow 8 test compat --- python/tests/test_cdf.py | 21 +++++++++++++++------ 1 file changed, 15 insertions(+), 6 deletions(-) diff --git a/python/tests/test_cdf.py b/python/tests/test_cdf.py index 2774776eb9..6d02158c10 100644 --- a/python/tests/test_cdf.py +++ b/python/tests/test_cdf.py @@ -3,6 +3,7 @@ import pyarrow as pa import pyarrow.compute as pc +import pyarrow.dataset as ds import pyarrow.parquet as pq from deltalake import DeltaTable, write_deltalake @@ -437,9 +438,13 @@ def test_delete_unpartitioned_cdf(tmp_path, sample_data: pa.Table): dt = DeltaTable(tmp_path) dt.delete("int64 > 2") - expected_data = sample_data.filter(pc.field("int64") > 2).append_column( - field_=pa.field("_change_type", pa.string(), nullable=False), - column=[["delete"] * 2], + expected_data = ( + ds.dataset(sample_data) + .to_table(filter=(pc.field("int64") > 2)) + .append_column( + field_=pa.field("_change_type", pa.string(), nullable=False), + column=[["delete"] * 2], + ) ) cdc_data = pq.read_table(cdc_path) @@ -460,9 +465,13 @@ def test_delete_partitioned_cdf(tmp_path, sample_data: pa.Table): dt = DeltaTable(tmp_path) dt.delete("int64 > 2") - expected_data = sample_data.filter(pc.field("int64") > 2).append_column( - field_=pa.field("_change_type", pa.string(), nullable=False), - column=[["delete"] * 2], + expected_data = ( + ds.dataset(sample_data) + .to_table(filter=(pc.field("int64") > 2)) + .append_column( + field_=pa.field("_change_type", pa.string(), nullable=False), + column=[["delete"] * 2], + ) ) table_schema = dt.schema().to_pyarrow() table_schema = table_schema.insert(