Skip to content

Commit

Permalink
add a test to capture the bug
Browse files: browse the repository at this point in the history
  • Loading branch information
Michael-J-Ward committed Sep 18, 2024
1 parent 6c8bf5f commit ef8d253
Showing 1 changed file with 18 additions and 0 deletions.
18 changes: 18 additions & 0 deletions python/datafusion/tests/test_context.py
Original file line number Diff line number Diff line change
Expand Up @@ -372,6 +372,24 @@ def test_dataset_filter(ctx, capfd):
assert result[0].column(1) == pa.array([-3])


def test_dataset_count(ctx):
    """Check row counts on a registered dataset via the DataFrame and SQL APIs.

    Covers `datafusion-python` issue:
    https://github.com/apache/datafusion-python/issues/800
    """
    # Two columns of three rows each, wrapped in a dataset and registered as "t".
    columns = [pa.array([1, 2, 3]), pa.array([4, 5, 6])]
    record_batch = pa.RecordBatch.from_arrays(columns, names=["a", "b"])
    ctx.register_dataset("t", ds.dataset([record_batch]))

    # DataFrame API: count() should report the three rows.
    assert ctx.table("t").count() == 3

    # SQL API: COUNT(*) should yield a single-value column equal to 3.
    sql_batches = ctx.sql("SELECT COUNT(*) FROM t").collect()
    assert sql_batches[0].column(0) == pa.array([3])

def test_pyarrow_predicate_pushdown_is_null(ctx, capfd):
"""Ensure that pyarrow filter gets pushed down for `IsNull`"""
# create a RecordBatch and register it as a pyarrow.dataset.Dataset
Expand Down

0 comments on commit ef8d253

Please sign in to comment.