Files
email-tracker/external/duckdb/test/parquet/parquet_combine.test
2025-10-24 19:21:19 -05:00

34 lines
985 B
SQL

# name: test/parquet/parquet_combine.test
# description: Test Parquet Reader row group combining
# group: [parquet]

require parquet

require vector_size 2048

# run with more than one thread: the behaviour under test is how data
# coming from different threads is combined into row groups on write
statement ok
set threads=2;

# each side of the UNION ALL produces 2049 rows (4098 in total), one more
# than fits in a single row group of 2048 rows.
# before we combined data from threads into multiple row groups,
# this would create 4 row groups (2048 + 1 per side), now it should
# create 3 (2048 + 2048 + 2)
statement ok
copy (with cte as (from range(2049) union all from range(2049)) from cte) to '__TEST_DIR__/parquet_combine.parquet' (row_group_size 2048);

# parquet_metadata returns one row per column per row group; the file has a
# single column, so count(*) is the number of row groups
query I
select count(*) from parquet_metadata('__TEST_DIR__/parquet_combine.parquet')
----
3

# works not just with row_group_size, but also with row_group_size_bytes
statement ok
set preserve_insertion_order=false;

# overwrites the file written above, this time limiting row groups by size
# in bytes instead of by row count.
# used to create 4, now it should create 3
statement ok
copy (with cte as (from range(100_000) union all from range(100_000)) from cte) to '__TEST_DIR__/parquet_combine.parquet' (row_group_size_bytes 750_000);

# single-column file again, so count(*) is the number of row groups
query I
select count(*) from parquet_metadata('__TEST_DIR__/parquet_combine.parquet')
----
3