Files
email-tracker/external/duckdb/test/sql/sample/bernoulli_sampling.test_slow
2025-10-24 19:21:19 -05:00

53 lines
945 B
Plaintext

# name: test/sql/sample/bernoulli_sampling.test_slow
# description: Test reservoir sample crash on large data sets
# group: [sample]
statement ok
create table output (num_rows INT);
set seed 0.3
loop i 0 500
statement ok
WITH some_tab AS (
SELECT UNNEST(range(1000)) AS id
),
some_tab_unq AS (
SELECT distinct(id) AS id FROM some_tab
),
sampled AS (
select id from some_tab_unq
USING SAMPLE 1% (bernoulli)
)
INSERT INTO output select count(*) as n_rows FROM sampled;
endloop
query II
select min(num_rows) > 0, count(*) FILTER (num_rows = 0) = 0 from output;
----
true true
query III
select avg(rowid), min(rowid), max(rowid) from output where num_rows = 0;
----
NULL NULL NULL
statement ok
create table t1 as select range id from range(1000);
set seed 0.6
query I nosort result_1
select id from t1 USING SAMPLE 1% (bernoulli, 5);
----
query I nosort result_1
select id from t1 USING SAMPLE 1% (bernoulli, 5);
----