File: bernoulli_sampling.test_slow

package info (click to toggle)
duckdb 1.5.1-3
  • links: PTS, VCS
  • area: main
  • in suites:
  • size: 299,196 kB
  • sloc: cpp: 865,414; ansic: 57,292; python: 18,871; sql: 12,663; lisp: 11,751; yacc: 7,412; lex: 1,682; sh: 747; makefile: 564
file content (52 lines) | stat: -rw-r--r-- 945 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
# name: test/sql/sample/bernoulli_sampling.test_slow
# description: Test that 1% bernoulli samples of 1000 rows are never empty and that seeded bernoulli sampling is repeatable
# group: [sample]

# Results table: one row per sampling run, holding the number of rows that run returned.
statement ok
CREATE TABLE output (
    num_rows INTEGER
);

# Pin the random seed before sampling; the sample clause in the loop carries
# no seed of its own, so this is presumably what keeps the run reproducible.
set seed 0.3

# Repeat the same 1% bernoulli sample 500 times over 1000 distinct ids and
# record the size of every sample in output.
loop i 0 500

statement ok
WITH some_tab AS (
    SELECT UNNEST(range(1000)) AS id
),
some_tab_unq AS (
    SELECT DISTINCT id AS id
    FROM some_tab
),
sampled AS (
    SELECT id
    FROM some_tab_unq
    USING SAMPLE 1% (bernoulli)
)
INSERT INTO output (num_rows)
SELECT count(*) AS n_rows
FROM sampled;

endloop


# No recorded sample may be empty: the smallest row count in output must be
# positive, and the number of entries with a zero row count must be zero.
# FILTER uses the standard (WHERE ...) form rather than the shorthand that
# omits WHERE.
query II
SELECT
    min(num_rows) > 0,
    count(*) FILTER (WHERE num_rows = 0) = 0
FROM output;
----
true	true

# Diagnostic: summarise the rowids of any entries in output that recorded an
# empty sample. When there are none, the aggregates run over zero rows and
# each one yields NULL.
query III
SELECT
    avg(rowid),
    min(rowid),
    max(rowid)
FROM output
WHERE num_rows = 0;
----
NULL	NULL	NULL

# Base table with ids 0..999 for the repeatability check.
statement ok
CREATE TABLE t1 AS
SELECT range AS id
FROM range(1000);

set seed 0.6

# Both queries pass the same seed (5) to the bernoulli sample and share the
# label result_1, so the runner compares their results with each other
# instead of against a literal expected output.
query I nosort result_1
SELECT id
FROM t1
USING SAMPLE 1% (bernoulli, 5);
----

query I nosort result_1
SELECT id
FROM t1
USING SAMPLE 1% (bernoulli, 5);
----