1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43
|
# name: test/sql/sample/sample_verification.test_slow
# description: Test SAMPLE keyword
# group: [sample]
statement ok
PRAGMA enable_verification;

# verify that it is a sample without replacement (i.e. the same row will never occur more than once in the result)
# range(10) contains 10 distinct values, so a 5-row sample without replacement must contain exactly 5 distinct values
# the check is repeated 10 times because each run draws a fresh unseeded sample
loop i 0 10

query I
select count(distinct i) from range(10) tbl(i) using sample 5;
----
5

endloop

# specifying a seed leads to repeatable behavior
# every query below passes the fixed seed 250; the "nosort <label>" form records no literal expected rows,
# instead the runner compares the results of all executions that share the same label across the 10 iterations
loop i 0 10

query I nosort reservoirseed
select * from range(100) using sample 10 (reservoir, 250)
----

query I nosort bernoulliseed
select * from range(100) using sample 10% (bernoulli, 250)
----

query I nosort systemseed
select * from range(100) using sample 10% (system, 250)
----

endloop

# specify the sample size as a percentage: with reservoir sampling this should give us an exact count
# (i.e. 10% of the 100 rows in range(100) is always 10)
loop i 0 10

query I
select count(*) from range(100) using sample 10% (reservoir)
----
10

endloop
|