File: sample_verification.test_slow

package info (click to toggle)
duckdb 1.5.1-3
  • links: PTS, VCS
  • area: main
  • in suites:
  • size: 299,196 kB
  • sloc: cpp: 865,414; ansic: 57,292; python: 18,871; sql: 12,663; lisp: 11,751; yacc: 7,412; lex: 1,682; sh: 747; makefile: 564
file content (43 lines) | stat: -rw-r--r-- 913 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
# name: test/sql/sample/sample_verification.test_slow
# description: Test SAMPLE keyword
# group: [sample]

# Turn on DuckDB's query verification for the statements that follow in this file.
statement ok
PRAGMA enable_verification;

# Sampling must be without replacement: drawing 5 rows from 10 distinct values
# has to produce 5 distinct values, i.e. no row may show up twice.
# The check is repeated 10 times; the query never references the loop variable
# (there is no ${i}) -- the `i` inside the query is the column alias of tbl.
loop i 0 10

query I
SELECT COUNT(DISTINCT i)
FROM range(10) AS tbl(i)
USING SAMPLE 5;
----
5

endloop

# With an explicit seed (250) every sampling method must be repeatable.
# The expected-result sections are intentionally empty: each query carries a
# label, and all 10 executions under the same label have to agree with each other.
loop i 0 10

query I nosort reservoirseed
SELECT *
FROM range(100)
USING SAMPLE 10 (reservoir, 250)
----

query I nosort bernoulliseed
SELECT *
FROM range(100)
USING SAMPLE 10% (bernoulli, 250)
----

query I nosort systemseed
SELECT *
FROM range(100)
USING SAMPLE 10% (system, 250)
----

endloop

# Sample size given as a percentage: with reservoir sampling the row count is
# exact, so 10% of 100 rows must be exactly 10 rows on each of the 10 runs.
loop i 0 10

query I
SELECT COUNT(*)
FROM range(100)
USING SAMPLE 10% (reservoir)
----
10

endloop