File: predicate_factoring.test

package info (click to toggle)
duckdb 1.5.1-3
  • links: PTS, VCS
  • area: main
  • in suites:
  • size: 299,196 kB
  • sloc: cpp: 865,414; ansic: 57,292; python: 18,871; sql: 12,663; lisp: 11,751; yacc: 7,412; lex: 1,682; sh: 747; makefile: 564
file content (120 lines) | stat: -rw-r--r-- 2,746 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
# name: test/sql/optimizer/predicate_factoring.test
# description: Test PredicateFactoringRule - extracts common single-column predicates from disjunctive clauses
# group: [optimizer]

# Run the rest of this file with verification enabled.
statement ok
PRAGMA enable_verification

# Fixture table t: three INTEGER columns, no constraints.
statement ok
CREATE TABLE t (
    a INTEGER,
    b INTEGER,
    c INTEGER
);

# Five rows: three with a=1, one with a=2, and one where a is NULL.
statement ok
INSERT INTO t (a, b, c) VALUES
    (1, 5, 3),
    (1, 2, 3),
    (1, 5, 11),
    (2, 5, 3),
    (NULL, 5, 3);

# Simplest case: the conjunct a=1 occurs in both OR branches and is the
# candidate to be factored out. Every a=1 row qualifies: (1,2,3) only through
# c<5, (1,5,11) only through b>3, and (1,5,3) through both.
query III rowsort
SELECT *
FROM t
WHERE (a = 1 AND b > 3)
   OR (a = 1 AND c < 5)
----
1	2	3
1	5	11
1	5	3

# The physical plan text must contain `Filters: a=1`, i.e. the factored
# predicate is expected to show up as a filter pushed into the scan.
query II
EXPLAIN
SELECT *
FROM t
WHERE (a = 1 AND b > 3)
   OR (a = 1 AND c < 5)
----
physical_plan	<REGEX>:.*Filters: a=1.*

# Same idea with a different shared conjunct: b=5 is in both branches while
# the predicate on a differs. (1,2,3) fails b=5; the NULL row has b=5 but
# neither a=1 nor a=2 is true for it.
query III rowsort
SELECT *
FROM t
WHERE (a = 1 AND b = 5)
   OR (a = 2 AND b = 5)
----
1	5	11
1	5	3
2	5	3

# b=5 must appear somewhere after a `Filters:` label in the physical plan.
query II
EXPLAIN
SELECT *
FROM t
WHERE (a = 1 AND b = 5)
   OR (a = 2 AND b = 5)
----
physical_plan	<REGEX>:.*Filters:.*b=5.*

# Two shared conjuncts at once: a=1 and b=5 are present in both branches; only
# the predicate on c differs. Both rows with a=1 and b=5 satisfy c>2.
query III rowsort
SELECT *
FROM t
WHERE (a = 1 AND b = 5 AND c > 2)
   OR (a = 1 AND b = 5 AND c < 6)
----
1	5	11
1	5	3

# Both factored predicates must be listed after `Filters:`, with a=1 appearing
# before b=5 in the plan text.
query II
EXPLAIN
SELECT *
FROM t
WHERE (a = 1 AND b = 5 AND c > 2)
   OR (a = 1 AND b = 5 AND c < 6)
----
physical_plan	<REGEX>:.*Filters:.*a=1.*b=5.*

# Disjunction with three branches, each of which contains a=1.
# All three a=1 rows match at least one branch.
query III rowsort
SELECT *
FROM t
WHERE (a = 1 AND b = 5)
   OR (a = 1 AND c > 2)
   OR (a = 1 AND b = 2)
----
1	2	3
1	5	11
1	5	3

# As in the two-branch case, the plan text must contain `Filters: a=1`.
query II
EXPLAIN
SELECT *
FROM t
WHERE (a = 1 AND b = 5)
   OR (a = 1 AND c > 2)
   OR (a = 1 AND b = 2)
----
physical_plan	<REGEX>:.*Filters: a=1.*

# Negative case: the two branches share no conjunct (a=1 vs a=2, b>3 vs c<5),
# so there is nothing to factor out. Only the result set is asserted here; the
# plan is not inspected. (1,2,3) is rejected because b>3 fails and a is not 2.
query III rowsort
SELECT *
FROM t
WHERE (a = 1 AND b > 3)
   OR (a = 2 AND c < 5)
----
1	5	11
1	5	3
2	5	3

# Plain OR over a single column: the rule is not meant to fire because such a
# predicate is already pushable as-is. Only the result set is asserted here.
# Every row except the one with a NULL in column a is returned.
query III rowsort
SELECT *
FROM t
WHERE a = 1
   OR a = 2
----
1	2	3
1	5	11
1	5	3
2	5	3

# NULL semantics: the row (NULL, 5, 3) satisfies both b=5 and c=3, but a=1
# evaluates to NULL for it, so it must stay out of the result whether or not
# a=1 has been factored out.
query III rowsort
SELECT *
FROM t
WHERE (a = 1 AND b = 5)
   OR (a = 1 AND c = 3)
----
1	2	3
1	5	11
1	5	3

# The same disjunction used as a SELECT-list expression rather than a filter;
# the rule targets filters only, so this just checks the computed values.
# Per row: the three a=1 rows give true (1), the a=2 row gives false (0), and
# the row with a NULL in column a gives NULL.
query I rowsort
SELECT (a = 1 AND b > 3) OR (a = 1 AND c < 5)
FROM t
----
0
1
1
1
NULL

# Predicate factoring in a cross join condition.
# Both t.a=1 and s.x=1 appear in every disjunct of the WHERE clause below, so
# each table has its own common single-column predicate.
# Second fixture table s with two INTEGER columns.
statement ok
CREATE TABLE s (x INTEGER, y INTEGER);

# Three rows: two with x=1 (y=10 and y=30) and one with x=2.
statement ok
INSERT INTO s VALUES (1, 10), (2, 20), (1, 30);

# Expected rows: the three a=1 rows of t paired with the two x=1 rows of s,
# except the pair t=(1,2,3), s=(1,30), which satisfies neither t.b>3 nor s.y<20.
query IIIII rowsort
SELECT t.a, t.b, t.c, s.x, s.y FROM t, s WHERE (t.a=1 AND s.x=1 AND t.b>3) OR (t.a=1 AND s.x=1 AND s.y<20)
----
1	2	3	1	10
1	5	11	1	10
1	5	11	1	30
1	5	3	1	10
1	5	3	1	30

# The regex requires a `Filters: x=1` entry followed later in the plan text by
# a `Filters: a=1` entry, so this check also depends on the order in which the
# two filter lists are rendered in the physical plan.
query II
EXPLAIN SELECT t.a, t.b, t.c, s.x, s.y FROM t, s WHERE (t.a=1 AND s.x=1 AND t.b>3) OR (t.a=1 AND s.x=1 AND s.y<20)
----
physical_plan	<REGEX>:.*Filters: x=1.*Filters: a=1.*