File: test_ignore_nulls.test

package info (click to toggle)
duckdb 1.5.1-2
  • links: PTS, VCS
  • area: main
  • in suites:
  • size: 299,196 kB
  • sloc: cpp: 865,414; ansic: 57,292; python: 18,871; sql: 12,663; lisp: 11,751; yacc: 7,412; lex: 1,682; sh: 747; makefile: 558
file content (354 lines) | stat: -rw-r--r-- 5,816 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
# name: test/sql/window/test_ignore_nulls.test
# description: Test IGNORE NULLS window syntax
# group: [window]

# Turn on query verification for the remainder of this test file.
statement ok
PRAGMA enable_verification

# Issue #2549
# Fixture: five rows for a single user (user_id = 1), keyed by id 0..4.
# order_id is NULL for ids 1 and 2, giving a run of NULLs between non-NULL values.
statement ok
CREATE TABLE issue2549 AS SELECT * FROM (VALUES
	(0, 1, 614),
	(1, 1, null),
	(2, 1, null),
	(3, 1, 639),
	(4, 1, 2027)
) tbl(id, user_id, order_id);

# LAST_VALUE with IGNORE NULLS over all rows strictly before the current one:
# the NULL order_ids at ids 1 and 2 are skipped, so ids 1-3 all see 614.
# The first row has an empty frame and therefore yields NULL.
query IIII
SELECT
  id,
  user_id,
  order_id,
  LAST_VALUE (order_id IGNORE NULLS) over (
    PARTITION BY user_id
    ORDER BY id
    ROWS BETWEEN UNBOUNDED PRECEDING AND 1 PRECEDING
  ) AS last_order_id
FROM issue2549
ORDER BY ALL
----
0	1	614	NULL
1	1	NULL	614
2	1	NULL	614
3	1	639	614
4	1	2027	639

# FIRST_VALUE with IGNORE NULLS over a frame running from the previous row to
# the end of the partition: each row gets the first non-NULL order_id in that frame.
query IIII
SELECT
  id,
  user_id,
  order_id,
  FIRST_VALUE (order_id IGNORE NULLS) over (
    PARTITION BY user_id
    ORDER BY id
    ROWS BETWEEN 1 PRECEDING AND UNBOUNDED FOLLOWING
  ) AS first_order_id
FROM issue2549
ORDER BY ALL
----
0	1	614	614
1	1	NULL	614
2	1	NULL	639
3	1	639	639
4	1	2027	639

# NTH_VALUE(…, 2) with IGNORE NULLS over all rows strictly before the current one:
# only the last row has two non-NULL predecessors (614, 639), so only it is non-NULL.
query IIII
SELECT
  id,
  user_id,
  order_id,
  NTH_VALUE (order_id, 2 IGNORE NULLS) over (
    PARTITION BY user_id
    ORDER BY id
    ROWS BETWEEN UNBOUNDED PRECEDING AND 1 PRECEDING
  ) AS second_order_id
FROM issue2549
ORDER BY ALL
----
0	1	614	NULL
1	1	NULL	NULL
2	1	NULL	NULL
3	1	639	NULL
4	1	2027	639

# LEAD by one with IGNORE NULLS: each row gets the next non-NULL order_id;
# the last row has no successor and falls back to the default of -1.
query IIII
SELECT
  id,
  user_id,
  order_id,
  LEAD(order_id, 1, -1 IGNORE NULLS) over (
    PARTITION BY user_id
    ORDER BY id
  ) AS next_order_id
FROM issue2549
ORDER BY ALL
----
0	1	614	639
1	1	NULL	639
2	1	NULL	639
3	1	639	2027
4	1	2027	-1

# LAG by one with IGNORE NULLS: each row gets the previous non-NULL order_id;
# the first row has no predecessor and falls back to the default of -1.
query IIII
SELECT
  id,
  user_id,
  order_id,
  LAG(order_id, 1, -1 IGNORE NULLS) over (
    PARTITION BY user_id
    ORDER BY id
  ) AS prev_order_id
FROM issue2549
ORDER BY ALL
----
0	1	614	-1
1	1	NULL	614
2	1	NULL	614
3	1	639	614
4	1	2027	639

# Zero LAG is always identity
# Even with IGNORE NULLS, an offset of 0 returns the current row's own value:
# NULL rows stay NULL and the -1 default is never used.
query IIII
SELECT
  id,
  user_id,
  order_id,
  LAG(order_id, 0, -1 IGNORE NULLS) over (
    PARTITION BY user_id
    ORDER BY id
  ) AS same_order_id
FROM issue2549
ORDER BY ALL
----
0	1	614	614
1	1	NULL	NULL
2	1	NULL	NULL
3	1	639	639
4	1	2027	2027

#
# RESPECT NULLS should be the default
#
# The queries in this section repeat the IGNORE NULLS cases above with an
# explicit RESPECT NULLS modifier, so NULL order_ids are returned as-is.
# LAST_VALUE over all rows strictly before the current one: ids 2 and 3 now
# see the NULL of the immediately preceding row instead of 614.
query IIII
SELECT
  id,
  user_id,
  order_id,
  LAST_VALUE (order_id RESPECT NULLS) over (
    PARTITION BY user_id
    ORDER BY id
    ROWS BETWEEN UNBOUNDED PRECEDING AND 1 PRECEDING
  ) AS last_order_id
FROM issue2549
ORDER BY ALL
----
0	1	614	NULL
1	1	NULL	614
2	1	NULL	NULL
3	1	639	NULL
4	1	2027	639

# FIRST_VALUE with RESPECT NULLS over all rows strictly before the current one:
# the frame always starts at id 0, so every row after the first sees 614.
query IIII
SELECT
  id,
  user_id,
  order_id,
  FIRST_VALUE (order_id RESPECT NULLS) over (
    PARTITION BY user_id
    ORDER BY id
    ROWS BETWEEN UNBOUNDED PRECEDING AND 1 PRECEDING
  ) AS first_order_id
FROM issue2549
ORDER BY ALL
----
0	1	614	NULL
1	1	NULL	614
2	1	NULL	614
3	1	639	614
4	1	2027	614

# NTH_VALUE(…, 2) with RESPECT NULLS over all rows strictly before the current one:
# the second row of the frame is id 1, whose order_id is NULL, so every result is NULL.
query IIII
SELECT
  id,
  user_id,
  order_id,
  NTH_VALUE (order_id, 2 RESPECT NULLS) over (
    PARTITION BY user_id
    ORDER BY id
    ROWS BETWEEN UNBOUNDED PRECEDING AND 1 PRECEDING
  ) AS second_order_id
FROM issue2549
ORDER BY ALL
----
0	1	614	NULL
1	1	NULL	NULL
2	1	NULL	NULL
3	1	639	NULL
4	1	2027	NULL

# LEAD by one with RESPECT NULLS: each row gets the next row's order_id, NULL or not;
# the -1 default is used only for the last row, which has no successor.
query IIII
SELECT
  id,
  user_id,
  order_id,
  LEAD(order_id, 1, -1 RESPECT NULLS) over (
    PARTITION BY user_id
    ORDER BY id
  ) AS next_order_id
FROM issue2549
ORDER BY ALL
----
0	1	614	NULL
1	1	NULL	NULL
2	1	NULL	639
3	1	639	2027
4	1	2027	-1

# LAG by one with RESPECT NULLS: each row gets the previous row's order_id, NULL or not;
# the -1 default is used only for the first row, which has no predecessor.
query IIII
SELECT
  id,
  user_id,
  order_id,
  LAG(order_id, 1, -1 RESPECT NULLS) over (
    PARTITION BY user_id
    ORDER BY id
  ) AS prev_order_id
FROM issue2549
ORDER BY ALL
----
0	1	614	-1
1	1	NULL	614
2	1	NULL	NULL
3	1	639	NULL
4	1	2027	639

# Zero LAG is always identity
# With RESPECT NULLS an offset of 0 returns the current row's own value:
# NULL rows stay NULL and the -1 default is never used.
query IIII
SELECT
  id,
  user_id,
  order_id,
  LAG(order_id, 0, -1 RESPECT NULLS) over (
    PARTITION BY user_id
    ORDER BY id
  ) AS same_order_id
FROM issue2549
ORDER BY ALL
----
0	1	614	614
1	1	NULL	NULL
2	1	NULL	NULL
3	1	639	639
4	1	2027	2027

# Edge cases for FIRST/LAST/NTH_VALUE
# Fixture: seven rows keyed by index 1..7; data is NULL for indexes 3, 4, 6 and 7,
# so the table ends with a run of NULLs.
statement ok
CREATE TABLE IF NOT EXISTS issue6635(index INTEGER, data INTEGER);

# Values are positional: (index, data).
statement ok
insert into issue6635 values 
	(1,1),
	(2,2),
	(3,NULL),
	(4,NULL),
	(5,5),
	(6,NULL),
	(7,NULL)
;

# first/last/nth_value with IGNORE NULLS over a frame that starts after the
# current row. From index 5 onwards the frame holds only NULLs (or no rows),
# so all three functions return NULL.
# The outer ORDER BY pins the row order that the expected output below relies on.
query IIIII
SELECT *,
	first(data IGNORE NULLS) OVER w,
	last(data IGNORE NULLS) OVER w,
	nth_value(data, 1 IGNORE NULLS) OVER w
FROM issue6635
WINDOW w AS (
	ORDER BY index
	ROWS BETWEEN 1 FOLLOWING
	 AND UNBOUNDED FOLLOWING
)
ORDER BY index
;
----
1	1	2	5	2
2	2	5	5	5
3	NULL	5	5	5
4	NULL	5	5	5
5	5	NULL	NULL	NULL
6	NULL	NULL	NULL	NULL
7	NULL	NULL	NULL	NULL

# Multiple blocks for ignore nulls
# gen: ids 1..10000, each with a deterministic pseudo-random rnd derived from id.
# lvl: labels a row 'shallow' (rnd <= 0.1) or 'high' (rnd >= 0.9); every other
#      row gets a NULL water_level because the CASE has no ELSE.
# The final query fills each row with LAST_VALUE(water_level IGNORE NULLS) in id order.
# The output (10000 rows x 4 columns) is compared by hash rather than row by row.
# NOTE(review): "multiple blocks" presumably refers to the input spanning several
# internal processing chunks - confirm against the engine's vector size.
query IIII
WITH gen AS (
    SELECT *,
        ((id * 1327) % 9973) / 10000.0 AS rnd
    FROM generate_series(1, 10000) tbl(id)
),
lvl AS (
    SELECT id,
        rnd,
        CASE
            WHEN rnd <= 0.1 THEN 'shallow'
            WHEN rnd >= 0.9 THEN 'high'
        END AS water_level
    FROM gen
)
SELECT *,
    LAST_VALUE(water_level IGNORE NULLS) OVER (
        ORDER BY id
    ) AS grade
FROM lvl
ORDER BY id
----
40000 values hashing to c302c8b0f3c10c1e5cc7211c4af7a8d6

# Independent IGNORE/RESPECT NULLS with shared input.
# Both LEAD calls read the same column over the same ordering; only the second
# one skips NULLs, so the two result columns must be computed independently.
# The outer ORDER BY pins the row order that the expected output below relies on.
query III
SELECT
	v,
	lead(v) OVER (ORDER BY id),
	lead(v IGNORE NULLS) OVER (ORDER BY id)
FROM (VALUES
	(1, 1),
	(2, NULL),
	(3, 2),
	(4, NULL),
	(5, 3),
	(6, NULL)
) tbl(id, v)
ORDER BY id;
----
1	NULL	2
NULL	2	2
2	NULL	3
NULL	3	3
3	NULL	NULL
NULL	NULL	NULL

#
# Unsupported
#
# Each check below is expected to fail with a parser error. The loop runs the
# checks twice, substituting IGNORE and then RESPECT for ${modifier}.

foreach modifier IGNORE RESPECT

# Regular function
# A scalar function call outside any window must reject the modifier.
statement error
SELECT ABS(x ${modifier} NULLS) FROM range(10) tbl(x)
----
Parser Error: RESPECT/IGNORE NULLS is not supported for non-window functions

# Aggregate function
# A plain (non-windowed) aggregate must reject the modifier with the same message.
statement error
SELECT SUM(x ${modifier} NULLS)
FROM range(10) tbl(x)
----
Parser Error: RESPECT/IGNORE NULLS is not supported for non-window functions

# Windowed aggregate
# An aggregate used with OVER is rejected as well, with its own error message.
statement error
SELECT SUM(x ${modifier} NULLS) OVER (PARTITION BY (x / 3) ORDER BY x % 3)
FROM range(10) tbl(x)
----
Parser Error: RESPECT/IGNORE NULLS is not supported for windowed aggregates

endloop