File: test_strpos_collate.test

package info (click to toggle)
duckdb 1.5.1-3
  • links: PTS, VCS
  • area: main
  • in suites:
  • size: 299,196 kB
  • sloc: cpp: 865,414; ansic: 57,292; python: 18,871; sql: 12,663; lisp: 11,751; yacc: 7,412; lex: 1,682; sh: 747; makefile: 564
file content (176 lines) | stat: -rw-r--r-- 2,670 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
# name: test/sql/collate/test_strpos_collate.test
# description: Test that strpos/instr/position functions properly support COLLATE NOCASE
# group: [collate]

# Test that strpos works with COLLATE NOCASE.
# The collation is attached to the haystack literal only; the needle 'el'
# differs in case from 'HELLO'. Expected 2: the 1-based position of the match.
query I
SELECT strpos('HELLO' COLLATE NOCASE, 'el')
----
2

# Test with different case combinations of haystack and needle.
# Every variant below expects the same position (2).
# Uppercase haystack, uppercase needle.
query I
SELECT strpos('HELLO' COLLATE NOCASE, 'EL')
----
2

# Lowercase haystack, uppercase needle.
query I
SELECT strpos('hello' COLLATE NOCASE, 'EL')
----
2

# Mixed-case haystack, lowercase needle.
query I
SELECT strpos('HeLLo' COLLATE NOCASE, 'el')
----
2

# Test instr function (alias for strpos).
# Same argument order as strpos: instr(haystack, needle).
# Uppercase haystack, lowercase needle.
query I
SELECT instr('HELLO' COLLATE NOCASE, 'el')
----
2

# Lowercase haystack, uppercase needle.
query I
SELECT instr('hello' COLLATE NOCASE, 'EL')
----
2

# Test position function (alias for strpos).
# Uses the position(needle IN haystack) syntax, so the needle comes first here;
# the collated haystack is parenthesized inside the IN clause.
query I
SELECT position('el' IN ('HELLO' COLLATE NOCASE))
----
2

# Uppercase needle against a lowercase haystack.
query I
SELECT position('EL' IN ('hello' COLLATE NOCASE))
----
2

# Test edge cases with a collated haystack.
# Empty needle: expected result is 1.
query I
SELECT strpos('HELLO' COLLATE NOCASE, '')
----
1

# Needle that does not occur in the haystack: expected result is 0.
query I
SELECT strpos('HELLO' COLLATE NOCASE, 'xyz')
----
0

# Needle identical to the whole haystack: match at position 1.
query I
SELECT strpos('HELLO' COLLATE NOCASE, 'HELLO')
----
1

# Test with longer strings, where the match is not at the start.
# 'world' begins at the 7th character of 'Hello World'.
query I
SELECT strpos('Hello World' COLLATE NOCASE, 'world')
----
7

# Needle containing a space and spanning both words; match starts at the 'O'
# of 'HELLO' (5th character).
query I
SELECT strpos('HELLO WORLD' COLLATE NOCASE, 'o w')
----
5

# Test that other string functions still work (regression test).
# contains with a collated haystack and a needle that differs only in case.
query T
SELECT contains('HELLO' COLLATE NOCASE, 'hEllO')
----
true

# starts_with with a collated string and a prefix that differs only in case.
query T
SELECT starts_with('HELLO' COLLATE NOCASE, 'heL')
----
true

# Test with table data.
# The column s is declared with COLLATE NOCASE in the table definition.
statement ok
CREATE TABLE collate_test(s VARCHAR COLLATE NOCASE)

# Three rows holding the same text in different letter cases.
statement ok
INSERT INTO collate_test VALUES ('Hello World'), ('HELLO WORLD'), ('hElLo WoRlD')

# Test basic functionality on a column instead of a literal.
# Each row expects the same position, since the rows differ only in case.
# NOTE(review): every query below also applies an explicit COLLATE NOCASE to s,
# so the collation declared on the column is never exercised on its own --
# consider adding a strpos(s, ...) case without the explicit COLLATE.
# NOTE(review): the three values presumably compare equal under NOCASE, so
# ORDER BY s does not pin a row order; harmless here because all rows yield
# the same value.
query I
SELECT strpos(s COLLATE NOCASE, 'hello') FROM collate_test ORDER BY s
----
1
1
1

# Needle located in the second word of every row.
query I
SELECT strpos(s COLLATE NOCASE, 'world') FROM collate_test ORDER BY s
----
7
7
7

# Test with mixed collations: the collation may be attached to either argument.
# Both haystack and needle carry an explicit COLLATE NOCASE.
query I
SELECT strpos('HELLO' COLLATE NOCASE, 'el' COLLATE NOCASE)
----
2

# Only the needle carries COLLATE NOCASE; the haystack is a plain literal.
# The collation is expected to be combined across the arguments, so the
# search is still case-insensitive. (The haystack-only variant is covered by
# the basic strpos tests at the top of this file.)
query I
SELECT strpos('HELLO', 'el' COLLATE NOCASE)
----
2

# Test that non-collated versions still work.
# Without a collation the search is case-sensitive: lowercase 'el' is not
# found in 'HELLO', so the expected result is 0.
query I
SELECT strpos('HELLO', 'el')
----
0

# Needle with matching case is found at position 2.
query I
SELECT strpos('HELLO', 'EL')
----
2

# Test with empty strings and edge cases.
# Empty haystack and empty needle: expected result is 1.
query I
SELECT strpos('' COLLATE NOCASE, '')
----
1

# Empty haystack, non-empty needle: no match, expected result is 0.
query I
SELECT strpos('' COLLATE NOCASE, 'a')
----
0

# Single-character haystack, empty needle: expected result is 1.
query I
SELECT strpos('a' COLLATE NOCASE, '')
----
1

# Test with special (non-ASCII) characters.
# The accented character has the same case in haystack and needle; only the
# ASCII letters 'LL' / 'll' differ in case.
query I
SELECT strpos('HéLLO' COLLATE NOCASE, 'éll')
----
2

# The haystack uses uppercase 'É' while the needle uses lowercase 'é', so the
# match requires case-insensitive comparison of the non-ASCII character too.
query I
SELECT strpos('HÉLLO' COLLATE NOCASE, 'éll')
----
2

# Test that the fix doesn't break existing behavior.
# These queries use strpos without any COLLATE clause.
# Needle identical to the whole haystack: match at position 1.
query I
SELECT strpos('HELLO', 'HELLO')
----
1

# Empty needle: expected result is 1.
query I
SELECT strpos('HELLO', '')
----
1

# Needle that does not occur in the haystack: expected result is 0.
query I
SELECT strpos('HELLO', 'xyz')
----
0

# Clean up: drop the collate_test table created for the table-data tests.
statement ok
DROP TABLE collate_test