File: 101_delimited.t

package info (click to toggle)
libregexp-common-perl 2024080801-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 1,328 kB
  • sloc: perl: 17,842; makefile: 2
file content (307 lines) | stat: -rwxr-xr-x 12,484 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
#!/opt/perl/bin/perl

use strict;
use warnings;
no  warnings 'syntax';

use Regexp::Common;
use Test::More;

my $r = eval "require Test::Regexp; 1";

unless ($r) {
    print "1..0 # SKIP Test::Regexp not found\n";
    exit;
}

sub make_test {
    my ($name, $pat) = @_;
    my $keep = $$pat {-keep};
    Test::Regexp::   -> new -> init (
        pattern      => $pat,
        keep_pattern => $keep,
        name         => $name,
    );
}


#
# Test double quoted delimiter
#
{
    my $test = make_test "Double quoted string" =>
                         $RE {delimited} {-delim => '"'};

    $test -> match (q {"a few words"},
                   [q {"a few words"}, q {"}, q {a few words}, q {"}],
                   test => "Simple string"),
    $test -> match (q {"a few \ words"},
                   [q {"a few \ words"}, q {"}, q {a few \ words}, q {"}],
                   test => "Simple string with escape"),
    $test -> match (q {"a few \" words"},
                   [q {"a few \" words"}, q {"}, q {a few \" words}, q {"}],
                   test => "Simple string with escaped delimiter"),
    $test -> match (q {"a 'few' words"},
                   [q {"a 'few' words"}, q {"}, q {a 'few' words}, q {"}],
                   test => "Simple string with single quotes"),

    $test -> no_match (q {'a few words'}, reason => "Wrong delimiters");
    $test -> no_match (q {a few words"}, reason => "No opening delimiter");
    $test -> no_match (q {"a few words}, reason => "No closing delimiter");
    $test -> no_match (q {"a few" words"}, reason => "Unescaped delimiter");
    $test -> no_match (q {"a few\\\\" words"}, reason => "Escaped escape");
    $test -> no_match (q { "a few words"},
                       reason => "Characters before opening delimiter");
    $test -> no_match (q {"a few words" },
                       reason => "Characters after opening delimiter");
}


#
# Test single quoted delimiter
#
{
    my $test = make_test "Single quoted string" =>
                         $RE {delimited} {-delim => "'"};

    $test -> match (q {'a few words'},
                   [q {'a few words'}, q {'}, q {a few words}, q {'}],
                   test => "Simple string"),
    $test -> match (q {'a few \ words'},
                   [q {'a few \ words'}, q {'}, q {a few \ words}, q {'}],
                   test => "Simple string with escape"),
    $test -> match (q {'a few \' words'},
                   [q {'a few \' words'}, q {'}, q {a few \' words}, q {'}],
                   test => "Simple string with escaped delimiter"),
    $test -> match (q {'a "few" words'},
                   [q {'a "few" words'}, q {'}, q {a "few" words}, q {'}],
                   test => "Simple string with double quotes"),

    $test -> no_match (q {"a few words"}, reason => "Wrong delimiters");
    $test -> no_match (q {a few words'}, reason => "No opening delimiter");
    $test -> no_match (q {'a few words}, reason => "No closing delimiter");
    $test -> no_match (q {'a few' words'}, reason => "Unescaped delimiter");
    $test -> no_match (q {'a few\\\\' words'}, reason => "Escaped escape");
    $test -> no_match (q { 'a few words'},
                       reason => "Characters before opening delimiter");
    $test -> no_match (q {'a few words' },
                       reason => "Characters after opening delimiter");
}


#
# Test an odd (space) delimiter
#
{
    my $test = make_test "Space quoted string" =>
                         $RE {delimited} {-delim => " "};

    $test -> match (q { a-few-words },
                   [q { a-few-words }, q { }, q {a-few-words}, q { }],
                   test => "Simple string"),
    $test -> match (q { a-few-\-words },
                   [q { a-few-\-words }, q { }, q {a-few-\-words}, q { }],
                   test => "Simple string with escape"),
    $test -> match (q { a-few-\ -words },
                   [q { a-few-\ -words }, q { }, q {a-few-\ -words}, q { }],
                   test => "Simple string with escaped delimiter"),

    $test -> no_match (q {"a few words"}, reason => "Wrong delimiters");
}


#
# Test $RE {quoted}. This automatically tests multiple delimiters as well.
#
{
    my $test = make_test "Quoted string (using 'quoted')" => $RE {quoted};

    $test -> match (q {"a few words"},
                   [q {"a few words"}, q {"}, q {a few words}, q {"}],
                   test => "Simple string, using double quotes"),
    $test -> match (q {'a few words'},
                   [q {'a few words'}, q {'}, q {a few words}, q {'}],
                   test => "Simple string, using single quotes"),
    $test -> match (q {`a few words`},
                   [q {`a few words`}, q {`}, q {a few words}, q {`}],
                   test => "Simple string, using backticks"),
    $test -> match (q {"a few \ words"},
                   [q {"a few \ words"}, q {"}, q {a few \ words}, q {"}],
                   test => "Double quoted string with escape"),
    $test -> match (q {'a few \ words'},
                   [q {'a few \ words'}, q {'}, q {a few \ words}, q {'}],
                   test => "Single quoted string with escape"),
    $test -> match (q {`a few \ words`},
                   [q {`a few \ words`}, q {`}, q {a few \ words}, q {`}],
                   test => "Backtick quoted string with escape"),
    $test -> match (q {"a few \" words"},
                   [q {"a few \" words"}, q {"}, q {a few \" words}, q {"}],
                   test => "Double quoted string with escaped delimiter"),
    $test -> match (q {'a few \' words'},
                   [q {'a few \' words'}, q {'}, q {a few \' words}, q {'}],
                   test => "Single quoted string with escaped delimiter"),
    $test -> match (q {`a few \` words`},
                   [q {`a few \` words`}, q {`}, q {a few \` words}, q {`}],
                   test => "Backtick quoted string with escaped delimiter"),
    $test -> match (q {"a 'few' words"},
                   [q {"a 'few' words"}, q {"}, q {a 'few' words}, q {"}],
                   test => "Double quoted string with single quotes"),
    $test -> match (q {'a "few" words'},
                   [q {'a "few" words'}, q {'}, q {a "few" words}, q {'}],
                   test => "Single quoted string with double quotes"),
    $test -> match (q {`a "few" words`},
                   [q {`a "few" words`}, q {`}, q {a "few" words}, q {`}],
                   test => "Backtick quoted string with double quotes"),

    $test -> no_match (q {'a few words"}, reason => "Mixed delimiters");
    $test -> no_match (q {'a few words`}, reason => "Mixed delimiters");
    $test -> no_match (q {"a few words`}, reason => "Mixed delimiters");
    $test -> no_match (q {"a few words'}, reason => "Mixed delimiters");
    $test -> no_match (q {`a few words"}, reason => "Mixed delimiters");
    $test -> no_match (q {`a few words'}, reason => "Mixed delimiters");
}


#
# Test an another delimiter
#
{
    my $test = make_test "Bang as delimiter" =>
                         $RE {delimited} {-delim => '"'} {-esc => '!'};

    $test -> match (q {"a few words"},
                   [q {"a few words"}, q {"}, q {a few words}, q {"}],
                   test => "Simple string"),
    $test -> match (q {"a few ! words"},
                   [q {"a few ! words"}, q {"}, q {a few ! words}, q {"}],
                   test => "Simple string with escape"),
    $test -> match (q {"a few !" words"},
                   [q {"a few !" words"}, q {"}, q {a few !" words}, q {"}],
                   test => "Simple string with escaped delimiter"),

    $test -> no_match (q {"a few\" words"}, reason => "Incorrect escape");
    $test -> no_match (q {"a few!!" words"}, reason => "Escaped escape");
}



#
# Test delimiter and escape the same characters
#
{
    my $test = make_test "Delimiter is same as escape" =>
                         $RE {delimited} {-delim => '!'} {-esc => '!'};

    $test -> match (q {!a few words!},
                   [q {!a few words!}, q {!}, q {a few words}, q {!}],
                   test => "Simple string"),
    $test -> match (q {!a few !! words!},
                   [q {!a few !! words!}, q {!}, q {a few !! words}, q {!}],
                   test => "Simple string with escaped delimiter"),

    $test -> no_match (q {!a few\! words!}, reason => "Incorrect escape");
    $test -> no_match (q {!a few! words!},
                       reason => "Escape must be followed by delimiter");
}


#
# Test multiple escapes; they should match up with the delimiters
#
{
    my $test = make_test "Multiple escape characters" =>
                         $RE {quoted} {-esc => '!_'};

    $test -> match (q {"a few words"},
                   [q {"a few words"}, q {"}, q {a few words}, q {"}],
                   test => "Simple string");
    $test -> match (q {"a !"few words"},
                   [q {"a !"few words"}, q {"}, q {a !"few words}, q {"}],
                   test => "Simple string, with escape");
    $test -> match (q {'a _'few words'},
                   [q {'a _'few words'}, q {'}, q {a _'few words}, q {'}],
                   test => "Simple string, with another delimiter/escape");
    $test -> match (q {`a _`few words`},
                   [q {`a _`few words`}, q {`}, q {a _`few words}, q {`}],
                   test => "Escape copied when there are more delimiters");

    $test -> no_match (q {"a _"few words"}, reason => "Incorrect delimiter");
    $test -> no_match (q {'a !'few words'}, reason => "Incorrect delimiter");
    $test -> no_match (q {`a !`few words`}, reason => "Incorrect delimiter");
    $test -> no_match (q {"a \"few words"}, reason => "Incorrect delimiter");
}


#
# Test no escape character
#
{
    my $test = make_test "Double quoted string" =>
                         $RE {delimited} {-delim => '"'} {-esc =>};

    $test -> match (q {"a few words"},
                   [q {"a few words"}, q {"}, q {a few words}, q {"}],
                   test => "Simple string"),

    $test -> no_match (q {"a few" words"}, reason => "Delimiter in string");
    $test -> no_match (q {"a few\" words"}, reason => "There is no escape");
}


#
# Test different closing delimiters
#
{
    my $test = make_test "Bracketed strings" =>
                         $RE {delimited} { -delim => '([{<'} 
                                         {-cdelim => ')]}>'};

    $test -> match ("(a few words)",
                   ["(a few words)", "(", "a few words", ")"],
                   test => "Using parenthesis");
    $test -> match ("[a few words]",
                   ["[a few words]", "[", "a few words", "]"],
                   test => "Using brackets");
    $test -> match ("{a few words}",
                   ["{a few words}", "{", "a few words", "}"],
                   test => "Using braces");
    $test -> match ("<a few words>",
                   ["<a few words>", "<", "a few words", ">"],
                   test => "Using angle brackets");
    $test -> match ("[a [few words]",
                   ["[a [few words]", "[", "a [few words", "]"],
                   test => "Opening delimiter needs no escape");
    $test -> match ('[a [few\] words]',
                   ['[a [few\] words]', "[", 'a [few\] words', "]"],
                   test => "Closing delimiter needs escape");

    $test -> no_match ("[a few words}", reason => "Mismatched delimiters");
    $test -> no_match ("(a few words>", reason => "Mismatched delimiters");
    $test -> no_match ("{a few words{",
                reason => "Using opening delimiter as the closing delimiter");
    $test -> no_match (">a few words>",
                reason => "Using closing delimiter as the opening delimiter");
    $test -> no_match ("[a [few] words]",
                reason => "Unescaped closing delimiter");
}


#
# Use less closing delimiters than opening delimiters
#
{
    my $test = make_test "Less closing delimiters than opening delimiters" =>
                         $RE {delimited} { -delim => "\x{AB}<"}
                                         {-cdelim => "\x{BB}"};
    $test -> match ("\x{AB}a few words\x{BB}",
                   ["\x{AB}a few words\x{BB}", "\x{AB}", "a few words",
                                               "\x{BB}"],
                   test => "Using double angled quotation marks");
    $test -> match ("<a few words\x{BB}",
                   ["<a few words\x{BB}", "<", "a few words", "\x{BB}"],
                   test => "Closing delimiter repeats");
}

done_testing;

__END__