1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102
|
"""
Tests for pygments.regexopt
~~~~~~~~~~~~~~~~~~~~~~~~~~~
:copyright: Copyright 2006-2022 by the Pygments team, see AUTHORS.
:license: BSD, see LICENSE for details.
"""
import re
import random
from itertools import combinations_with_replacement
from pygments.regexopt import regex_opt
ALPHABET = ['a', 'b', 'c', 'd', 'e']
N_TRIES = 15
def generate_keywordlist(length):
return [''.join(p) for p in
combinations_with_replacement(ALPHABET, length)]
def test_randomly():
# generate a list of all possible keywords of a certain length using
# a restricted alphabet, then choose some to match and make sure only
# those do
for n in range(3, N_TRIES):
kwlist = generate_keywordlist(n)
to_match = random.sample(kwlist,
random.randint(1, len(kwlist) - 1))
no_match = set(kwlist) - set(to_match)
rex = re.compile(regex_opt(to_match))
assert rex.groups == 1
for w in to_match:
assert rex.match(w)
for w in no_match:
assert not rex.match(w)
def test_prefix():
opt = regex_opt(('a', 'b'), prefix=r':{1,2}')
print(opt)
rex = re.compile(opt)
assert not rex.match('a')
assert rex.match('::a')
assert not rex.match(':::') # fullmatch
def test_suffix():
opt = regex_opt(('a', 'b'), suffix=r':{1,2}')
print(opt)
rex = re.compile(opt)
assert not rex.match('a')
assert rex.match('a::')
assert not rex.match(':::') # fullmatch
def test_suffix_opt():
# test that detected suffixes remain sorted.
opt = regex_opt(('afoo', 'abfoo'))
print(opt)
rex = re.compile(opt)
m = rex.match('abfoo')
assert m.end() == 5
def test_different_length_grouping():
opt = regex_opt(('a', 'xyz'))
print(opt)
rex = re.compile(opt)
assert rex.match('a')
assert rex.match('xyz')
assert not rex.match('b')
assert rex.groups == 1
def test_same_length_grouping():
opt = regex_opt(('a', 'b'))
print(opt)
rex = re.compile(opt)
assert rex.match('a')
assert rex.match('b')
assert not rex.match('x')
assert rex.groups == 1
groups = rex.match('a').groups()
assert groups == ('a',)
def test_same_length_suffix_grouping():
opt = regex_opt(('a', 'b'), suffix='(m)')
print(opt)
rex = re.compile(opt)
assert rex.match('am')
assert rex.match('bm')
assert not rex.match('xm')
assert not rex.match('ax')
assert rex.groups == 2
groups = rex.match('am').groups()
assert groups == ('a', 'm')
|