extmod/modure: Convert byte offsets to unicode indices when necessary.
And add a test. Fixes issue #9202. Signed-off-by: Jeff Epler <jepler@gmail.com>
This commit is contained in:
committed by
Damien George
parent
719dbbf563
commit
e90b85cc98
32
tests/unicode/unicode_ure.py
Normal file
32
tests/unicode/unicode_ure.py
Normal file
@@ -0,0 +1,32 @@
|
||||
# test match.span() for unicode strings
|
||||
|
||||
try:
|
||||
import ure as re
|
||||
except ImportError:
|
||||
try:
|
||||
import re
|
||||
except ImportError:
|
||||
print("SKIP")
|
||||
raise SystemExit
|
||||
|
||||
try:
|
||||
m = re.match(".", "a")
|
||||
m.span
|
||||
except AttributeError:
|
||||
print("SKIP")
|
||||
raise SystemExit
|
||||
|
||||
|
||||
def print_spans(match):
|
||||
print("----")
|
||||
try:
|
||||
i = 0
|
||||
while True:
|
||||
print(match.span(i), match.start(i), match.end(i))
|
||||
i += 1
|
||||
except IndexError:
|
||||
pass
|
||||
|
||||
|
||||
m = re.match(r"([0-9]*)(([a-z]*)([0-9]*))", "1234\u2764567")
|
||||
print_spans(m)
|
||||
Reference in New Issue
Block a user