mirror of
https://github.com/python/cpython.git
synced 2025-08-31 05:58:33 +00:00
Issue #18468: The re.split, re.findall, and re.sub functions and the group()
and groups() methods of match object now always return a string or a bytes object.
This commit is contained in:
parent
355dda8d17
commit
25324971fb
3 changed files with 131 additions and 65 deletions
|
@ -17,8 +17,26 @@ from weakref import proxy
|
|||
|
||||
import unittest
|
||||
|
||||
class S(str):
|
||||
def __getitem__(self, index):
|
||||
return S(super().__getitem__(index))
|
||||
|
||||
class B(bytes):
|
||||
def __getitem__(self, index):
|
||||
return B(super().__getitem__(index))
|
||||
|
||||
class ReTests(unittest.TestCase):
|
||||
|
||||
def assertTypedEqual(self, actual, expect, msg=None):
|
||||
self.assertEqual(actual, expect, msg)
|
||||
def recurse(actual, expect):
|
||||
if isinstance(expect, (tuple, list)):
|
||||
for x, y in zip(actual, expect):
|
||||
recurse(x, y)
|
||||
else:
|
||||
self.assertIs(type(actual), type(expect), msg)
|
||||
recurse(actual, expect)
|
||||
|
||||
def test_keep_buffer(self):
|
||||
# See bug 14212
|
||||
b = bytearray(b'x')
|
||||
|
@ -53,6 +71,13 @@ class ReTests(unittest.TestCase):
|
|||
return str(int_value + 1)
|
||||
|
||||
def test_basic_re_sub(self):
|
||||
self.assertTypedEqual(re.sub('y', 'a', 'xyz'), 'xaz')
|
||||
self.assertTypedEqual(re.sub('y', S('a'), S('xyz')), 'xaz')
|
||||
self.assertTypedEqual(re.sub(b'y', b'a', b'xyz'), b'xaz')
|
||||
self.assertTypedEqual(re.sub(b'y', B(b'a'), B(b'xyz')), b'xaz')
|
||||
self.assertTypedEqual(re.sub(b'y', bytearray(b'a'), bytearray(b'xyz')), b'xaz')
|
||||
self.assertTypedEqual(re.sub(b'y', memoryview(b'a'), memoryview(b'xyz')), b'xaz')
|
||||
|
||||
self.assertEqual(re.sub("(?i)b+", "x", "bbbb BBBB"), 'x x')
|
||||
self.assertEqual(re.sub(r'\d+', self.bump_num, '08.2 -2 23x99y'),
|
||||
'9.3 -3 24x100y')
|
||||
|
@ -210,10 +235,22 @@ class ReTests(unittest.TestCase):
|
|||
self.assertEqual(re.subn("b*", "x", "xyz", 2), ('xxxyz', 2))
|
||||
|
||||
def test_re_split(self):
|
||||
self.assertEqual(re.split(":", ":a:b::c"), ['', 'a', 'b', '', 'c'])
|
||||
self.assertEqual(re.split(":*", ":a:b::c"), ['', 'a', 'b', 'c'])
|
||||
self.assertEqual(re.split("(:*)", ":a:b::c"),
|
||||
['', ':', 'a', ':', 'b', '::', 'c'])
|
||||
for string in ":a:b::c", S(":a:b::c"):
|
||||
self.assertTypedEqual(re.split(":", string),
|
||||
['', 'a', 'b', '', 'c'])
|
||||
self.assertTypedEqual(re.split(":*", string),
|
||||
['', 'a', 'b', 'c'])
|
||||
self.assertTypedEqual(re.split("(:*)", string),
|
||||
['', ':', 'a', ':', 'b', '::', 'c'])
|
||||
for string in (b":a:b::c", B(b":a:b::c"), bytearray(b":a:b::c"),
|
||||
memoryview(b":a:b::c")):
|
||||
self.assertTypedEqual(re.split(b":", string),
|
||||
[b'', b'a', b'b', b'', b'c'])
|
||||
self.assertTypedEqual(re.split(b":*", string),
|
||||
[b'', b'a', b'b', b'c'])
|
||||
self.assertTypedEqual(re.split(b"(:*)", string),
|
||||
[b'', b':', b'a', b':', b'b', b'::', b'c'])
|
||||
|
||||
self.assertEqual(re.split("(?::*)", ":a:b::c"), ['', 'a', 'b', 'c'])
|
||||
self.assertEqual(re.split("(:)*", ":a:b::c"),
|
||||
['', ':', 'a', ':', 'b', ':', 'c'])
|
||||
|
@ -235,22 +272,39 @@ class ReTests(unittest.TestCase):
|
|||
|
||||
def test_re_findall(self):
|
||||
self.assertEqual(re.findall(":+", "abc"), [])
|
||||
self.assertEqual(re.findall(":+", "a:b::c:::d"), [":", "::", ":::"])
|
||||
self.assertEqual(re.findall("(:+)", "a:b::c:::d"), [":", "::", ":::"])
|
||||
self.assertEqual(re.findall("(:)(:*)", "a:b::c:::d"), [(":", ""),
|
||||
(":", ":"),
|
||||
(":", "::")])
|
||||
for string in "a:b::c:::d", S("a:b::c:::d"):
|
||||
self.assertTypedEqual(re.findall(":+", string),
|
||||
[":", "::", ":::"])
|
||||
self.assertTypedEqual(re.findall("(:+)", string),
|
||||
[":", "::", ":::"])
|
||||
self.assertTypedEqual(re.findall("(:)(:*)", string),
|
||||
[(":", ""), (":", ":"), (":", "::")])
|
||||
for string in (b"a:b::c:::d", B(b"a:b::c:::d"), bytearray(b"a:b::c:::d"),
|
||||
memoryview(b"a:b::c:::d")):
|
||||
self.assertTypedEqual(re.findall(b":+", string),
|
||||
[b":", b"::", b":::"])
|
||||
self.assertTypedEqual(re.findall(b"(:+)", string),
|
||||
[b":", b"::", b":::"])
|
||||
self.assertTypedEqual(re.findall(b"(:)(:*)", string),
|
||||
[(b":", b""), (b":", b":"), (b":", b"::")])
|
||||
|
||||
def test_bug_117612(self):
|
||||
self.assertEqual(re.findall(r"(a|(b))", "aba"),
|
||||
[("a", ""),("b", "b"),("a", "")])
|
||||
|
||||
def test_re_match(self):
|
||||
self.assertEqual(re.match('a', 'a').groups(), ())
|
||||
self.assertEqual(re.match('(a)', 'a').groups(), ('a',))
|
||||
self.assertEqual(re.match(r'(a)', 'a').group(0), 'a')
|
||||
self.assertEqual(re.match(r'(a)', 'a').group(1), 'a')
|
||||
self.assertEqual(re.match(r'(a)', 'a').group(1, 1), ('a', 'a'))
|
||||
for string in 'a', S('a'):
|
||||
self.assertEqual(re.match('a', string).groups(), ())
|
||||
self.assertEqual(re.match('(a)', string).groups(), ('a',))
|
||||
self.assertEqual(re.match('(a)', string).group(0), 'a')
|
||||
self.assertEqual(re.match('(a)', string).group(1), 'a')
|
||||
self.assertEqual(re.match('(a)', string).group(1, 1), ('a', 'a'))
|
||||
for string in b'a', B(b'a'), bytearray(b'a'), memoryview(b'a'):
|
||||
self.assertEqual(re.match(b'a', string).groups(), ())
|
||||
self.assertEqual(re.match(b'(a)', string).groups(), (b'a',))
|
||||
self.assertEqual(re.match(b'(a)', string).group(0), b'a')
|
||||
self.assertEqual(re.match(b'(a)', string).group(1), b'a')
|
||||
self.assertEqual(re.match(b'(a)', string).group(1, 1), (b'a', b'a'))
|
||||
|
||||
pat = re.compile('((a)|(b))(c)?')
|
||||
self.assertEqual(pat.match('a').groups(), ('a', 'a', None, None))
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue