From: Martin v. Löwis Date: Sat, 19 Apr 2003 08:37:24 +0000 (+0000) Subject: Patch #681152: Support escaped Unicode characters in classes. Fixes #612074. X-Git-Tag: v2.3c1~1116 X-Git-Url: https://granicus.if.org/sourcecode?a=commitdiff_plain;h=53d93adc46c73e6fdcd6db2d16f0136eadba9839;p=python Patch #681152: Support escaped Unicode characters in classes. Fixes #612074. Will backport to 2.2. --- diff --git a/Lib/sre_parse.py b/Lib/sre_parse.py index fdf6767367..b85aea70a4 100644 --- a/Lib/sre_parse.py +++ b/Lib/sre_parse.py @@ -254,7 +254,7 @@ def _class_escape(source, escape): if len(escape) != 2: raise error, "bogus escape: %s" % repr("\\" + escape) return LITERAL, atoi(escape, 16) & 0xff - elif str(escape[1:2]) in OCTDIGITS: + elif escape[1:2] in OCTDIGITS: # octal escape (up to three digits) while source.next in OCTDIGITS and len(escape) < 5: escape = escape + source.get() diff --git a/Lib/test/test_sre.py b/Lib/test/test_sre.py index e4eb08ddd7..db871620fa 100644 --- a/Lib/test/test_sre.py +++ b/Lib/test/test_sre.py @@ -96,6 +96,10 @@ test(r"""sre.match('.*?cd', 20000*'abc'+'de').end(0)""", 60001) # non-simple '*?' still recurses and hits the recursion limit test(r"""sre.search('(a|b)*?c', 10000*'ab'+'cd').end(0)""", None, RuntimeError) +# bug 612074 +pat=u"["+sre.escape(u"\u2039")+u"]" +test(r"""sre.compile(pat) and 1""", 1, None) + if verbose: print 'Running tests on sre.sub'