granicus.if.org Git - python/commitdiff
Fix and test for bug #764548:
author: Just van Rossum <just@letterror.com>
Wed, 2 Jul 2003 20:03:04 +0000 (20:03 +0000)
committer: Just van Rossum <just@letterror.com>
Wed, 2 Jul 2003 20:03:04 +0000 (20:03 +0000)
Use isinstance() instead of comparing types directly, to enable
subclasses of str and unicode to be used as patterns.
Blessed by /F.

Lib/sre.py
Lib/sre_compile.py
Lib/test/test_re.py

index 7e107a68fd0fe4344a567338fe0dbe09273390b6..7910c83eac34a391bad061cc13ae15bd5082bff4 100644 (file)
@@ -219,9 +219,9 @@ def _compile(*key):
     if p is not None:
         return p
     pattern, flags = key
-    if type(pattern) is _pattern_type:
+    if isinstance(pattern, _pattern_type):
         return pattern
-    if type(pattern) not in sre_compile.STRING_TYPES:
+    if not isinstance(pattern, sre_compile.STRING_TYPES):
         raise TypeError, "first argument must be string or compiled pattern"
     try:
         p = sre_compile.compile(pattern, flags)
index 1d59d7e0976eb3f22e10aacec398204f608d6156..96f337a7794faa4d2a5e05093c40371bc47880a8 100644 (file)
@@ -428,12 +428,12 @@ def _compile_info(code, pattern, flags):
         _compile_charset(charset, flags, code)
     code[skip] = len(code) - skip
 
-STRING_TYPES = [type("")]
-
 try:
-    STRING_TYPES.append(type(unicode("")))
+    unicode
 except NameError:
-    pass
+    STRING_TYPES = type("")
+else:
+    STRING_TYPES = (type(""), type(unicode("")))
 
 def _code(p, flags):
 
@@ -453,7 +453,7 @@ def _code(p, flags):
 def compile(p, flags=0):
     # internal: convert pattern list to internal format
 
-    if type(p) in STRING_TYPES:
+    if isinstance(p, STRING_TYPES):
         import sre_parse
         pattern = p
         p = sre_parse.parse(p, flags)
index 50d7ed4339b3e655ce2662a9eb1562671ff687f8..f7248062a2abc3c1b4355687c2e16191aa358970 100644 (file)
@@ -474,6 +474,16 @@ class ReTests(unittest.TestCase):
         self.assertEqual(re.match('(a)((?!(b)*))*', 'abb').groups(),
                          ('a', None, None))
 
+    def test_bug_764548(self):
+        # bug 764548, re.compile() barfs on str/unicode subclasses
+        try:
+            unicode
+        except NameError:
+            return  # no problem if we have no unicode
+        class my_unicode(unicode): pass
+        pat = re.compile(my_unicode("abc"))
+        self.assertEqual(pat.match("xyz"), None)
+
     def test_finditer(self):
         iter = re.finditer(r":+", "a:b::c:::d")
         self.assertEqual([item.group(0) for item in iter],