From: Guido van Rossum
Date: Tue, 11 Apr 2000 15:39:02 +0000 (+0000)
Subject: Marc-Andre Lemburg:
X-Git-Tag: v1.6a2~5
X-Git-Url: https://granicus.if.org/sourcecode?a=commitdiff_plain;h=dc742b318480617cdb84af400c4d9dccae3a33d5;p=python

Marc-Andre Lemburg:
Added a few missing whitespace Unicode char mappings.

Thanks to Brian Hooper.
---

diff --git a/Objects/unicodectype.c b/Objects/unicodectype.c
index 946be22e6e..da2b8d5b18 100644
--- a/Objects/unicodectype.c
+++ b/Objects/unicodectype.c
@@ -633,8 +633,8 @@ int _PyUnicode_IsNumeric(register const Py_UNICODE ch)
 
 #ifndef WANT_WCTYPE_FUNCTIONS
 
-/* Returns 1 for Unicode characters having the type 'WS', 'B' or 'S',
-   0 otherwise. */
+/* Returns 1 for Unicode characters having the bidirectional type
+   'WS', 'B' or 'S' or the category 'Zs', 0 otherwise. */
 
 int _PyUnicode_IsWhitespace(register const Py_UNICODE ch)
 {
@@ -649,6 +649,8 @@ int _PyUnicode_IsWhitespace(register const Py_UNICODE ch)
     case 0x001E: /* RECORD SEPARATOR */
     case 0x001F: /* UNIT SEPARATOR */
     case 0x0020: /* SPACE */
+    case 0x0085: /* NEXT LINE */
+    case 0x00A0: /* NO-BREAK SPACE */
     case 0x1680: /* OGHAM SPACE MARK */
     case 0x2000: /* EN QUAD */
     case 0x2001: /* EM QUAD */
@@ -661,7 +663,9 @@ int _PyUnicode_IsWhitespace(register const Py_UNICODE ch)
     case 0x2008: /* PUNCTUATION SPACE */
     case 0x2009: /* THIN SPACE */
     case 0x200A: /* HAIR SPACE */
+    case 0x200B: /* ZERO WIDTH SPACE */
     case 0x2028: /* LINE SEPARATOR */
+    case 0x2029: /* PARAGRAPH SEPARATOR */
     case 0x202F: /* NARROW NO-BREAK SPACE */
     case 0x3000: /* IDEOGRAPHIC SPACE */
         return 1;