UnicodeEncodeError uses the new Unicode API
authorVictor Stinner <victor.stinner@haypocalc.com>
Sun, 20 Nov 2011 21:50:23 +0000 (22:50 +0100)
committerVictor Stinner <victor.stinner@haypocalc.com>
Sun, 20 Nov 2011 21:50:23 +0000 (22:50 +0100)
The index is a character index, not a index in a Py_UNICODE* string.

Objects/exceptions.c

index 5b5447a1d7d6d8e802933aa5d07de069562df3ca..c8f90b89a09a4be15e6f7d32e24fad9c5f0b5d82 100644 (file)
@@ -1542,8 +1542,8 @@ UnicodeEncodeError_str(PyObject *self)
     if (encoding_str == NULL)
         goto done;
 
-    if (uself->start < PyUnicode_GET_SIZE(uself->object) && uself->end == uself->start+1) {
-        int badchar = (int)PyUnicode_AS_UNICODE(uself->object)[uself->start];
+    if (uself->start < PyUnicode_GET_LENGTH(uself->object) && uself->end == uself->start+1) {
+        Py_UCS4 badchar = PyUnicode_ReadChar(uself->object, uself->start);
         const char *fmt;
         if (badchar <= 0xff)
             fmt = "'%U' codec can't encode character '\\x%02x' in position %zd: %U";
@@ -1554,7 +1554,7 @@ UnicodeEncodeError_str(PyObject *self)
         result = PyUnicode_FromFormat(
             fmt,
             encoding_str,
-            badchar,
+            (int)badchar,
             uself->start,
             reason_str);
     }