]> granicus.if.org Git - python/commitdiff
Issue #1521: on 64bit platforms, str.decode fails on very long strings.
author Amaury Forgeot d'Arc <amauryfa@gmail.com>
Fri, 30 Nov 2007 20:51:40 +0000 (20:51 +0000)
committer Amaury Forgeot d'Arc <amauryfa@gmail.com>
Fri, 30 Nov 2007 20:51:40 +0000 (20:51 +0000)
The t# and w# formats were not correctly handled.

Will backport.

Lib/test/test_bigmem.py
Misc/NEWS
Python/getargs.c

index 6d6c37ceea6ba56faba0e10d5f4774bab906378f..d4fc6eb478510c495cc21bf181f6eaf717bb83f6 100644 (file)
@@ -65,13 +65,15 @@ class StrTest(unittest.TestCase):
         self.assertEquals(s.count('i'), 1)
         self.assertEquals(s.count('j'), 0)
 
-    @bigmemtest(minsize=0, memuse=1)
+    @bigmemtest(minsize=_2G + 2, memuse=3)
     def test_decode(self, size):
-        pass
+        s = '.' * size
+        self.assertEquals(len(s.decode('utf-8')), size)
 
-    @bigmemtest(minsize=0, memuse=1)
+    @bigmemtest(minsize=_2G + 2, memuse=3)
     def test_encode(self, size):
-        pass
+        s = u'.' * size
+        self.assertEquals(len(s.encode('utf-8')), size)
 
     @bigmemtest(minsize=_2G, memuse=2)
     def test_endswith(self, size):
index 05b7491476bd5bd1101957e1dbee95a728f79f6b..4fa85c683623b3c0e727c4f8f14cc2bfe2d645c9 100644 (file)
--- a/Misc/NEWS
+++ b/Misc/NEWS
@@ -12,6 +12,11 @@ What's New in Python 2.6 alpha 1?
 Core and builtins
 -----------------
 
+- Issue #1521: On 64bit platforms, using PyArg_ParseTuple with the t# or w#
+  format code incorrectly truncated the length to an int, even when
+  PY_SSIZE_T_CLEAN is set.  The str.decode method used to return incorrect
+  results with huge strings.
+
 - Issue #1402: Fix a crash on exit, when another thread is still running, and
   if the deallocation of its frames somehow calls the PyGILState_Ensure() /
   PyGILState_Release() functions.
index a848116d7477670546620a849bed427cbc3d68ab..2cae516ef53284f7dd192bfc5a282e89ddce3fd5 100644 (file)
@@ -894,7 +894,8 @@ convertsimple(PyObject *arg, const char **p_format, va_list *p_va, int flags,
                char **buffer;
                const char *encoding;
                PyObject *s;
-               int size, recode_strings;
+               Py_ssize_t size;
+               int recode_strings;
 
                /* Get 'e' parameter: the encoding name */
                encoding = (const char *)va_arg(*p_va, const char *);
@@ -1144,7 +1145,7 @@ convertsimple(PyObject *arg, const char **p_format, va_list *p_va, int flags,
        case 'w': { /* memory buffer, read-write access */
                void **p = va_arg(*p_va, void **);
                PyBufferProcs *pb = arg->ob_type->tp_as_buffer;
-               int count;
+               Py_ssize_t count;
                        
                if (pb == NULL || 
                    pb->bf_getwritebuffer == NULL ||
@@ -1166,7 +1167,7 @@ convertsimple(PyObject *arg, const char **p_format, va_list *p_va, int flags,
        case 't': { /* 8-bit character buffer, read-only access */
                char **p = va_arg(*p_va, char **);
                PyBufferProcs *pb = arg->ob_type->tp_as_buffer;
-               int count;
+               Py_ssize_t count;
                
                if (*format++ != '#')
                        return converterr(