From: Antoine Pitrou Date: Sun, 12 Sep 2010 14:56:27 +0000 (+0000) Subject: Merged revisions 84737 via svnmerge from X-Git-Tag: v2.7.1rc1~304 X-Git-Url: https://granicus.if.org/sourcecode?a=commitdiff_plain;h=e4195e8825a195e54967a4f7b02d83b11637ec1d;p=python Merged revisions 84737 via svnmerge from svn+ssh://pythondev@svn.python.org/python/branches/py3k ........ r84737 | antoine.pitrou | 2010-09-12 16:51:20 +0200 (dim., 12 sept. 2010) | 4 lines Issue #9837: The read() method of ZipExtFile objects (as returned by ZipFile.open()) could return more bytes than requested. ........ --- diff --git a/Lib/test/test_zipfile.py b/Lib/test/test_zipfile.py index 8d87ac5c93..aee499ca73 100644 --- a/Lib/test/test_zipfile.py +++ b/Lib/test/test_zipfile.py @@ -929,6 +929,26 @@ class OtherTests(unittest.TestCase): def test_read_with_bad_crc_deflated(self): self.check_read_with_bad_crc(zipfile.ZIP_DEFLATED) + def check_read_return_size(self, compression): + # Issue #9837: ZipExtFile.read() shouldn't return more bytes + # than requested. + for test_size in (1, 4095, 4096, 4097, 16384): + file_size = test_size + 1 + junk = b''.join(struct.pack('B', randint(0, 255)) + for x in range(file_size)) + with zipfile.ZipFile(io.BytesIO(), "w", compression) as zipf: + zipf.writestr('foo', junk) + with zipf.open('foo', 'r') as fp: + buf = fp.read(test_size) + self.assertEqual(len(buf), test_size) + + def test_read_return_size_stored(self): + self.check_read_return_size(zipfile.ZIP_STORED) + + @skipUnless(zlib, "requires zlib") + def test_read_return_size_deflated(self): + self.check_read_return_size(zipfile.ZIP_DEFLATED) + def tearDown(self): unlink(TESTFN) unlink(TESTFN2) diff --git a/Lib/zipfile.py b/Lib/zipfile.py index ef19a28513..496cf83fda 100644 --- a/Lib/zipfile.py +++ b/Lib/zipfile.py @@ -565,17 +565,20 @@ class ZipExtFile(io.BufferedIOBase): """Read and return up to n bytes. If the argument is omitted, None, or negative, data is read and returned until EOF is reached.. """ - buf = '' - while n < 0 or n is None or n > len(buf): - data = self.read1(n) + if n is None: + n = -1 + while True: + if n < 0: + data = self.read1(n) + elif n > len(buf): + data = self.read1(n - len(buf)) + else: + return buf if len(data) == 0: return buf - buf += data - return buf - def _update_crc(self, newdata, eof): # Update the CRC using the given data. if self._expected_crc is None: diff --git a/Misc/NEWS b/Misc/NEWS index a31d95aee8..dff7f79f7d 100644 --- a/Misc/NEWS +++ b/Misc/NEWS @@ -43,6 +43,9 @@ Core and Builtins Library ------- +- Issue #9837: The read() method of ZipExtFile objects (as returned by + ZipFile.open()) could return more bytes than requested. + - Issue #9825: removed __del__ from the definition of collections.OrderedDict. This prevents user-created self-referencing ordered dictionaries from becoming permanently uncollectable GC garbage. The downside is that