Issue #11224: Improved sparse file read support (r85916) introduced a

author Lars Gustäbel <lars@gustaebel.de>

Wed, 23 Feb 2011 11:42:22 +0000 (11:42 +0000)

committer Lars Gustäbel <lars@gustaebel.de>

Wed, 23 Feb 2011 11:42:22 +0000 (11:42 +0000)
author Lars Gustäbel <lars@gustaebel.de>
Wed, 23 Feb 2011 11:42:22 +0000 (11:42 +0000)
committer Lars Gustäbel <lars@gustaebel.de>
Wed, 23 Feb 2011 11:42:22 +0000 (11:42 +0000)
diff --git a/Lib/tarfile.py b/Lib/tarfile.py

index e3747e9c79c3551b06969db5fb88858b594ad2d5..0f9d1dade180239aabdd570db363eb6500bfe830 100644 (file)
--- a/Lib/tarfile.py
+++ b/Lib/tarfile.py
@@ -760,9 +760,8 @@ class _FileInFile(object):
                          self.map_index = 0
              length = min(size, stop - self.position)
              if data:
-                self.fileobj.seek(offset)
-                block = self.fileobj.read(stop - start)
-                buf += block[self.position - start:self.position + length]
+                self.fileobj.seek(offset + (self.position - start))
+                buf += self.fileobj.read(length)
              else:
                  buf += NUL * length
              size -= length
diff --git a/Lib/test/test_tarfile.py b/Lib/test/test_tarfile.py

index 94ef61c0ce701f11a118ef70af259660f3f04901..68e094d5dbc872199b252f6570a923d93792c5f7 100644 (file)
--- a/Lib/test/test_tarfile.py
+++ b/Lib/test/test_tarfile.py
@@ -419,6 +419,22 @@ class StreamReadTest(CommonReadTest):
  
      mode="r|"
  
+    def test_read_through(self):
+        # Issue #11224: A poorly designed _FileInFile.read() method
+        # caused seeking errors with stream tar files.
+        for tarinfo in self.tar:
+            if not tarinfo.isreg():
+                continue
+            fobj = self.tar.extractfile(tarinfo)
+            while True:
+                try:
+                    buf = fobj.read(512)
+                except tarfile.StreamError:
+                    self.fail("simple read-through using TarFile.extractfile() failed")
+                if not buf:
+                    break
+            fobj.close()
+
      def test_fileobj_regular_file(self):
          tarinfo = self.tar.next() # get "regtype" (can't use getmember)
          fobj = self.tar.extractfile(tarinfo)
diff --git a/Misc/NEWS b/Misc/NEWS

index a3a246ceb8190d0f6ce8ef380e64c046f5808074..9dcd309312b2d635f9b1636121f83c7fe0f4d3a0 100644 (file)
--- a/Misc/NEWS
+++ b/Misc/NEWS
@@ -27,6 +27,10 @@ Core and Builtins
  Library
  -------
  
+- Issue #11224: Fixed a regression in tarfile that affected the file-like
+  objects returned by TarFile.extractfile() regarding performance, memory
+  consumption and failures with the stream interface.
+
  - Issue #10924: Adding salt and Modular Crypt Format to crypt library.
    Moved old C wrapper to _crypt, and added a Python wrapper with
    enhanced salt generation and simpler API for password generation.
author	Lars Gustäbel <lars@gustaebel.de>
	Wed, 23 Feb 2011 11:42:22 +0000 (11:42 +0000)
committer	Lars Gustäbel <lars@gustaebel.de>
	Wed, 23 Feb 2011 11:42:22 +0000 (11:42 +0000)
Lib/tarfile.py		patch \| blob \| history
Lib/test/test_tarfile.py		patch \| blob \| history
Misc/NEWS		patch \| blob \| history