changeset: 96844:372aa98eb72e
branch: 2.7
user: Lars Gustäbel
date: Mon Jul 06 09:23:04 2015 +0200
files: Lib/tarfile.py Lib/test/test_tarfile.py Misc/NEWS
description:
Issue #24259: tarfile now raises a ReadError if an archive is truncated inside a data segment.


diff -r 79ed3573b977 -r 372aa98eb72e Lib/tarfile.py
--- a/Lib/tarfile.py Mon Jul 06 00:08:15 2015 -0500
+++ b/Lib/tarfile.py Mon Jul 06 09:23:04 2015 +0200
@@ -744,12 +744,18 @@
         else:
             return self.readsparse(size)
 
+    def __read(self, size):
+        buf = self.fileobj.read(size)
+        if len(buf) != size:
+            raise ReadError("unexpected end of data")
+        return buf
+
     def readnormal(self, size):
         """Read operation for regular files.
         """
         self.fileobj.seek(self.offset + self.position)
         self.position += size
-        return self.fileobj.read(size)
+        return self.__read(size)
 
     def readsparse(self, size):
         """Read operation for sparse files.
@@ -777,7 +783,7 @@
             realpos = section.realpos + self.position - section.offset
             self.fileobj.seek(self.offset + realpos)
             self.position += size
-            return self.fileobj.read(size)
+            return self.__read(size)
         else:
             self.position += size
             return NUL * size
@@ -2336,8 +2342,13 @@
             self.firstmember = None
             return m
 
+        # Advance the file pointer.
+        if self.offset != self.fileobj.tell():
+            self.fileobj.seek(self.offset - 1)
+            if not self.fileobj.read(1):
+                raise ReadError("unexpected end of data")
+
         # Read the next block.
-        self.fileobj.seek(self.offset)
         tarinfo = None
         while True:
             try:
diff -r 79ed3573b977 -r 372aa98eb72e Lib/test/test_tarfile.py
--- a/Lib/test/test_tarfile.py Mon Jul 06 00:08:15 2015 -0500
+++ b/Lib/test/test_tarfile.py Mon Jul 06 09:23:04 2015 +0200
@@ -285,6 +285,30 @@
                     "ignore_zeros=True should have skipped the %r-blocks" % char)
             tar.close()
 
+    def test_premature_end_of_archive(self):
+        for size in (512, 600, 1024, 1200):
+            with tarfile.open(tmpname, "w:") as tar:
+                t = tarfile.TarInfo("foo")
+                t.size = 1024
+                tar.addfile(t, StringIO.StringIO("a" * 1024))
+
+            with open(tmpname, "r+b") as fobj:
+                fobj.truncate(size)
+
+            with tarfile.open(tmpname) as tar:
+                with self.assertRaisesRegexp(tarfile.ReadError, "unexpected end of data"):
+                    for t in tar:
+                        pass
+
+            with tarfile.open(tmpname) as tar:
+                t = tar.next()
+
+                with self.assertRaisesRegexp(tarfile.ReadError, "unexpected end of data"):
+                    tar.extract(t, TEMPDIR)
+
+                with self.assertRaisesRegexp(tarfile.ReadError, "unexpected end of data"):
+                    tar.extractfile(t).read()
+
 
 class MiscReadTest(CommonReadTest):
     taropen = tarfile.TarFile.taropen
diff -r 79ed3573b977 -r 372aa98eb72e Misc/NEWS
--- a/Misc/NEWS Mon Jul 06 00:08:15 2015 -0500
+++ b/Misc/NEWS Mon Jul 06 09:23:04 2015 +0200
@@ -34,6 +34,9 @@
 Library
 -------
 
+- Issue #24259: tarfile now raises a ReadError if an archive is truncated
+  inside a data segment.
+
 - Issue #24514: tarfile now tolerates number fields consisting of only
   whitespace.
 