summary | refs | log | tree | commit | diff | stats
diff options
context:
space:
mode:
author: Nadeem Vawda <nadeem.vawda@gmail.com>, 2012-11-04 23:38:48 (GMT)
committer: Nadeem Vawda <nadeem.vawda@gmail.com>, 2012-11-04 23:38:48 (GMT)
commit: 519f43844babca8bb23cfc2cd0ba9f5ee0b26034 (patch)
tree: 0f59159b07393ff15c890bbfb1dd9f2a32e6fa6e
parent: ab60de478d70650a7a786d0d4a10ef6dcf1c2880 (diff)
parent: 39079946a257522ecb66cb068c872f5d1fe70ea3 (diff)
download: cpython-519f43844babca8bb23cfc2cd0ba9f5ee0b26034.zip
cpython-519f43844babca8bb23cfc2cd0ba9f5ee0b26034.tar.gz
cpython-519f43844babca8bb23cfc2cd0ba9f5ee0b26034.tar.bz2
Issue #16350: Fix zlib decompressor handling of unused_data with multiple calls to decompress() after EOF.
Patch by Serhiy Storchaka.
-rw-r--r-- Lib/test/test_zlib.py | 14
-rw-r--r-- Misc/NEWS | 4
-rw-r--r-- Modules/zlibmodule.c | 29
3 files changed, 41 insertions, 6 deletions
diff --git a/Lib/test/test_zlib.py b/Lib/test/test_zlib.py
index d637c2d..b6a60f4 100644
--- a/Lib/test/test_zlib.py
+++ b/Lib/test/test_zlib.py
@@ -487,6 +487,20 @@ class CompressObjectTestCase(BaseCompressTestCase, unittest.TestCase):
dco.flush()
self.assertFalse(dco.eof)
+ def test_decompress_unused_data(self):
+ # Repeated calls to decompress() after EOF should accumulate data in
+ # dco.unused_data, instead of just storing the arg to the last call.
+ x = zlib.compress(HAMLET_SCENE) + HAMLET_SCENE
+ for step in 1, 2, 100:
+ dco = zlib.decompressobj()
+ data = b''.join(dco.decompress(x[i : i + step])
+ for i in range(0, len(x), step))
+ data += dco.flush()
+
+ self.assertTrue(dco.eof)
+ self.assertEqual(data, HAMLET_SCENE)
+ self.assertEqual(dco.unused_data, HAMLET_SCENE)
+
if hasattr(zlib.compressobj(), "copy"):
def test_compresscopy(self):
# Test copying a compression object
diff --git a/Misc/NEWS b/Misc/NEWS
index 73d6e37..63baa0d 100644
--- a/Misc/NEWS
+++ b/Misc/NEWS
@@ -77,6 +77,10 @@ Core and Builtins
Library
-------
+- Issue #16350: zlib.Decompress.decompress() now accumulates data from
+ successive calls after EOF in unused_data, instead of only saving the argument
+ to the last call. Patch by Serhiy Storchaka.
+
- Issue #12759: sre_parse now raises a proper error when the name of the group
is missing. Initial patch by Serhiy Storchaka.
diff --git a/Modules/zlibmodule.c b/Modules/zlibmodule.c
index 6519194..888ef53 100644
--- a/Modules/zlibmodule.c
+++ b/Modules/zlibmodule.c
@@ -693,12 +693,29 @@ PyZlib_objdecompress(compobject *self, PyObject *args)
preserved.
*/
if (err == Z_STREAM_END) {
- Py_XDECREF(self->unused_data); /* Free original empty string */
- self->unused_data = PyBytes_FromStringAndSize(
- (char *)self->zst.next_in, self->zst.avail_in);
- if (self->unused_data == NULL) {
- Py_DECREF(RetVal);
- goto error;
+ if (self->zst.avail_in > 0) {
+ /* Append the leftover data to the existing value of unused_data. */
+ Py_ssize_t old_size = PyBytes_GET_SIZE(self->unused_data);
+ Py_ssize_t new_size = old_size + self->zst.avail_in;
+ PyObject *new_data;
+ if (new_size <= old_size) { /* Check for overflow. */
+ PyErr_NoMemory();
+ Py_DECREF(RetVal);
+ RetVal = NULL;
+ goto error;
+ }
+ new_data = PyBytes_FromStringAndSize(NULL, new_size);
+ if (new_data == NULL) {
+ Py_DECREF(RetVal);
+ RetVal = NULL;
+ goto error;
+ }
+ Py_MEMCPY(PyBytes_AS_STRING(new_data),
+ PyBytes_AS_STRING(self->unused_data), old_size);
+ Py_MEMCPY(PyBytes_AS_STRING(new_data) + old_size,
+ self->zst.next_in, self->zst.avail_in);
+ Py_DECREF(self->unused_data);
+ self->unused_data = new_data;
}
self->eof = 1;
/* We will only get Z_BUF_ERROR if the output buffer was full