mirror of
https://github.com/python/cpython.git
synced 2025-10-24 07:26:11 +00:00
1199 lines
36 KiB
C
1199 lines
36 KiB
C
/* zlibmodule.c -- gzip-compatible data compression */
|
|
/* See http://www.gzip.org/zlib/ */
|
|
|
|
/* Windows users: read Python's PCbuild\readme.txt */
|
|
|
|
|
|
#include "Python.h"
|
|
#include "structmember.h"
|
|
#include "zlib.h"
|
|
|
|
#ifdef WITH_THREAD
|
|
#include "pythread.h"
|
|
#define ENTER_ZLIB(obj) \
|
|
Py_BEGIN_ALLOW_THREADS; \
|
|
PyThread_acquire_lock((obj)->lock, 1); \
|
|
Py_END_ALLOW_THREADS;
|
|
#define LEAVE_ZLIB(obj) PyThread_release_lock((obj)->lock);
|
|
#else
|
|
#define ENTER_ZLIB(obj)
|
|
#define LEAVE_ZLIB(obj)
|
|
#endif
|
|
|
|
/* The following parameters are copied from zutil.h, version 0.95 */
|
|
#define DEFLATED 8
|
|
#if MAX_MEM_LEVEL >= 8
|
|
# define DEF_MEM_LEVEL 8
|
|
#else
|
|
# define DEF_MEM_LEVEL MAX_MEM_LEVEL
|
|
#endif
|
|
#define DEF_WBITS MAX_WBITS
|
|
|
|
/* The output buffer will be increased in chunks of DEFAULTALLOC bytes. */
|
|
#define DEFAULTALLOC (16*1024)
|
|
|
|
static PyTypeObject Comptype;
|
|
static PyTypeObject Decomptype;
|
|
|
|
static PyObject *ZlibError;
|
|
|
|
typedef struct
|
|
{
|
|
PyObject_HEAD
|
|
z_stream zst;
|
|
PyObject *unused_data;
|
|
PyObject *unconsumed_tail;
|
|
int is_initialised;
|
|
#ifdef WITH_THREAD
|
|
PyThread_type_lock lock;
|
|
#endif
|
|
} compobject;
|
|
|
|
static void
|
|
zlib_error(z_stream zst, int err, char *msg)
|
|
{
|
|
const char *zmsg = Z_NULL;
|
|
/* In case of a version mismatch, zst.msg won't be initialized.
|
|
Check for this case first, before looking at zst.msg. */
|
|
if (err == Z_VERSION_ERROR)
|
|
zmsg = "library version mismatch";
|
|
if (zmsg == Z_NULL)
|
|
zmsg = zst.msg;
|
|
if (zmsg == Z_NULL) {
|
|
switch (err) {
|
|
case Z_BUF_ERROR:
|
|
zmsg = "incomplete or truncated stream";
|
|
break;
|
|
case Z_STREAM_ERROR:
|
|
zmsg = "inconsistent stream state";
|
|
break;
|
|
case Z_DATA_ERROR:
|
|
zmsg = "invalid input data";
|
|
break;
|
|
}
|
|
}
|
|
if (zmsg == Z_NULL)
|
|
PyErr_Format(ZlibError, "Error %d %s", err, msg);
|
|
else
|
|
PyErr_Format(ZlibError, "Error %d %s: %.200s", err, msg, zmsg);
|
|
}
|
|
|
|
PyDoc_STRVAR(compressobj__doc__,
|
|
"compressobj([level]) -- Return a compressor object.\n"
|
|
"\n"
|
|
"Optional arg level is the compression level, in 0-9.");
|
|
|
|
PyDoc_STRVAR(decompressobj__doc__,
|
|
"decompressobj([wbits]) -- Return a decompressor object.\n"
|
|
"\n"
|
|
"Optional arg wbits is the window buffer size.");
|
|
|
|
static compobject *
|
|
newcompobject(PyTypeObject *type)
|
|
{
|
|
compobject *self;
|
|
self = PyObject_New(compobject, type);
|
|
if (self == NULL)
|
|
return NULL;
|
|
self->is_initialised = 0;
|
|
self->unused_data = PyBytes_FromStringAndSize("", 0);
|
|
if (self->unused_data == NULL) {
|
|
Py_DECREF(self);
|
|
return NULL;
|
|
}
|
|
self->unconsumed_tail = PyBytes_FromStringAndSize("", 0);
|
|
if (self->unconsumed_tail == NULL) {
|
|
Py_DECREF(self);
|
|
return NULL;
|
|
}
|
|
#ifdef WITH_THREAD
|
|
self->lock = PyThread_allocate_lock();
|
|
#endif
|
|
return self;
|
|
}
|
|
|
|
PyDoc_STRVAR(compress__doc__,
|
|
"compress(string[, level]) -- Returned compressed string.\n"
|
|
"\n"
|
|
"Optional arg level is the compression level, in 0-9.");
|
|
|
|
static PyObject *
|
|
PyZlib_compress(PyObject *self, PyObject *args)
|
|
{
|
|
PyObject *ReturnVal = NULL;
|
|
Py_buffer pinput;
|
|
Byte *input, *output = NULL;
|
|
unsigned int length;
|
|
int level=Z_DEFAULT_COMPRESSION, err;
|
|
z_stream zst;
|
|
|
|
/* require Python string object, optional 'level' arg */
|
|
if (!PyArg_ParseTuple(args, "y*|i:compress", &pinput, &level))
|
|
return NULL;
|
|
|
|
if (pinput.len > UINT_MAX) {
|
|
PyErr_SetString(PyExc_OverflowError,
|
|
"Size does not fit in an unsigned int");
|
|
goto error;
|
|
}
|
|
input = pinput.buf;
|
|
length = pinput.len;
|
|
|
|
zst.avail_out = length + length/1000 + 12 + 1;
|
|
|
|
output = (Byte*)malloc(zst.avail_out);
|
|
if (output == NULL) {
|
|
PyErr_SetString(PyExc_MemoryError,
|
|
"Can't allocate memory to compress data");
|
|
goto error;
|
|
}
|
|
|
|
/* Past the point of no return. From here on out, we need to make sure
|
|
we clean up mallocs & INCREFs. */
|
|
|
|
zst.zalloc = (alloc_func)NULL;
|
|
zst.zfree = (free_func)Z_NULL;
|
|
zst.next_out = (Byte *)output;
|
|
zst.next_in = (Byte *)input;
|
|
zst.avail_in = length;
|
|
err = deflateInit(&zst, level);
|
|
|
|
switch(err) {
|
|
case(Z_OK):
|
|
break;
|
|
case(Z_MEM_ERROR):
|
|
PyErr_SetString(PyExc_MemoryError,
|
|
"Out of memory while compressing data");
|
|
goto error;
|
|
case(Z_STREAM_ERROR):
|
|
PyErr_SetString(ZlibError,
|
|
"Bad compression level");
|
|
goto error;
|
|
default:
|
|
deflateEnd(&zst);
|
|
zlib_error(zst, err, "while compressing data");
|
|
goto error;
|
|
}
|
|
|
|
Py_BEGIN_ALLOW_THREADS;
|
|
err = deflate(&zst, Z_FINISH);
|
|
Py_END_ALLOW_THREADS;
|
|
|
|
if (err != Z_STREAM_END) {
|
|
zlib_error(zst, err, "while compressing data");
|
|
deflateEnd(&zst);
|
|
goto error;
|
|
}
|
|
|
|
err=deflateEnd(&zst);
|
|
if (err == Z_OK)
|
|
ReturnVal = PyBytes_FromStringAndSize((char *)output,
|
|
zst.total_out);
|
|
else
|
|
zlib_error(zst, err, "while finishing compression");
|
|
|
|
error:
|
|
PyBuffer_Release(&pinput);
|
|
free(output);
|
|
|
|
return ReturnVal;
|
|
}
|
|
|
|
PyDoc_STRVAR(decompress__doc__,
|
|
"decompress(string[, wbits[, bufsize]]) -- Return decompressed string.\n"
|
|
"\n"
|
|
"Optional arg wbits is the window buffer size. Optional arg bufsize is\n"
|
|
"the initial output buffer size.");
|
|
|
|
static PyObject *
|
|
PyZlib_decompress(PyObject *self, PyObject *args)
|
|
{
|
|
PyObject *result_str = NULL;
|
|
Py_buffer pinput;
|
|
Byte *input;
|
|
unsigned int length;
|
|
int err;
|
|
int wsize=DEF_WBITS;
|
|
Py_ssize_t r_strlen=DEFAULTALLOC;
|
|
z_stream zst;
|
|
|
|
if (!PyArg_ParseTuple(args, "y*|in:decompress",
|
|
&pinput, &wsize, &r_strlen))
|
|
return NULL;
|
|
|
|
if (pinput.len > UINT_MAX) {
|
|
PyErr_SetString(PyExc_OverflowError,
|
|
"Size does not fit in an unsigned int");
|
|
goto error;
|
|
}
|
|
input = pinput.buf;
|
|
length = pinput.len;
|
|
|
|
if (r_strlen <= 0)
|
|
r_strlen = 1;
|
|
|
|
zst.avail_in = length;
|
|
zst.avail_out = r_strlen;
|
|
|
|
if (!(result_str = PyBytes_FromStringAndSize(NULL, r_strlen)))
|
|
goto error;
|
|
|
|
zst.zalloc = (alloc_func)NULL;
|
|
zst.zfree = (free_func)Z_NULL;
|
|
zst.next_out = (Byte *)PyBytes_AS_STRING(result_str);
|
|
zst.next_in = (Byte *)input;
|
|
err = inflateInit2(&zst, wsize);
|
|
|
|
switch(err) {
|
|
case(Z_OK):
|
|
break;
|
|
case(Z_MEM_ERROR):
|
|
PyErr_SetString(PyExc_MemoryError,
|
|
"Out of memory while decompressing data");
|
|
goto error;
|
|
default:
|
|
inflateEnd(&zst);
|
|
zlib_error(zst, err, "while preparing to decompress data");
|
|
goto error;
|
|
}
|
|
|
|
do {
|
|
Py_BEGIN_ALLOW_THREADS
|
|
err=inflate(&zst, Z_FINISH);
|
|
Py_END_ALLOW_THREADS
|
|
|
|
switch(err) {
|
|
case(Z_STREAM_END):
|
|
break;
|
|
case(Z_BUF_ERROR):
|
|
/*
|
|
* If there is at least 1 byte of room according to zst.avail_out
|
|
* and we get this error, assume that it means zlib cannot
|
|
* process the inflate call() due to an error in the data.
|
|
*/
|
|
if (zst.avail_out > 0) {
|
|
zlib_error(zst, err, "while decompressing data");
|
|
inflateEnd(&zst);
|
|
goto error;
|
|
}
|
|
/* fall through */
|
|
case(Z_OK):
|
|
/* need more memory */
|
|
if (_PyBytes_Resize(&result_str, r_strlen << 1) < 0) {
|
|
inflateEnd(&zst);
|
|
goto error;
|
|
}
|
|
zst.next_out =
|
|
(unsigned char *)PyBytes_AS_STRING(result_str) + r_strlen;
|
|
zst.avail_out = r_strlen;
|
|
r_strlen = r_strlen << 1;
|
|
break;
|
|
default:
|
|
inflateEnd(&zst);
|
|
zlib_error(zst, err, "while decompressing data");
|
|
goto error;
|
|
}
|
|
} while (err != Z_STREAM_END);
|
|
|
|
err = inflateEnd(&zst);
|
|
if (err != Z_OK) {
|
|
zlib_error(zst, err, "while finishing data decompression");
|
|
goto error;
|
|
}
|
|
|
|
if (_PyBytes_Resize(&result_str, zst.total_out) < 0)
|
|
goto error;
|
|
|
|
PyBuffer_Release(&pinput);
|
|
return result_str;
|
|
|
|
error:
|
|
PyBuffer_Release(&pinput);
|
|
Py_XDECREF(result_str);
|
|
return NULL;
|
|
}
|
|
|
|
static PyObject *
|
|
PyZlib_compressobj(PyObject *selfptr, PyObject *args)
|
|
{
|
|
compobject *self;
|
|
int level=Z_DEFAULT_COMPRESSION, method=DEFLATED;
|
|
int wbits=MAX_WBITS, memLevel=DEF_MEM_LEVEL, strategy=0, err;
|
|
|
|
if (!PyArg_ParseTuple(args, "|iiiii:compressobj", &level, &method, &wbits,
|
|
&memLevel, &strategy))
|
|
return NULL;
|
|
|
|
self = newcompobject(&Comptype);
|
|
if (self==NULL)
|
|
return(NULL);
|
|
self->zst.zalloc = (alloc_func)NULL;
|
|
self->zst.zfree = (free_func)Z_NULL;
|
|
self->zst.next_in = NULL;
|
|
self->zst.avail_in = 0;
|
|
err = deflateInit2(&self->zst, level, method, wbits, memLevel, strategy);
|
|
switch(err) {
|
|
case (Z_OK):
|
|
self->is_initialised = 1;
|
|
return (PyObject*)self;
|
|
case (Z_MEM_ERROR):
|
|
Py_DECREF(self);
|
|
PyErr_SetString(PyExc_MemoryError,
|
|
"Can't allocate memory for compression object");
|
|
return NULL;
|
|
case(Z_STREAM_ERROR):
|
|
Py_DECREF(self);
|
|
PyErr_SetString(PyExc_ValueError, "Invalid initialization option");
|
|
return NULL;
|
|
default:
|
|
zlib_error(self->zst, err, "while creating compression object");
|
|
Py_DECREF(self);
|
|
return NULL;
|
|
}
|
|
}
|
|
|
|
static PyObject *
|
|
PyZlib_decompressobj(PyObject *selfptr, PyObject *args)
|
|
{
|
|
int wbits=DEF_WBITS, err;
|
|
compobject *self;
|
|
if (!PyArg_ParseTuple(args, "|i:decompressobj", &wbits))
|
|
return NULL;
|
|
|
|
self = newcompobject(&Decomptype);
|
|
if (self == NULL)
|
|
return(NULL);
|
|
self->zst.zalloc = (alloc_func)NULL;
|
|
self->zst.zfree = (free_func)Z_NULL;
|
|
self->zst.next_in = NULL;
|
|
self->zst.avail_in = 0;
|
|
err = inflateInit2(&self->zst, wbits);
|
|
switch(err) {
|
|
case (Z_OK):
|
|
self->is_initialised = 1;
|
|
return (PyObject*)self;
|
|
case(Z_STREAM_ERROR):
|
|
Py_DECREF(self);
|
|
PyErr_SetString(PyExc_ValueError, "Invalid initialization option");
|
|
return NULL;
|
|
case (Z_MEM_ERROR):
|
|
Py_DECREF(self);
|
|
PyErr_SetString(PyExc_MemoryError,
|
|
"Can't allocate memory for decompression object");
|
|
return NULL;
|
|
default:
|
|
zlib_error(self->zst, err, "while creating decompression object");
|
|
Py_DECREF(self);
|
|
return NULL;
|
|
}
|
|
}
|
|
|
|
static void
|
|
Dealloc(compobject *self)
|
|
{
|
|
#ifdef WITH_THREAD
|
|
PyThread_free_lock(self->lock);
|
|
#endif
|
|
Py_XDECREF(self->unused_data);
|
|
Py_XDECREF(self->unconsumed_tail);
|
|
PyObject_Del(self);
|
|
}
|
|
|
|
static void
|
|
Comp_dealloc(compobject *self)
|
|
{
|
|
if (self->is_initialised)
|
|
deflateEnd(&self->zst);
|
|
Dealloc(self);
|
|
}
|
|
|
|
static void
|
|
Decomp_dealloc(compobject *self)
|
|
{
|
|
if (self->is_initialised)
|
|
inflateEnd(&self->zst);
|
|
Dealloc(self);
|
|
}
|
|
|
|
PyDoc_STRVAR(comp_compress__doc__,
|
|
"compress(data) -- Return a string containing data compressed.\n"
|
|
"\n"
|
|
"After calling this function, some of the input data may still\n"
|
|
"be stored in internal buffers for later processing.\n"
|
|
"Call the flush() method to clear these buffers.");
|
|
|
|
|
|
static PyObject *
|
|
PyZlib_objcompress(compobject *self, PyObject *args)
|
|
{
|
|
int err;
|
|
unsigned int inplen;
|
|
Py_ssize_t length = DEFAULTALLOC;
|
|
PyObject *RetVal = NULL;
|
|
Py_buffer pinput;
|
|
Byte *input;
|
|
unsigned long start_total_out;
|
|
|
|
if (!PyArg_ParseTuple(args, "y*:compress", &pinput))
|
|
return NULL;
|
|
if (pinput.len > UINT_MAX) {
|
|
PyErr_SetString(PyExc_OverflowError,
|
|
"Size does not fit in an unsigned int");
|
|
goto error_outer;
|
|
}
|
|
input = pinput.buf;
|
|
inplen = pinput.len;
|
|
|
|
if (!(RetVal = PyBytes_FromStringAndSize(NULL, length)))
|
|
goto error_outer;
|
|
|
|
ENTER_ZLIB(self);
|
|
|
|
start_total_out = self->zst.total_out;
|
|
self->zst.avail_in = inplen;
|
|
self->zst.next_in = input;
|
|
self->zst.avail_out = length;
|
|
self->zst.next_out = (unsigned char *)PyBytes_AS_STRING(RetVal);
|
|
|
|
Py_BEGIN_ALLOW_THREADS
|
|
err = deflate(&(self->zst), Z_NO_FLUSH);
|
|
Py_END_ALLOW_THREADS
|
|
|
|
/* while Z_OK and the output buffer is full, there might be more output,
|
|
so extend the output buffer and try again */
|
|
while (err == Z_OK && self->zst.avail_out == 0) {
|
|
if (_PyBytes_Resize(&RetVal, length << 1) < 0) {
|
|
Py_DECREF(RetVal);
|
|
RetVal = NULL;
|
|
goto error;
|
|
}
|
|
self->zst.next_out =
|
|
(unsigned char *)PyBytes_AS_STRING(RetVal) + length;
|
|
self->zst.avail_out = length;
|
|
length = length << 1;
|
|
|
|
Py_BEGIN_ALLOW_THREADS
|
|
err = deflate(&(self->zst), Z_NO_FLUSH);
|
|
Py_END_ALLOW_THREADS
|
|
}
|
|
/* We will only get Z_BUF_ERROR if the output buffer was full but
|
|
there wasn't more output when we tried again, so it is not an error
|
|
condition.
|
|
*/
|
|
|
|
if (err != Z_OK && err != Z_BUF_ERROR) {
|
|
zlib_error(self->zst, err, "while compressing");
|
|
Py_DECREF(RetVal);
|
|
RetVal = NULL;
|
|
goto error;
|
|
}
|
|
if (_PyBytes_Resize(&RetVal, self->zst.total_out - start_total_out) < 0) {
|
|
Py_DECREF(RetVal);
|
|
RetVal = NULL;
|
|
}
|
|
|
|
error:
|
|
LEAVE_ZLIB(self);
|
|
error_outer:
|
|
PyBuffer_Release(&pinput);
|
|
return RetVal;
|
|
}
|
|
|
|
/* Helper for objdecompress() and unflush(). Saves any unconsumed input data in
|
|
self->unused_data or self->unconsumed_tail, as appropriate. */
|
|
static int
|
|
save_unconsumed_input(compobject *self, int err)
|
|
{
|
|
if (err == Z_STREAM_END) {
|
|
/* The end of the compressed data has been reached. Store the leftover
|
|
input data in self->unused_data. */
|
|
if (self->zst.avail_in > 0) {
|
|
Py_ssize_t old_size = PyBytes_GET_SIZE(self->unused_data);
|
|
Py_ssize_t new_size;
|
|
PyObject *new_data;
|
|
if (self->zst.avail_in > PY_SSIZE_T_MAX - old_size) {
|
|
PyErr_NoMemory();
|
|
return -1;
|
|
}
|
|
new_size = old_size + self->zst.avail_in;
|
|
new_data = PyBytes_FromStringAndSize(NULL, new_size);
|
|
if (new_data == NULL)
|
|
return -1;
|
|
Py_MEMCPY(PyBytes_AS_STRING(new_data),
|
|
PyBytes_AS_STRING(self->unused_data), old_size);
|
|
Py_MEMCPY(PyBytes_AS_STRING(new_data) + old_size,
|
|
self->zst.next_in, self->zst.avail_in);
|
|
Py_DECREF(self->unused_data);
|
|
self->unused_data = new_data;
|
|
self->zst.avail_in = 0;
|
|
}
|
|
}
|
|
if (self->zst.avail_in > 0 || PyBytes_GET_SIZE(self->unconsumed_tail)) {
|
|
/* This code handles two distinct cases:
|
|
1. Output limit was reached. Save leftover input in unconsumed_tail.
|
|
2. All input data was consumed. Clear unconsumed_tail. */
|
|
PyObject *new_data = PyBytes_FromStringAndSize(
|
|
(char *)self->zst.next_in, self->zst.avail_in);
|
|
if (new_data == NULL)
|
|
return -1;
|
|
Py_DECREF(self->unconsumed_tail);
|
|
self->unconsumed_tail = new_data;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
PyDoc_STRVAR(decomp_decompress__doc__,
|
|
"decompress(data, max_length) -- Return a string containing the decompressed\n"
|
|
"version of the data.\n"
|
|
"\n"
|
|
"After calling this function, some of the input data may still be stored in\n"
|
|
"internal buffers for later processing.\n"
|
|
"Call the flush() method to clear these buffers.\n"
|
|
"If the max_length parameter is specified then the return value will be\n"
|
|
"no longer than max_length. Unconsumed input data will be stored in\n"
|
|
"the unconsumed_tail attribute.");
|
|
|
|
static PyObject *
|
|
PyZlib_objdecompress(compobject *self, PyObject *args)
|
|
{
|
|
int err, max_length = 0;
|
|
unsigned int inplen;
|
|
Py_ssize_t old_length, length = DEFAULTALLOC;
|
|
PyObject *RetVal = NULL;
|
|
Py_buffer pinput;
|
|
Byte *input;
|
|
unsigned long start_total_out;
|
|
|
|
if (!PyArg_ParseTuple(args, "y*|i:decompress", &pinput,
|
|
&max_length))
|
|
return NULL;
|
|
if (pinput.len > UINT_MAX) {
|
|
PyErr_SetString(PyExc_OverflowError,
|
|
"Size does not fit in an unsigned int");
|
|
goto error_outer;
|
|
}
|
|
input = pinput.buf;
|
|
inplen = pinput.len;
|
|
if (max_length < 0) {
|
|
PyErr_SetString(PyExc_ValueError,
|
|
"max_length must be greater than zero");
|
|
goto error_outer;
|
|
}
|
|
|
|
/* limit amount of data allocated to max_length */
|
|
if (max_length && length > max_length)
|
|
length = max_length;
|
|
if (!(RetVal = PyBytes_FromStringAndSize(NULL, length)))
|
|
goto error_outer;
|
|
|
|
ENTER_ZLIB(self);
|
|
|
|
start_total_out = self->zst.total_out;
|
|
self->zst.avail_in = inplen;
|
|
self->zst.next_in = input;
|
|
self->zst.avail_out = length;
|
|
self->zst.next_out = (unsigned char *)PyBytes_AS_STRING(RetVal);
|
|
|
|
Py_BEGIN_ALLOW_THREADS
|
|
err = inflate(&(self->zst), Z_SYNC_FLUSH);
|
|
Py_END_ALLOW_THREADS
|
|
|
|
/* While Z_OK and the output buffer is full, there might be more output.
|
|
So extend the output buffer and try again.
|
|
*/
|
|
while (err == Z_OK && self->zst.avail_out == 0) {
|
|
/* If max_length set, don't continue decompressing if we've already
|
|
reached the limit.
|
|
*/
|
|
if (max_length && length >= max_length)
|
|
break;
|
|
|
|
/* otherwise, ... */
|
|
old_length = length;
|
|
length = length << 1;
|
|
if (max_length && length > max_length)
|
|
length = max_length;
|
|
|
|
if (_PyBytes_Resize(&RetVal, length) < 0) {
|
|
Py_DECREF(RetVal);
|
|
RetVal = NULL;
|
|
goto error;
|
|
}
|
|
self->zst.next_out =
|
|
(unsigned char *)PyBytes_AS_STRING(RetVal) + old_length;
|
|
self->zst.avail_out = length - old_length;
|
|
|
|
Py_BEGIN_ALLOW_THREADS
|
|
err = inflate(&(self->zst), Z_SYNC_FLUSH);
|
|
Py_END_ALLOW_THREADS
|
|
}
|
|
|
|
if (save_unconsumed_input(self, err) < 0) {
|
|
Py_DECREF(RetVal);
|
|
RetVal = NULL;
|
|
goto error;
|
|
}
|
|
|
|
/* This is the logical place to call inflateEnd, but the old behaviour of
|
|
only calling it on flush() is preserved. */
|
|
|
|
if (err != Z_STREAM_END && err != Z_OK && err != Z_BUF_ERROR) {
|
|
/* We will only get Z_BUF_ERROR if the output buffer was full
|
|
but there wasn't more output when we tried again, so it is
|
|
not an error condition.
|
|
*/
|
|
zlib_error(self->zst, err, "while decompressing");
|
|
Py_DECREF(RetVal);
|
|
RetVal = NULL;
|
|
goto error;
|
|
}
|
|
|
|
if (_PyBytes_Resize(&RetVal, self->zst.total_out - start_total_out) < 0) {
|
|
Py_DECREF(RetVal);
|
|
RetVal = NULL;
|
|
}
|
|
|
|
error:
|
|
LEAVE_ZLIB(self);
|
|
error_outer:
|
|
PyBuffer_Release(&pinput);
|
|
return RetVal;
|
|
}
|
|
|
|
PyDoc_STRVAR(comp_flush__doc__,
|
|
"flush( [mode] ) -- Return a string containing any remaining compressed data.\n"
|
|
"\n"
|
|
"mode can be one of the constants Z_SYNC_FLUSH, Z_FULL_FLUSH, Z_FINISH; the\n"
|
|
"default value used when mode is not specified is Z_FINISH.\n"
|
|
"If mode == Z_FINISH, the compressor object can no longer be used after\n"
|
|
"calling the flush() method. Otherwise, more data can still be compressed.");
|
|
|
|
static PyObject *
|
|
PyZlib_flush(compobject *self, PyObject *args)
|
|
{
|
|
int err, length = DEFAULTALLOC;
|
|
PyObject *RetVal;
|
|
int flushmode = Z_FINISH;
|
|
unsigned long start_total_out;
|
|
|
|
if (!PyArg_ParseTuple(args, "|i:flush", &flushmode))
|
|
return NULL;
|
|
|
|
/* Flushing with Z_NO_FLUSH is a no-op, so there's no point in
|
|
doing any work at all; just return an empty string. */
|
|
if (flushmode == Z_NO_FLUSH) {
|
|
return PyBytes_FromStringAndSize(NULL, 0);
|
|
}
|
|
|
|
if (!(RetVal = PyBytes_FromStringAndSize(NULL, length)))
|
|
return NULL;
|
|
|
|
ENTER_ZLIB(self);
|
|
|
|
start_total_out = self->zst.total_out;
|
|
self->zst.avail_in = 0;
|
|
self->zst.avail_out = length;
|
|
self->zst.next_out = (unsigned char *)PyBytes_AS_STRING(RetVal);
|
|
|
|
Py_BEGIN_ALLOW_THREADS
|
|
err = deflate(&(self->zst), flushmode);
|
|
Py_END_ALLOW_THREADS
|
|
|
|
/* while Z_OK and the output buffer is full, there might be more output,
|
|
so extend the output buffer and try again */
|
|
while (err == Z_OK && self->zst.avail_out == 0) {
|
|
if (_PyBytes_Resize(&RetVal, length << 1) < 0) {
|
|
Py_DECREF(RetVal);
|
|
RetVal = NULL;
|
|
goto error;
|
|
}
|
|
self->zst.next_out =
|
|
(unsigned char *)PyBytes_AS_STRING(RetVal) + length;
|
|
self->zst.avail_out = length;
|
|
length = length << 1;
|
|
|
|
Py_BEGIN_ALLOW_THREADS
|
|
err = deflate(&(self->zst), flushmode);
|
|
Py_END_ALLOW_THREADS
|
|
}
|
|
|
|
/* If flushmode is Z_FINISH, we also have to call deflateEnd() to free
|
|
various data structures. Note we should only get Z_STREAM_END when
|
|
flushmode is Z_FINISH, but checking both for safety*/
|
|
if (err == Z_STREAM_END && flushmode == Z_FINISH) {
|
|
err = deflateEnd(&(self->zst));
|
|
if (err != Z_OK) {
|
|
zlib_error(self->zst, err, "from deflateEnd()");
|
|
Py_DECREF(RetVal);
|
|
RetVal = NULL;
|
|
goto error;
|
|
}
|
|
else
|
|
self->is_initialised = 0;
|
|
|
|
/* We will only get Z_BUF_ERROR if the output buffer was full
|
|
but there wasn't more output when we tried again, so it is
|
|
not an error condition.
|
|
*/
|
|
} else if (err!=Z_OK && err!=Z_BUF_ERROR) {
|
|
zlib_error(self->zst, err, "while flushing");
|
|
Py_DECREF(RetVal);
|
|
RetVal = NULL;
|
|
goto error;
|
|
}
|
|
|
|
if (_PyBytes_Resize(&RetVal, self->zst.total_out - start_total_out) < 0) {
|
|
Py_DECREF(RetVal);
|
|
RetVal = NULL;
|
|
}
|
|
|
|
error:
|
|
LEAVE_ZLIB(self);
|
|
|
|
return RetVal;
|
|
}
|
|
|
|
#ifdef HAVE_ZLIB_COPY
|
|
PyDoc_STRVAR(comp_copy__doc__,
|
|
"copy() -- Return a copy of the compression object.");
|
|
|
|
static PyObject *
|
|
PyZlib_copy(compobject *self)
|
|
{
|
|
compobject *retval = NULL;
|
|
int err;
|
|
|
|
retval = newcompobject(&Comptype);
|
|
if (!retval) return NULL;
|
|
|
|
/* Copy the zstream state
|
|
* We use ENTER_ZLIB / LEAVE_ZLIB to make this thread-safe
|
|
*/
|
|
ENTER_ZLIB(self);
|
|
err = deflateCopy(&retval->zst, &self->zst);
|
|
switch(err) {
|
|
case(Z_OK):
|
|
break;
|
|
case(Z_STREAM_ERROR):
|
|
PyErr_SetString(PyExc_ValueError, "Inconsistent stream state");
|
|
goto error;
|
|
case(Z_MEM_ERROR):
|
|
PyErr_SetString(PyExc_MemoryError,
|
|
"Can't allocate memory for compression object");
|
|
goto error;
|
|
default:
|
|
zlib_error(self->zst, err, "while copying compression object");
|
|
goto error;
|
|
}
|
|
Py_INCREF(self->unused_data);
|
|
Py_INCREF(self->unconsumed_tail);
|
|
Py_XDECREF(retval->unused_data);
|
|
Py_XDECREF(retval->unconsumed_tail);
|
|
retval->unused_data = self->unused_data;
|
|
retval->unconsumed_tail = self->unconsumed_tail;
|
|
|
|
/* Mark it as being initialized */
|
|
retval->is_initialised = 1;
|
|
|
|
LEAVE_ZLIB(self);
|
|
return (PyObject *)retval;
|
|
|
|
error:
|
|
LEAVE_ZLIB(self);
|
|
Py_XDECREF(retval);
|
|
return NULL;
|
|
}
|
|
|
|
PyDoc_STRVAR(decomp_copy__doc__,
|
|
"copy() -- Return a copy of the decompression object.");
|
|
|
|
static PyObject *
|
|
PyZlib_uncopy(compobject *self)
|
|
{
|
|
compobject *retval = NULL;
|
|
int err;
|
|
|
|
retval = newcompobject(&Decomptype);
|
|
if (!retval) return NULL;
|
|
|
|
/* Copy the zstream state
|
|
* We use ENTER_ZLIB / LEAVE_ZLIB to make this thread-safe
|
|
*/
|
|
ENTER_ZLIB(self);
|
|
err = inflateCopy(&retval->zst, &self->zst);
|
|
switch(err) {
|
|
case(Z_OK):
|
|
break;
|
|
case(Z_STREAM_ERROR):
|
|
PyErr_SetString(PyExc_ValueError, "Inconsistent stream state");
|
|
goto error;
|
|
case(Z_MEM_ERROR):
|
|
PyErr_SetString(PyExc_MemoryError,
|
|
"Can't allocate memory for decompression object");
|
|
goto error;
|
|
default:
|
|
zlib_error(self->zst, err, "while copying decompression object");
|
|
goto error;
|
|
}
|
|
|
|
Py_INCREF(self->unused_data);
|
|
Py_INCREF(self->unconsumed_tail);
|
|
Py_XDECREF(retval->unused_data);
|
|
Py_XDECREF(retval->unconsumed_tail);
|
|
retval->unused_data = self->unused_data;
|
|
retval->unconsumed_tail = self->unconsumed_tail;
|
|
|
|
/* Mark it as being initialized */
|
|
retval->is_initialised = 1;
|
|
|
|
LEAVE_ZLIB(self);
|
|
return (PyObject *)retval;
|
|
|
|
error:
|
|
LEAVE_ZLIB(self);
|
|
Py_XDECREF(retval);
|
|
return NULL;
|
|
}
|
|
#endif
|
|
|
|
PyDoc_STRVAR(decomp_flush__doc__,
|
|
"flush( [length] ) -- Return a string containing any remaining\n"
|
|
"decompressed data. length, if given, is the initial size of the\n"
|
|
"output buffer.\n"
|
|
"\n"
|
|
"The decompressor object can no longer be used after this call.");
|
|
|
|
static PyObject *
|
|
PyZlib_unflush(compobject *self, PyObject *args)
|
|
{
|
|
int err, length = DEFAULTALLOC;
|
|
PyObject * retval = NULL;
|
|
unsigned long start_total_out;
|
|
|
|
if (!PyArg_ParseTuple(args, "|i:flush", &length))
|
|
return NULL;
|
|
if (length <= 0) {
|
|
PyErr_SetString(PyExc_ValueError, "length must be greater than zero");
|
|
return NULL;
|
|
}
|
|
if (!(retval = PyBytes_FromStringAndSize(NULL, length)))
|
|
return NULL;
|
|
|
|
|
|
ENTER_ZLIB(self);
|
|
|
|
start_total_out = self->zst.total_out;
|
|
self->zst.avail_in = PyBytes_GET_SIZE(self->unconsumed_tail);
|
|
self->zst.next_in = (Byte *)PyBytes_AS_STRING(self->unconsumed_tail);
|
|
self->zst.avail_out = length;
|
|
self->zst.next_out = (Byte *)PyBytes_AS_STRING(retval);
|
|
|
|
Py_BEGIN_ALLOW_THREADS
|
|
err = inflate(&(self->zst), Z_FINISH);
|
|
Py_END_ALLOW_THREADS
|
|
|
|
/* while Z_OK and the output buffer is full, there might be more output,
|
|
so extend the output buffer and try again */
|
|
while ((err == Z_OK || err == Z_BUF_ERROR) && self->zst.avail_out == 0) {
|
|
if (_PyBytes_Resize(&retval, length << 1) < 0) {
|
|
Py_DECREF(retval);
|
|
retval = NULL;
|
|
goto error;
|
|
}
|
|
self->zst.next_out = (Byte *)PyBytes_AS_STRING(retval) + length;
|
|
self->zst.avail_out = length;
|
|
length = length << 1;
|
|
|
|
Py_BEGIN_ALLOW_THREADS
|
|
err = inflate(&(self->zst), Z_FINISH);
|
|
Py_END_ALLOW_THREADS
|
|
}
|
|
|
|
if (save_unconsumed_input(self, err) < 0) {
|
|
Py_DECREF(retval);
|
|
retval = NULL;
|
|
goto error;
|
|
}
|
|
|
|
/* If flushmode is Z_FINISH, we also have to call deflateEnd() to free
|
|
various data structures. Note we should only get Z_STREAM_END when
|
|
flushmode is Z_FINISH */
|
|
if (err == Z_STREAM_END) {
|
|
err = inflateEnd(&(self->zst));
|
|
self->is_initialised = 0;
|
|
if (err != Z_OK) {
|
|
zlib_error(self->zst, err, "from inflateEnd()");
|
|
Py_DECREF(retval);
|
|
retval = NULL;
|
|
goto error;
|
|
}
|
|
}
|
|
|
|
if (_PyBytes_Resize(&retval, self->zst.total_out - start_total_out) < 0) {
|
|
Py_DECREF(retval);
|
|
retval = NULL;
|
|
}
|
|
|
|
error:
|
|
|
|
LEAVE_ZLIB(self);
|
|
|
|
return retval;
|
|
}
|
|
|
|
static PyMethodDef comp_methods[] =
|
|
{
|
|
{"compress", (binaryfunc)PyZlib_objcompress, METH_VARARGS,
|
|
comp_compress__doc__},
|
|
{"flush", (binaryfunc)PyZlib_flush, METH_VARARGS,
|
|
comp_flush__doc__},
|
|
#ifdef HAVE_ZLIB_COPY
|
|
{"copy", (PyCFunction)PyZlib_copy, METH_NOARGS,
|
|
comp_copy__doc__},
|
|
#endif
|
|
{NULL, NULL}
|
|
};
|
|
|
|
static PyMethodDef Decomp_methods[] =
|
|
{
|
|
{"decompress", (binaryfunc)PyZlib_objdecompress, METH_VARARGS,
|
|
decomp_decompress__doc__},
|
|
{"flush", (binaryfunc)PyZlib_unflush, METH_VARARGS,
|
|
decomp_flush__doc__},
|
|
#ifdef HAVE_ZLIB_COPY
|
|
{"copy", (PyCFunction)PyZlib_uncopy, METH_NOARGS,
|
|
decomp_copy__doc__},
|
|
#endif
|
|
{NULL, NULL}
|
|
};
|
|
|
|
#define COMP_OFF(x) offsetof(compobject, x)
|
|
static PyMemberDef Decomp_members[] = {
|
|
{"unused_data", T_OBJECT, COMP_OFF(unused_data), READONLY},
|
|
{"unconsumed_tail", T_OBJECT, COMP_OFF(unconsumed_tail), READONLY},
|
|
{NULL},
|
|
};
|
|
|
|
PyDoc_STRVAR(adler32__doc__,
|
|
"adler32(string[, start]) -- Compute an Adler-32 checksum of string.\n"
|
|
"\n"
|
|
"An optional starting value can be specified. The returned checksum is\n"
|
|
"an integer.");
|
|
|
|
static PyObject *
|
|
PyZlib_adler32(PyObject *self, PyObject *args)
|
|
{
|
|
unsigned int adler32val = 1; /* adler32(0L, Z_NULL, 0) */
|
|
Py_buffer pbuf;
|
|
|
|
if (!PyArg_ParseTuple(args, "y*|I:adler32", &pbuf, &adler32val))
|
|
return NULL;
|
|
/* Releasing the GIL for very small buffers is inefficient
|
|
and may lower performance */
|
|
if (pbuf.len > 1024*5) {
|
|
unsigned char *buf = pbuf.buf;
|
|
Py_ssize_t len = pbuf.len;
|
|
|
|
Py_BEGIN_ALLOW_THREADS
|
|
/* Avoid truncation of length for very large buffers. adler32() takes
|
|
length as an unsigned int, which may be narrower than Py_ssize_t. */
|
|
while (len > (size_t) UINT_MAX) {
|
|
adler32val = adler32(adler32val, buf, UINT_MAX);
|
|
buf += (size_t) UINT_MAX;
|
|
len -= (size_t) UINT_MAX;
|
|
}
|
|
adler32val = adler32(adler32val, buf, len);
|
|
Py_END_ALLOW_THREADS
|
|
} else {
|
|
adler32val = adler32(adler32val, pbuf.buf, pbuf.len);
|
|
}
|
|
PyBuffer_Release(&pbuf);
|
|
return PyLong_FromUnsignedLong(adler32val & 0xffffffffU);
|
|
}
|
|
|
|
PyDoc_STRVAR(crc32__doc__,
|
|
"crc32(string[, start]) -- Compute a CRC-32 checksum of string.\n"
|
|
"\n"
|
|
"An optional starting value can be specified. The returned checksum is\n"
|
|
"an integer.");
|
|
|
|
static PyObject *
|
|
PyZlib_crc32(PyObject *self, PyObject *args)
|
|
{
|
|
unsigned int crc32val = 0; /* crc32(0L, Z_NULL, 0) */
|
|
Py_buffer pbuf;
|
|
int signed_val;
|
|
|
|
if (!PyArg_ParseTuple(args, "y*|I:crc32", &pbuf, &crc32val))
|
|
return NULL;
|
|
/* Releasing the GIL for very small buffers is inefficient
|
|
and may lower performance */
|
|
if (pbuf.len > 1024*5) {
|
|
unsigned char *buf = pbuf.buf;
|
|
Py_ssize_t len = pbuf.len;
|
|
|
|
Py_BEGIN_ALLOW_THREADS
|
|
/* Avoid truncation of length for very large buffers. crc32() takes
|
|
length as an unsigned int, which may be narrower than Py_ssize_t. */
|
|
while (len > (size_t) UINT_MAX) {
|
|
crc32val = crc32(crc32val, buf, UINT_MAX);
|
|
buf += (size_t) UINT_MAX;
|
|
len -= (size_t) UINT_MAX;
|
|
}
|
|
signed_val = crc32(crc32val, buf, len);
|
|
Py_END_ALLOW_THREADS
|
|
} else {
|
|
signed_val = crc32(crc32val, pbuf.buf, pbuf.len);
|
|
}
|
|
PyBuffer_Release(&pbuf);
|
|
return PyLong_FromUnsignedLong(signed_val & 0xffffffffU);
|
|
}
|
|
|
|
|
|
static PyMethodDef zlib_methods[] =
|
|
{
|
|
{"adler32", (PyCFunction)PyZlib_adler32, METH_VARARGS,
|
|
adler32__doc__},
|
|
{"compress", (PyCFunction)PyZlib_compress, METH_VARARGS,
|
|
compress__doc__},
|
|
{"compressobj", (PyCFunction)PyZlib_compressobj, METH_VARARGS,
|
|
compressobj__doc__},
|
|
{"crc32", (PyCFunction)PyZlib_crc32, METH_VARARGS,
|
|
crc32__doc__},
|
|
{"decompress", (PyCFunction)PyZlib_decompress, METH_VARARGS,
|
|
decompress__doc__},
|
|
{"decompressobj", (PyCFunction)PyZlib_decompressobj, METH_VARARGS,
|
|
decompressobj__doc__},
|
|
{NULL, NULL}
|
|
};
|
|
|
|
static PyTypeObject Comptype = {
|
|
PyVarObject_HEAD_INIT(0, 0)
|
|
"zlib.Compress",
|
|
sizeof(compobject),
|
|
0,
|
|
(destructor)Comp_dealloc, /*tp_dealloc*/
|
|
0, /*tp_print*/
|
|
0, /*tp_getattr*/
|
|
0, /*tp_setattr*/
|
|
0, /*tp_reserved*/
|
|
0, /*tp_repr*/
|
|
0, /*tp_as_number*/
|
|
0, /*tp_as_sequence*/
|
|
0, /*tp_as_mapping*/
|
|
0, /*tp_hash*/
|
|
0, /*tp_call*/
|
|
0, /*tp_str*/
|
|
0, /*tp_getattro*/
|
|
0, /*tp_setattro*/
|
|
0, /*tp_as_buffer*/
|
|
Py_TPFLAGS_DEFAULT, /*tp_flags*/
|
|
0, /*tp_doc*/
|
|
0, /*tp_traverse*/
|
|
0, /*tp_clear*/
|
|
0, /*tp_richcompare*/
|
|
0, /*tp_weaklistoffset*/
|
|
0, /*tp_iter*/
|
|
0, /*tp_iternext*/
|
|
comp_methods, /*tp_methods*/
|
|
};
|
|
|
|
static PyTypeObject Decomptype = {
|
|
PyVarObject_HEAD_INIT(0, 0)
|
|
"zlib.Decompress",
|
|
sizeof(compobject),
|
|
0,
|
|
(destructor)Decomp_dealloc, /*tp_dealloc*/
|
|
0, /*tp_print*/
|
|
0, /*tp_getattr*/
|
|
0, /*tp_setattr*/
|
|
0, /*tp_reserved*/
|
|
0, /*tp_repr*/
|
|
0, /*tp_as_number*/
|
|
0, /*tp_as_sequence*/
|
|
0, /*tp_as_mapping*/
|
|
0, /*tp_hash*/
|
|
0, /*tp_call*/
|
|
0, /*tp_str*/
|
|
0, /*tp_getattro*/
|
|
0, /*tp_setattro*/
|
|
0, /*tp_as_buffer*/
|
|
Py_TPFLAGS_DEFAULT, /*tp_flags*/
|
|
0, /*tp_doc*/
|
|
0, /*tp_traverse*/
|
|
0, /*tp_clear*/
|
|
0, /*tp_richcompare*/
|
|
0, /*tp_weaklistoffset*/
|
|
0, /*tp_iter*/
|
|
0, /*tp_iternext*/
|
|
Decomp_methods, /*tp_methods*/
|
|
Decomp_members, /*tp_members*/
|
|
};
|
|
|
|
PyDoc_STRVAR(zlib_module_documentation,
|
|
"The functions in this module allow compression and decompression using the\n"
|
|
"zlib library, which is based on GNU zip.\n"
|
|
"\n"
|
|
"adler32(string[, start]) -- Compute an Adler-32 checksum.\n"
|
|
"compress(string[, level]) -- Compress string, with compression level in 0-9.\n"
|
|
"compressobj([level]) -- Return a compressor object.\n"
|
|
"crc32(string[, start]) -- Compute a CRC-32 checksum.\n"
|
|
"decompress(string,[wbits],[bufsize]) -- Decompresses a compressed string.\n"
|
|
"decompressobj([wbits]) -- Return a decompressor object.\n"
|
|
"\n"
|
|
"'wbits' is window buffer size.\n"
|
|
"Compressor objects support compress() and flush() methods; decompressor\n"
|
|
"objects support decompress() and flush().");
|
|
|
|
static struct PyModuleDef zlibmodule = {
|
|
PyModuleDef_HEAD_INIT,
|
|
"zlib",
|
|
zlib_module_documentation,
|
|
-1,
|
|
zlib_methods,
|
|
NULL,
|
|
NULL,
|
|
NULL,
|
|
NULL
|
|
};
|
|
|
|
PyMODINIT_FUNC
|
|
PyInit_zlib(void)
|
|
{
|
|
PyObject *m, *ver;
|
|
if (PyType_Ready(&Comptype) < 0)
|
|
return NULL;
|
|
if (PyType_Ready(&Decomptype) < 0)
|
|
return NULL;
|
|
m = PyModule_Create(&zlibmodule);
|
|
if (m == NULL)
|
|
return NULL;
|
|
|
|
ZlibError = PyErr_NewException("zlib.error", NULL, NULL);
|
|
if (ZlibError != NULL) {
|
|
Py_INCREF(ZlibError);
|
|
PyModule_AddObject(m, "error", ZlibError);
|
|
}
|
|
PyModule_AddIntConstant(m, "MAX_WBITS", MAX_WBITS);
|
|
PyModule_AddIntConstant(m, "DEFLATED", DEFLATED);
|
|
PyModule_AddIntConstant(m, "DEF_MEM_LEVEL", DEF_MEM_LEVEL);
|
|
PyModule_AddIntConstant(m, "Z_BEST_SPEED", Z_BEST_SPEED);
|
|
PyModule_AddIntConstant(m, "Z_BEST_COMPRESSION", Z_BEST_COMPRESSION);
|
|
PyModule_AddIntConstant(m, "Z_DEFAULT_COMPRESSION", Z_DEFAULT_COMPRESSION);
|
|
PyModule_AddIntConstant(m, "Z_FILTERED", Z_FILTERED);
|
|
PyModule_AddIntConstant(m, "Z_HUFFMAN_ONLY", Z_HUFFMAN_ONLY);
|
|
PyModule_AddIntConstant(m, "Z_DEFAULT_STRATEGY", Z_DEFAULT_STRATEGY);
|
|
|
|
PyModule_AddIntConstant(m, "Z_FINISH", Z_FINISH);
|
|
PyModule_AddIntConstant(m, "Z_NO_FLUSH", Z_NO_FLUSH);
|
|
PyModule_AddIntConstant(m, "Z_SYNC_FLUSH", Z_SYNC_FLUSH);
|
|
PyModule_AddIntConstant(m, "Z_FULL_FLUSH", Z_FULL_FLUSH);
|
|
|
|
ver = PyUnicode_FromString(ZLIB_VERSION);
|
|
if (ver != NULL)
|
|
PyModule_AddObject(m, "ZLIB_VERSION", ver);
|
|
|
|
PyModule_AddStringConstant(m, "__version__", "1.0");
|
|
|
|
return m;
|
|
}
|