cpython/Modules/zlibmodule.c

1164 lines
34 KiB
C
Raw Normal View History

1997-04-29 12:38:09 -03:00
/* zlibmodule.c -- gzip-compatible data compression */
/* See http://zlib.net/ */
/* Windows users: read Python's PCbuild\readme.txt */
#define PY_SSIZE_T_CLEAN
1997-04-29 12:38:09 -03:00
#include "Python.h"
#include "zlib.h"
1997-04-29 12:38:09 -03:00
#ifdef WITH_THREAD
#include "pythread.h"

/* Locking for compressor/decompressor objects.

   The #defines were borrowed from _tkinter.c, although the situation here
   is much simpler: there are no Tcl events to wait for, and since zlib
   itself is threadsafe there is no need to worry about re-entering zlib
   functions.

   ENTER_ZLIB releases the GIL while it waits for zlib_lock, so a thread
   blocked on the lock does not stall the interpreter.  LEAVE_ZLIB releases
   the lock again.  Both macros already end their last statement, so they
   are written without a trailing semicolon at the call site.

   N.B.
   ENTER_ZLIB and LEAVE_ZLIB only need to be used by functions that modify
   the components of an existing de/compress object, so a lock per object
   could be a performance gain on multiprocessor machines.  For the moment
   a single global lock covers ALL de/compress objects.
*/
static PyThread_type_lock zlib_lock = NULL; /* initialized on module load */

#define ENTER_ZLIB                              \
    Py_BEGIN_ALLOW_THREADS                      \
    PyThread_acquire_lock(zlib_lock, 1);        \
    Py_END_ALLOW_THREADS

#define LEAVE_ZLIB                              \
    PyThread_release_lock(zlib_lock);

#else /* !WITH_THREAD */

/* Without thread support there is nothing to lock. */
#define ENTER_ZLIB
#define LEAVE_ZLIB

#endif /* WITH_THREAD */
1997-04-29 12:38:09 -03:00
/* The following parameters are copied from zutil.h, version 0.95 */
#define DEFLATED 8
#if MAX_MEM_LEVEL >= 8
# define DEF_MEM_LEVEL 8
#else
# define DEF_MEM_LEVEL MAX_MEM_LEVEL
#endif
#define DEF_WBITS MAX_WBITS
/* The output buffer will be increased in chunks of DEFAULTALLOC bytes. */
#define DEFAULTALLOC (16*1024)
1997-04-29 12:38:09 -03:00
#define PyInit_zlib initzlib
static PyTypeObject Comptype;
static PyTypeObject Decomptype;
1997-04-29 12:38:09 -03:00
static PyObject *ZlibError;
2001-10-17 00:57:20 -03:00
typedef struct
1997-04-29 12:38:09 -03:00
{
PyObject_HEAD
z_stream zst;
PyObject *unused_data;
PyObject *unconsumed_tail;
int is_initialised;
1997-04-29 12:38:09 -03:00
} compobject;
/* Raise zlib.error for the zlib return code `err`.

   `msg` says what the module was doing (e.g. "while compressing data").
   The exception text is "Error <err> <msg>", followed by ": <detail>" when
   a detail string is available.  The detail comes, in order of preference,
   from a fixed string for Z_VERSION_ERROR, from zst.msg, or from a built-in
   description of a few well-known error codes. */
static void
zlib_error(z_stream zst, int err, char *msg)
{
    const char *detail;

    /* In case of a version mismatch, zst.msg won't be initialized, so it
       must not be looked at. */
    if (err == Z_VERSION_ERROR)
        detail = "library version mismatch";
    else
        detail = zst.msg;

    if (detail == Z_NULL) {
        if (err == Z_BUF_ERROR)
            detail = "incomplete or truncated stream";
        else if (err == Z_STREAM_ERROR)
            detail = "inconsistent stream state";
        else if (err == Z_DATA_ERROR)
            detail = "invalid input data";
    }

    if (detail != Z_NULL)
        PyErr_Format(ZlibError, "Error %d %s: %.200s", err, msg, detail);
    else
        PyErr_Format(ZlibError, "Error %d %s", err, msg);
}
2002-06-13 17:33:02 -03:00
/* Docstring for zlib.compressobj().  PyZlib_compressobj() accepts five
   optional integers, all of which are listed here. */
PyDoc_STRVAR(compressobj__doc__,
"compressobj([level[, method[, wbits[, memlevel[, strategy]]]]]) -- Return a\n"
"compressor object.\n"
"\n"
"Optional arg level is the compression level, in 0-9 or -1.\n"
"The other optional args (method, wbits, memlevel, strategy) are passed\n"
"through to zlib's deflateInit2().");

/* Docstring for zlib.decompressobj(). */
PyDoc_STRVAR(decompressobj__doc__,
"decompressobj([wbits]) -- Return a decompressor object.\n"
"\n"
"Optional arg wbits indicates the window buffer size and container format.");
1997-06-03 19:21:03 -03:00
1997-04-29 12:38:09 -03:00
static compobject *
2000-07-10 06:57:19 -03:00
newcompobject(PyTypeObject *type)
1997-04-29 12:38:09 -03:00
{
2001-10-17 00:57:20 -03:00
compobject *self;
self = PyObject_New(compobject, type);
if (self == NULL)
return NULL;
self->is_initialised = 0;
self->unused_data = PyString_FromString("");
if (self->unused_data == NULL) {
Py_DECREF(self);
return NULL;
}
self->unconsumed_tail = PyString_FromString("");
if (self->unconsumed_tail == NULL) {
Py_DECREF(self);
return NULL;
}
return self;
1997-04-29 12:38:09 -03:00
}
/* Hand zlib the next slice of input.

   zst->avail_in is set to as much of *remains as it can take, at most
   UINT_MAX, and *remains is reduced by that amount.  zst->next_in is not
   touched; the caller sets it up. */
static void
arrange_input_buffer(z_stream *zst, Py_ssize_t *remains)
{
    const size_t pending = (size_t)*remains;
    unsigned int chunk = (pending > UINT_MAX) ? UINT_MAX
                                              : (unsigned int)pending;

    zst->avail_in = chunk;
    *remains -= chunk;
}
/* Make sure zlib has room to write output.

   If *buffer is NULL a new bytes object of `length` bytes is created.
   Otherwise, when the existing buffer is completely full, it is doubled in
   size, capped at max_length.  zst->next_out and zst->avail_out are then
   pointed at the free part of the buffer (avail_out is at most UINT_MAX).

   Returns the (possibly new) buffer length, -1 if allocating or resizing
   failed, or -2 if the buffer is full and already max_length bytes long. */
static Py_ssize_t
arrange_output_buffer_with_maximum(z_stream *zst, PyObject **buffer,
                                   Py_ssize_t length,
                                   Py_ssize_t max_length)
{
    Py_ssize_t used = 0;
    Py_ssize_t room;

    if (*buffer != NULL) {
        used = zst->next_out - (Byte *)PyBytes_AS_STRING(*buffer);
        if (used == length) {
            Py_ssize_t grown;

            assert(length <= max_length);
            /* can not scale the buffer over max_length */
            if (length == max_length)
                return -2;
            grown = (length <= (max_length >> 1)) ? (length << 1)
                                                  : max_length;
            if (_PyBytes_Resize(buffer, grown) < 0)
                return -1;
            length = grown;
        }
    }
    else {
        *buffer = PyBytes_FromStringAndSize(NULL, length);
        if (*buffer == NULL)
            return -1;
    }

    room = length - used;
    if ((size_t)room > UINT_MAX)
        zst->avail_out = UINT_MAX;
    else
        zst->avail_out = room;
    /* Recompute next_out from the buffer: a resize may have moved it. */
    zst->next_out = (Byte *)PyBytes_AS_STRING(*buffer) + used;

    return length;
}
/* Same as arrange_output_buffer_with_maximum() with PY_SSIZE_T_MAX as the
   limit.  Reaching that limit (-2) is reported as MemoryError; the negative
   return value is passed on to the caller unchanged. */
static Py_ssize_t
arrange_output_buffer(z_stream *zst, PyObject **buffer, Py_ssize_t length)
{
    Py_ssize_t new_length = arrange_output_buffer_with_maximum(
        zst, buffer, length, PY_SSIZE_T_MAX);

    if (new_length == -2) {
        PyErr_NoMemory();
    }
    return new_length;
}
2002-06-13 17:33:02 -03:00
PyDoc_STRVAR(compress__doc__,
"compress(string[, level]) -- Returned compressed string.\n"
"\n"
"Optional arg level is the compression level, in 0-9.");
1997-06-03 19:21:03 -03:00
1997-04-29 12:38:09 -03:00
static PyObject *
2000-07-10 06:57:19 -03:00
PyZlib_compress(PyObject *self, PyObject *args)
1997-04-29 12:38:09 -03:00
{
PyObject *RetVal = NULL;
Byte *ibuf;
Py_ssize_t ibuflen, obuflen = DEFAULTALLOC;
int level=Z_DEFAULT_COMPRESSION;
int err, flush;
z_stream zst;
2001-10-17 00:57:20 -03:00
/* require Python string object, optional 'level' arg */
if (!PyArg_ParseTuple(args, "s#|i:compress", &ibuf, &ibuflen, &level))
return NULL;
zst.zalloc = (alloc_func)NULL;
zst.zfree = (free_func)Z_NULL;
zst.next_in = ibuf;
err = deflateInit(&zst, level);
switch (err) {
case Z_OK:
break;
case Z_MEM_ERROR:
PyErr_SetString(PyExc_MemoryError,
"Out of memory while compressing data");
goto error;
case Z_STREAM_ERROR:
PyErr_SetString(ZlibError, "Bad compression level");
goto error;
default:
1997-04-29 12:38:09 -03:00
deflateEnd(&zst);
zlib_error(zst, err, "while compressing data");
goto error;
1997-04-29 12:38:09 -03:00
}
do {
arrange_input_buffer(&zst, &ibuflen);
flush = ibuflen == 0 ? Z_FINISH : Z_NO_FLUSH;
do {
obuflen = arrange_output_buffer(&zst, &RetVal, obuflen);
if (obuflen < 0) {
deflateEnd(&zst);
goto error;
}
Py_BEGIN_ALLOW_THREADS
err = deflate(&zst, flush);
Py_END_ALLOW_THREADS
if (err == Z_STREAM_ERROR) {
deflateEnd(&zst);
zlib_error(zst, err, "while compressing data");
goto error;
}
} while (zst.avail_out == 0);
assert(zst.avail_in == 0);
2001-10-17 00:57:20 -03:00
} while (flush != Z_FINISH);
assert(err == Z_STREAM_END);
err = deflateEnd(&zst);
if (err == Z_OK) {
if (_PyBytes_Resize(&RetVal, zst.next_out -
(Byte *)PyBytes_AS_STRING(RetVal)) < 0)
goto error;
return RetVal;
}
2001-10-17 00:57:20 -03:00
else
zlib_error(zst, err, "while finishing compression");
error:
Py_XDECREF(RetVal);
return NULL;
1997-04-29 12:38:09 -03:00
}
2002-06-13 17:33:02 -03:00
PyDoc_STRVAR(decompress__doc__,
"decompress(string[, wbits[, bufsize]]) -- Return decompressed string.\n"
"\n"
"Optional arg wbits indicates the window buffer size and container format.\n"
"Optional arg bufsize is the initial output buffer size.");
1997-06-03 19:21:03 -03:00
1997-04-29 12:38:09 -03:00
static PyObject *
2000-07-10 06:57:19 -03:00
PyZlib_decompress(PyObject *self, PyObject *args)
1997-04-29 12:38:09 -03:00
{
PyObject *RetVal = NULL;
Byte *ibuf;
Py_ssize_t ibuflen;
int err, flush;
int wsize=DEF_WBITS;
Py_ssize_t r_strlen=DEFAULTALLOC;
z_stream zst;
if (!PyArg_ParseTuple(args, "s#|in:decompress",
&ibuf, &ibuflen, &wsize, &r_strlen))
return NULL;
if (r_strlen <= 0) {
r_strlen = 1;
}
zst.zalloc = (alloc_func)NULL;
zst.zfree = (free_func)Z_NULL;
zst.avail_in = 0;
zst.next_in = ibuf;
err = inflateInit2(&zst, wsize);
switch (err) {
case Z_OK:
break;
case Z_MEM_ERROR:
PyErr_SetString(PyExc_MemoryError,
"Out of memory while decompressing data");
goto error;
default:
1997-04-29 12:38:09 -03:00
inflateEnd(&zst);
zlib_error(zst, err, "while preparing to decompress data");
goto error;
1997-04-29 12:38:09 -03:00
}
do {
arrange_input_buffer(&zst, &ibuflen);
flush = ibuflen == 0 ? Z_FINISH : Z_NO_FLUSH;
do {
r_strlen = arrange_output_buffer(&zst, &RetVal, r_strlen);
if (r_strlen < 0) {
inflateEnd(&zst);
goto error;
}
Py_BEGIN_ALLOW_THREADS
err = inflate(&zst, flush);
Py_END_ALLOW_THREADS
switch (err) {
case Z_OK: /* fall through */
case Z_BUF_ERROR: /* fall through */
case Z_STREAM_END:
break;
case Z_MEM_ERROR:
inflateEnd(&zst);
PyErr_SetString(PyExc_MemoryError,
"Out of memory while decompressing data");
goto error;
default:
inflateEnd(&zst);
zlib_error(zst, err, "while decompressing data");
goto error;
}
} while (zst.avail_out == 0);
} while (err != Z_STREAM_END && ibuflen != 0);
if (err != Z_STREAM_END) {
inflateEnd(&zst);
zlib_error(zst, err, "while decompressing data");
goto error;
}
err = inflateEnd(&zst);
if (err != Z_OK) {
zlib_error(zst, err, "while finishing data decompression");
goto error;
1997-04-29 12:38:09 -03:00
}
_PyString_Resize(&RetVal, zst.next_out -
(Byte *)PyBytes_AS_STRING(RetVal));
return RetVal;
error:
Py_XDECREF(RetVal);
return NULL;
1997-04-29 12:38:09 -03:00
}
/* zlib.compressobj([level[, method[, wbits[, memLevel[, strategy]]]]]):
   create a zlib.Compress object.

   The five optional integers are handed to deflateInit2() unchanged.
   Returns the new object, or NULL with MemoryError, ValueError or
   zlib.error set. */
static PyObject *
PyZlib_compressobj(PyObject *selfptr, PyObject *args)
{
    compobject *self;
    int level=Z_DEFAULT_COMPRESSION, method=DEFLATED;
    int wbits=MAX_WBITS, memLevel=DEF_MEM_LEVEL, strategy=0, err;

    if (!PyArg_ParseTuple(args, "|iiiii:compressobj", &level, &method, &wbits,
                          &memLevel, &strategy))
        return NULL;

    self = newcompobject(&Comptype);
    if (self == NULL)
        return(NULL);

    /* zlib requires zalloc, zfree and opaque to be set before deflateInit2() */
    self->zst.zalloc = (alloc_func)NULL;
    self->zst.zfree = (free_func)Z_NULL;
    self->zst.opaque = Z_NULL;
    self->zst.next_in = NULL;
    self->zst.avail_in = 0;

    err = deflateInit2(&self->zst, level, method, wbits, memLevel, strategy);
    switch (err) {
    case Z_OK:
        /* from now on the deallocator has to call deflateEnd() */
        self->is_initialised = 1;
        return (PyObject *)self;
    case Z_MEM_ERROR:
        Py_DECREF(self);
        PyErr_SetString(PyExc_MemoryError,
                        "Can't allocate memory for compression object");
        return NULL;
    case Z_STREAM_ERROR:
        Py_DECREF(self);
        PyErr_SetString(PyExc_ValueError, "Invalid initialization option");
        return NULL;
    default:
        /* read self->zst for the message before the object is released */
        zlib_error(self->zst, err, "while creating compression object");
        Py_DECREF(self);
        return NULL;
    }
}
/* zlib.decompressobj([wbits]): create a zlib.Decompress object.

   wbits is handed to inflateInit2() unchanged.  Returns the new object, or
   NULL with ValueError, MemoryError or zlib.error set. */
static PyObject *
PyZlib_decompressobj(PyObject *selfptr, PyObject *args)
{
    int wbits=DEF_WBITS, err;
    compobject *self;

    if (!PyArg_ParseTuple(args, "|i:decompressobj", &wbits))
        return NULL;

    self = newcompobject(&Decomptype);
    if (self == NULL)
        return NULL;

    /* zlib requires zalloc, zfree, opaque, next_in and avail_in to be set
       before inflateInit2() */
    self->zst.zalloc = (alloc_func)NULL;
    self->zst.zfree = (free_func)Z_NULL;
    self->zst.opaque = Z_NULL;
    self->zst.next_in = NULL;
    self->zst.avail_in = 0;

    err = inflateInit2(&self->zst, wbits);
    switch (err) {
    case Z_OK:
        /* from now on the deallocator has to call inflateEnd() */
        self->is_initialised = 1;
        return (PyObject *)self;
    case Z_STREAM_ERROR:
        Py_DECREF(self);
        PyErr_SetString(PyExc_ValueError, "Invalid initialization option");
        return NULL;
    case Z_MEM_ERROR:
        Py_DECREF(self);
        PyErr_SetString(PyExc_MemoryError,
                        "Can't allocate memory for decompression object");
        return NULL;
    default:
        /* read self->zst for the message before the object is released */
        zlib_error(self->zst, err, "while creating decompression object");
        Py_DECREF(self);
        return NULL;
    }
}
static void
2000-07-10 06:57:19 -03:00
Comp_dealloc(compobject *self)
1997-04-29 12:38:09 -03:00
{
if (self->is_initialised)
deflateEnd(&self->zst);
Py_XDECREF(self->unused_data);
Py_XDECREF(self->unconsumed_tail);
PyObject_Del(self);
1997-04-29 12:38:09 -03:00
}
static void
2000-07-10 06:57:19 -03:00
Decomp_dealloc(compobject *self)
1997-04-29 12:38:09 -03:00
{
if (self->is_initialised)
inflateEnd(&self->zst);
Py_XDECREF(self->unused_data);
Py_XDECREF(self->unconsumed_tail);
PyObject_Del(self);
1997-04-29 12:38:09 -03:00
}
2002-06-13 17:33:02 -03:00
PyDoc_STRVAR(comp_compress__doc__,
"compress(data) -- Return a string containing data compressed.\n"
"\n"
1997-06-03 19:21:03 -03:00
"After calling this function, some of the input data may still\n"
"be stored in internal buffers for later processing.\n"
2002-06-13 17:33:02 -03:00
"Call the flush() method to clear these buffers.");
1997-06-03 19:21:03 -03:00
1997-04-29 12:38:09 -03:00
static PyObject *
2000-07-10 06:57:19 -03:00
PyZlib_objcompress(compobject *self, PyObject *args)
1997-04-29 12:38:09 -03:00
{
PyObject *RetVal = NULL;
Py_ssize_t ibuflen, obuflen = DEFAULTALLOC;
int err;
if (!PyArg_ParseTuple(args, "s#:compress", &self->zst.next_in, &ibuflen))
return NULL;
ENTER_ZLIB
do {
arrange_input_buffer(&self->zst, &ibuflen);
do {
obuflen = arrange_output_buffer(&self->zst, &RetVal, obuflen);
if (obuflen < 0)
goto error;
Py_BEGIN_ALLOW_THREADS
err = deflate(&self->zst, Z_NO_FLUSH);
Py_END_ALLOW_THREADS
if (err == Z_STREAM_ERROR) {
zlib_error(self->zst, err, "while compressing data");
goto error;
}
} while (self->zst.avail_out == 0);
assert(self->zst.avail_in == 0);
} while (ibuflen != 0);
_PyString_Resize(&RetVal, self->zst.next_out -
(Byte *)PyBytes_AS_STRING(RetVal));
goto success;
error:
Py_CLEAR(RetVal);
success:
LEAVE_ZLIB
return RetVal;
1997-04-29 12:38:09 -03:00
}
/* Helper for objdecompress() and unflush().  Records the part of the input
   that inflate() did not use in self->unused_data or self->unconsumed_tail,
   as appropriate.

   `input` and `inplen` describe the whole buffer that was handed to
   inflate(); `err` is the last inflate() result.  Returns 0 on success and
   -1 with an exception set on failure. */
static int
save_unconsumed_input(compobject *self, Byte *input, Py_ssize_t inplen,
                      int err)
{
    if (err == Z_STREAM_END && self->zst.avail_in > 0) {
        /* The end of the compressed data has been reached.  Append the
           leftover input to self->unused_data. */
        Py_ssize_t have = PyString_GET_SIZE(self->unused_data);
        Py_ssize_t extra = input + inplen - self->zst.next_in;
        PyObject *joined;

        /* the combined size must still fit in a Py_ssize_t */
        if (extra > (PY_SSIZE_T_MAX - have)) {
            PyErr_NoMemory();
            return -1;
        }
        joined = PyString_FromStringAndSize(NULL, have + extra);
        if (joined == NULL)
            return -1;
        Py_MEMCPY(PyString_AS_STRING(joined),
                  PyString_AS_STRING(self->unused_data), have);
        Py_MEMCPY(PyString_AS_STRING(joined) + have,
                  self->zst.next_in, extra);
        Py_SETREF(self->unused_data, joined);
        self->zst.avail_in = 0;
    }

    if (self->zst.avail_in > 0 || PyString_GET_SIZE(self->unconsumed_tail)) {
        /* This code handles two distinct cases:
           1. Output limit was reached. Save leftover input in unconsumed_tail.
           2. All input data was consumed. Clear unconsumed_tail. */
        Py_ssize_t remaining = input + inplen - self->zst.next_in;
        PyObject *tail = PyString_FromStringAndSize(
            (char *)self->zst.next_in, remaining);

        if (tail == NULL)
            return -1;
        Py_SETREF(self->unconsumed_tail, tail);
    }

    return 0;
}
2002-06-13 17:33:02 -03:00
PyDoc_STRVAR(decomp_decompress__doc__,
"decompress(data, max_length) -- Return a string containing the decompressed\n"
"version of the data.\n"
"\n"
"After calling this function, some of the input data may still be stored in\n"
"internal buffers for later processing.\n"
"Call the flush() method to clear these buffers.\n"
"If the max_length parameter is specified then the return value will be\n"
"no longer than max_length. Unconsumed input data will be stored in\n"
2002-06-13 17:33:02 -03:00
"the unconsumed_tail attribute.");
1997-06-03 19:21:03 -03:00
1997-04-29 12:38:09 -03:00
static PyObject *
2000-07-10 06:57:19 -03:00
PyZlib_objdecompress(compobject *self, PyObject *args)
1997-04-29 12:38:09 -03:00
{
int err = Z_OK;
Py_ssize_t inplen, max_length = 0;
Py_ssize_t ibuflen, obuflen = DEFAULTALLOC, hard_limit;
PyObject *RetVal = NULL;
Byte *input;
if (!PyArg_ParseTuple(args, "s#|n:decompress", &input,
&inplen, &max_length))
return NULL;
if (max_length < 0) {
PyErr_SetString(PyExc_ValueError,
"max_length must be greater than zero");
return NULL;
} else if (max_length == 0)
hard_limit = PY_SSIZE_T_MAX;
else
hard_limit = max_length;
self->zst.next_in = input;
ibuflen = inplen;
/* limit amount of data allocated to max_length */
if (max_length && obuflen > max_length)
obuflen = max_length;
ENTER_ZLIB
do {
arrange_input_buffer(&self->zst, &ibuflen);
do {
obuflen = arrange_output_buffer_with_maximum(&self->zst, &RetVal,
obuflen, hard_limit);
if (obuflen == -2) {
if (max_length > 0) {
goto save;
}
PyErr_NoMemory();
}
if (obuflen < 0) {
goto abort;
}
Py_BEGIN_ALLOW_THREADS
err = inflate(&self->zst, Z_SYNC_FLUSH);
Py_END_ALLOW_THREADS
switch (err) {
case Z_OK: /* fall through */
case Z_BUF_ERROR: /* fall through */
case Z_STREAM_END:
break;
default:
goto save;
}
} while (self->zst.avail_out == 0);
} while (err != Z_STREAM_END && ibuflen != 0);
save:
if (save_unconsumed_input(self, input, inplen, err) < 0)
goto abort;
/* This is the logical place to call inflateEnd, but the old behaviour of
only calling it on flush() is preserved. */
if (err != Z_STREAM_END && err != Z_OK && err != Z_BUF_ERROR) {
/* We will only get Z_BUF_ERROR if the output buffer was full
but there wasn't more output when we tried again, so it is
not an error condition.
*/
zlib_error(self->zst, err, "while decompressing");
goto abort;
1997-04-29 12:38:09 -03:00
}
_PyString_Resize(&RetVal, self->zst.next_out -
(Byte *)PyBytes_AS_STRING(RetVal));
goto success;
abort:
Py_CLEAR(RetVal);
success:
LEAVE_ZLIB
return RetVal;
1997-04-29 12:38:09 -03:00
}
2002-06-13 17:33:02 -03:00
PyDoc_STRVAR(comp_flush__doc__,
"flush( [mode] ) -- Return a string containing any remaining compressed data.\n"
"\n"
"mode can be one of the constants Z_SYNC_FLUSH, Z_FULL_FLUSH, Z_FINISH; the\n"
"default value used when mode is not specified is Z_FINISH.\n"
"If mode == Z_FINISH, the compressor object can no longer be used after\n"
2002-06-13 17:33:02 -03:00
"calling the flush() method. Otherwise, more data can still be compressed.");
1997-06-03 19:21:03 -03:00
1997-04-29 12:38:09 -03:00
static PyObject *
2000-07-10 06:57:19 -03:00
PyZlib_flush(compobject *self, PyObject *args)
1997-04-29 12:38:09 -03:00
{
int err;
Py_ssize_t length = DEFAULTALLOC;
PyObject *RetVal = NULL;
int flushmode = Z_FINISH;
if (!PyArg_ParseTuple(args, "|i:flush", &flushmode))
return NULL;
/* Flushing with Z_NO_FLUSH is a no-op, so there's no point in
doing any work at all; just return an empty string. */
if (flushmode == Z_NO_FLUSH) {
return PyString_FromStringAndSize(NULL, 0);
}
ENTER_ZLIB
2001-10-17 00:57:20 -03:00
self->zst.avail_in = 0;
do {
length = arrange_output_buffer(&self->zst, &RetVal, length);
if (length < 0) {
Py_CLEAR(RetVal);
goto error;
}
Py_BEGIN_ALLOW_THREADS
err = deflate(&self->zst, flushmode);
Py_END_ALLOW_THREADS
if (err == Z_STREAM_ERROR) {
zlib_error(self->zst, err, "while flushing");
Py_CLEAR(RetVal);
goto error;
}
} while (self->zst.avail_out == 0);
assert(self->zst.avail_in == 0);
/* If flushmode is Z_FINISH, we also have to call deflateEnd() to free
2001-10-17 00:57:20 -03:00
various data structures. Note we should only get Z_STREAM_END when
flushmode is Z_FINISH, but checking both for safety*/
if (err == Z_STREAM_END && flushmode == Z_FINISH) {
err = deflateEnd(&self->zst);
if (err != Z_OK) {
zlib_error(self->zst, err, "from deflateEnd()");
Py_CLEAR(RetVal);
goto error;
}
else
self->is_initialised = 0;
/* We will only get Z_BUF_ERROR if the output buffer was full
but there wasn't more output when we tried again, so it is
not an error condition.
*/
} else if (err != Z_OK && err != Z_BUF_ERROR) {
zlib_error(self->zst, err, "while flushing");
Py_CLEAR(RetVal);
goto error;
}
2001-10-17 00:57:20 -03:00
_PyString_Resize(&RetVal, self->zst.next_out -
(Byte *)PyBytes_AS_STRING(RetVal));
2001-10-17 00:57:20 -03:00
error:
LEAVE_ZLIB
return RetVal;
1997-04-29 12:38:09 -03:00
}
#ifdef HAVE_ZLIB_COPY
PyDoc_STRVAR(comp_copy__doc__,
"copy() -- Return a copy of the compression object.");

/* Compress.copy(): create a second compressor whose stream state is a
   duplicate of this one's (via deflateCopy()) and which shares this
   object's unused_data and unconsumed_tail strings.

   Returns the new object, or NULL with ValueError, MemoryError or
   zlib.error set. */
static PyObject *
PyZlib_copy(compobject *self)
{
    compobject *clone;
    int status;

    clone = newcompobject(&Comptype);
    if (clone == NULL)
        return NULL;

    /* The stream state is copied under ENTER_ZLIB / LEAVE_ZLIB so that no
       other thread changes it half-way through. */
    ENTER_ZLIB
    status = deflateCopy(&clone->zst, &self->zst);
    if (status != Z_OK) {
        if (status == Z_STREAM_ERROR)
            PyErr_SetString(PyExc_ValueError, "Inconsistent stream state");
        else if (status == Z_MEM_ERROR)
            PyErr_SetString(PyExc_MemoryError,
                            "Can't allocate memory for compression object");
        else
            zlib_error(self->zst, status, "while copying compression object");
        LEAVE_ZLIB
        /* the clone was never marked initialised, so its deallocator will
           not try to end a stream */
        Py_DECREF(clone);
        return NULL;
    }

    /* replace the clone's empty strings with new references to ours */
    Py_INCREF(self->unused_data);
    Py_XSETREF(clone->unused_data, self->unused_data);
    Py_INCREF(self->unconsumed_tail);
    Py_XSETREF(clone->unconsumed_tail, self->unconsumed_tail);

    /* Mark it as being initialized */
    clone->is_initialised = 1;

    LEAVE_ZLIB
    return (PyObject *)clone;
}
PyDoc_STRVAR(decomp_copy__doc__,
"copy() -- Return a copy of the decompression object.");

/* Decompress.copy(): create a second decompressor whose stream state is a
   duplicate of this one's (via inflateCopy()) and which shares this
   object's unused_data and unconsumed_tail strings.

   Returns the new object, or NULL with ValueError, MemoryError or
   zlib.error set. */
static PyObject *
PyZlib_uncopy(compobject *self)
{
    compobject *clone;
    int status;

    clone = newcompobject(&Decomptype);
    if (clone == NULL)
        return NULL;

    /* The stream state is copied under ENTER_ZLIB / LEAVE_ZLIB so that no
       other thread changes it half-way through. */
    ENTER_ZLIB
    status = inflateCopy(&clone->zst, &self->zst);
    if (status != Z_OK) {
        if (status == Z_STREAM_ERROR)
            PyErr_SetString(PyExc_ValueError, "Inconsistent stream state");
        else if (status == Z_MEM_ERROR)
            PyErr_SetString(PyExc_MemoryError,
                            "Can't allocate memory for decompression object");
        else
            zlib_error(self->zst, status,
                       "while copying decompression object");
        LEAVE_ZLIB
        /* the clone was never marked initialised, so its deallocator will
           not try to end a stream */
        Py_DECREF(clone);
        return NULL;
    }

    /* replace the clone's empty strings with new references to ours */
    Py_INCREF(self->unused_data);
    Py_XSETREF(clone->unused_data, self->unused_data);
    Py_INCREF(self->unconsumed_tail);
    Py_XSETREF(clone->unconsumed_tail, self->unconsumed_tail);

    /* Mark it as being initialized */
    clone->is_initialised = 1;

    LEAVE_ZLIB
    return (PyObject *)clone;
}
#endif
2002-06-13 17:33:02 -03:00
PyDoc_STRVAR(decomp_flush__doc__,
"flush( [length] ) -- Return a string containing any remaining\n"
"decompressed data. length, if given, is the initial size of the\n"
"output buffer.\n"
"\n"
2002-06-13 17:33:02 -03:00
"The decompressor object can no longer be used after this call.");
1997-06-03 19:21:03 -03:00
1997-04-29 12:38:09 -03:00
static PyObject *
2000-07-10 06:57:19 -03:00
PyZlib_unflush(compobject *self, PyObject *args)
1997-04-29 12:38:09 -03:00
{
Py_ssize_t length = DEFAULTALLOC;
int err, flush;
PyObject *RetVal = NULL;
Py_ssize_t ibuflen;
2001-10-17 00:57:20 -03:00
if (!PyArg_ParseTuple(args, "|n:flush", &length))
return NULL;
if (length <= 0) {
PyErr_SetString(PyExc_ValueError, "length must be greater than zero");
return NULL;
}
ENTER_ZLIB
self->zst.next_in = (Byte *)PyString_AS_STRING(self->unconsumed_tail);
ibuflen = PyString_GET_SIZE(self->unconsumed_tail);
do {
arrange_input_buffer(&self->zst, &ibuflen);
flush = ibuflen == 0 ? Z_FINISH : Z_NO_FLUSH;
do {
length = arrange_output_buffer(&self->zst, &RetVal, length);
if (length < 0)
goto abort;
Py_BEGIN_ALLOW_THREADS
err = inflate(&self->zst, flush);
Py_END_ALLOW_THREADS
switch (err) {
case Z_OK: /* fall through */
case Z_BUF_ERROR: /* fall through */
case Z_STREAM_END:
break;
default:
goto save;
}
} while (self->zst.avail_out == 0);
} while (err != Z_STREAM_END && ibuflen != 0);
save:
if (save_unconsumed_input(self,
(Byte *)PyString_AS_STRING(self->unconsumed_tail),
PyString_GET_SIZE(self->unconsumed_tail), err) < 0)
goto abort;
/* If flushmode is Z_FINISH, we also have to call deflateEnd() to free
various data structures. Note we should only get Z_STREAM_END when
flushmode is Z_FINISH */
if (err == Z_STREAM_END) {
err = inflateEnd(&self->zst);
self->is_initialised = 0;
if (err != Z_OK) {
zlib_error(self->zst, err, "from inflateEnd()");
goto abort;
}
}
_PyString_Resize(&RetVal, self->zst.next_out -
(Byte *)PyBytes_AS_STRING(RetVal));
goto success;
abort:
Py_CLEAR(RetVal);
success:
LEAVE_ZLIB
return RetVal;
1997-04-29 12:38:09 -03:00
}
static PyMethodDef comp_methods[] =
{
2001-10-17 00:57:20 -03:00
{"compress", (binaryfunc)PyZlib_objcompress, METH_VARARGS,
comp_compress__doc__},
2001-10-17 00:57:20 -03:00
{"flush", (binaryfunc)PyZlib_flush, METH_VARARGS,
comp_flush__doc__},
#ifdef HAVE_ZLIB_COPY
{"copy", (PyCFunction)PyZlib_copy, METH_NOARGS,
comp_copy__doc__},
#endif
{NULL, NULL}
1997-04-29 12:38:09 -03:00
};
static PyMethodDef Decomp_methods[] =
{
2001-10-17 00:57:20 -03:00
{"decompress", (binaryfunc)PyZlib_objdecompress, METH_VARARGS,
decomp_decompress__doc__},
2001-10-17 00:57:20 -03:00
{"flush", (binaryfunc)PyZlib_unflush, METH_VARARGS,
decomp_flush__doc__},
#ifdef HAVE_ZLIB_COPY
{"copy", (PyCFunction)PyZlib_uncopy, METH_NOARGS,
decomp_copy__doc__},
#endif
{NULL, NULL}
1997-04-29 12:38:09 -03:00
};
static PyObject *
2000-07-10 06:57:19 -03:00
Comp_getattr(compobject *self, char *name)
1997-04-29 12:38:09 -03:00
{
/* No ENTER/LEAVE_ZLIB is necessary because this fn doesn't touch
internal data. */
return Py_FindMethod(comp_methods, (PyObject *)self, name);
1997-04-29 12:38:09 -03:00
}
static PyObject *
2000-07-10 06:57:19 -03:00
Decomp_getattr(compobject *self, char *name)
1997-04-29 12:38:09 -03:00
{
PyObject * retval;
ENTER_ZLIB
2001-10-17 00:57:20 -03:00
if (strcmp(name, "unused_data") == 0) {
Py_INCREF(self->unused_data);
retval = self->unused_data;
2001-10-17 00:57:20 -03:00
} else if (strcmp(name, "unconsumed_tail") == 0) {
Py_INCREF(self->unconsumed_tail);
retval = self->unconsumed_tail;
2001-10-17 00:57:20 -03:00
} else
retval = Py_FindMethod(Decomp_methods, (PyObject *)self, name);
LEAVE_ZLIB
return retval;
1997-04-29 12:38:09 -03:00
}
2002-06-13 17:33:02 -03:00
PyDoc_STRVAR(adler32__doc__,
"adler32(string[, start]) -- Compute an Adler-32 checksum of string.\n"
"\n"
"An optional starting value can be specified. The returned checksum is\n"
"a signed integer.");
1997-06-03 19:21:03 -03:00
1997-04-29 12:38:09 -03:00
static PyObject *
2000-07-10 06:57:19 -03:00
PyZlib_adler32(PyObject *self, PyObject *args)
1997-04-29 12:38:09 -03:00
{
unsigned int adler32val = 1; /* adler32(0L, Z_NULL, 0) */
Byte *buf;
Py_ssize_t len;
int signed_val;
2001-10-17 00:57:20 -03:00
if (!PyArg_ParseTuple(args, "s#|I:adler32", &buf, &len, &adler32val))
return NULL;
/* Avoid truncation of length for very large buffers. adler32() takes
length as an unsigned int, which may be narrower than Py_ssize_t. */
while ((size_t)len > UINT_MAX) {
adler32val = adler32(adler32val, buf, UINT_MAX);
buf += (size_t) UINT_MAX;
len -= (size_t) UINT_MAX;
}
/* In Python 2.x we return a signed integer regardless of native platform
* long size (the 32bit unsigned long is treated as 32-bit signed and sign
* extended into a 64-bit long inside the integer object). 3.0 does the
* right thing and returns unsigned. http://bugs.python.org/issue1202 */
signed_val = adler32(adler32val, buf, (unsigned int)len);
return PyInt_FromLong(signed_val);
1997-04-29 12:38:09 -03:00
}
2001-10-17 00:57:20 -03:00
2002-06-13 17:33:02 -03:00
PyDoc_STRVAR(crc32__doc__,
"crc32(string[, start]) -- Compute a CRC-32 checksum of string.\n"
"\n"
"An optional starting value can be specified. The returned checksum is\n"
"a signed integer.");
1997-04-29 12:38:09 -03:00
static PyObject *
2000-07-10 06:57:19 -03:00
PyZlib_crc32(PyObject *self, PyObject *args)
1997-04-29 12:38:09 -03:00
{
unsigned int crc32val = 0; /* crc32(0L, Z_NULL, 0) */
Byte *buf;
Py_ssize_t len;
int signed_val;
if (!PyArg_ParseTuple(args, "s#|I:crc32", &buf, &len, &crc32val))
return NULL;
/* Avoid truncation of length for very large buffers. crc32() takes
length as an unsigned int, which may be narrower than Py_ssize_t. */
while ((size_t)len > UINT_MAX) {
crc32val = crc32(crc32val, buf, UINT_MAX);
buf += (size_t) UINT_MAX;
len -= (size_t) UINT_MAX;
}
/* In Python 2.x we return a signed integer regardless of native platform
* long size (the 32bit unsigned long is treated as 32-bit signed and sign
* extended into a 64-bit long inside the integer object). 3.0 does the
* right thing and returns unsigned. http://bugs.python.org/issue1202 */
signed_val = crc32(crc32val, buf, (unsigned int)len);
return PyInt_FromLong(signed_val);
1997-04-29 12:38:09 -03:00
}
2001-10-17 00:57:20 -03:00
1997-04-29 12:38:09 -03:00
static PyMethodDef zlib_methods[] =
{
2001-10-17 00:57:20 -03:00
{"adler32", (PyCFunction)PyZlib_adler32, METH_VARARGS,
adler32__doc__},
2001-10-17 00:57:20 -03:00
{"compress", (PyCFunction)PyZlib_compress, METH_VARARGS,
compress__doc__},
2001-10-17 00:57:20 -03:00
{"compressobj", (PyCFunction)PyZlib_compressobj, METH_VARARGS,
compressobj__doc__},
2001-10-17 00:57:20 -03:00
{"crc32", (PyCFunction)PyZlib_crc32, METH_VARARGS,
crc32__doc__},
{"decompress", (PyCFunction)PyZlib_decompress, METH_VARARGS,
decompress__doc__},
2001-10-17 00:57:20 -03:00
{"decompressobj", (PyCFunction)PyZlib_decompressobj, METH_VARARGS,
decompressobj__doc__},
{NULL, NULL}
1997-04-29 12:38:09 -03:00
};
/* Type object for zlib.Compress.  Its ob_type is filled in by the module
   init function; the slots not listed here are left zero. */
static PyTypeObject Comptype = {
    PyVarObject_HEAD_INIT(0, 0)
    "zlib.Compress",                /*tp_name*/
    sizeof(compobject),             /*tp_basicsize*/
    0,                              /*tp_itemsize*/
    (destructor)Comp_dealloc,       /*tp_dealloc*/
    0,                              /*tp_print*/
    (getattrfunc)Comp_getattr,      /*tp_getattr*/
    0,                              /*tp_setattr*/
    0,                              /*tp_compare*/
    0,                              /*tp_repr*/
    0,                              /*tp_as_number*/
    0,                              /*tp_as_sequence*/
    0,                              /*tp_as_mapping*/
};
/* Type object for zlib.Decompress.  Its ob_type is filled in by the module
   init function; the slots not listed here are left zero. */
static PyTypeObject Decomptype = {
    PyVarObject_HEAD_INIT(0, 0)
    "zlib.Decompress",              /*tp_name*/
    sizeof(compobject),             /*tp_basicsize*/
    0,                              /*tp_itemsize*/
    (destructor)Decomp_dealloc,     /*tp_dealloc*/
    0,                              /*tp_print*/
    (getattrfunc)Decomp_getattr,    /*tp_getattr*/
    0,                              /*tp_setattr*/
    0,                              /*tp_compare*/
    0,                              /*tp_repr*/
    0,                              /*tp_as_number*/
    0,                              /*tp_as_sequence*/
    0,                              /*tp_as_mapping*/
};
2002-06-13 17:33:02 -03:00
/* Docstring of the zlib module itself. */
PyDoc_STRVAR(zlib_module_documentation,
"The functions in this module allow compression and decompression using the\n"
"zlib library, which is based on GNU zip.\n"
"\n"
"adler32(string[, start]) -- Compute an Adler-32 checksum.\n"
"compress(string[, level]) -- Compress string, with compression level in 0-9.\n"
"compressobj([level]) -- Return a compressor object.\n"
"crc32(string[, start]) -- Compute a CRC-32 checksum.\n"
"decompress(string,[wbits],[bufsize]) -- Decompresses a compressed string.\n"
"decompressobj([wbits]) -- Return a decompressor object.\n"
"\n"
"'wbits' is window buffer size and container format.\n"
"Compressor objects support compress() and flush() methods; decompressor\n"
"objects support decompress() and flush().");
1997-06-03 19:21:03 -03:00
PyMODINIT_FUNC
PyInit_zlib(void)
1997-04-29 12:38:09 -03:00
{
PyObject *m, *ver;
Py_TYPE(&Comptype) = &PyType_Type;
Py_TYPE(&Decomptype) = &PyType_Type;
m = Py_InitModule4("zlib", zlib_methods,
zlib_module_documentation,
(PyObject*)NULL,PYTHON_API_VERSION);
if (m == NULL)
return;
ZlibError = PyErr_NewException("zlib.error", NULL, NULL);
if (ZlibError != NULL) {
Py_INCREF(ZlibError);
PyModule_AddObject(m, "error", ZlibError);
}
PyModule_AddIntConstant(m, "MAX_WBITS", MAX_WBITS);
PyModule_AddIntConstant(m, "DEFLATED", DEFLATED);
PyModule_AddIntConstant(m, "DEF_MEM_LEVEL", DEF_MEM_LEVEL);
PyModule_AddIntConstant(m, "Z_BEST_SPEED", Z_BEST_SPEED);
PyModule_AddIntConstant(m, "Z_BEST_COMPRESSION", Z_BEST_COMPRESSION);
PyModule_AddIntConstant(m, "Z_DEFAULT_COMPRESSION", Z_DEFAULT_COMPRESSION);
PyModule_AddIntConstant(m, "Z_FILTERED", Z_FILTERED);
PyModule_AddIntConstant(m, "Z_HUFFMAN_ONLY", Z_HUFFMAN_ONLY);
PyModule_AddIntConstant(m, "Z_DEFAULT_STRATEGY", Z_DEFAULT_STRATEGY);
2001-10-17 00:57:20 -03:00
PyModule_AddIntConstant(m, "Z_FINISH", Z_FINISH);
PyModule_AddIntConstant(m, "Z_NO_FLUSH", Z_NO_FLUSH);
PyModule_AddIntConstant(m, "Z_SYNC_FLUSH", Z_SYNC_FLUSH);
PyModule_AddIntConstant(m, "Z_FULL_FLUSH", Z_FULL_FLUSH);
2001-10-17 00:57:20 -03:00
ver = PyString_FromString(ZLIB_VERSION);
if (ver != NULL)
PyModule_AddObject(m, "ZLIB_VERSION", ver);
PyModule_AddStringConstant(m, "__version__", "1.0");
#ifdef WITH_THREAD
zlib_lock = PyThread_allocate_lock();
#endif /* WITH_THREAD */
1997-04-29 12:38:09 -03:00
}