/* * multibytecodec.h: Common Multibyte Codec Implementation * * Written by Hye-Shik Chang */ #ifndef _PYTHON_MULTIBYTECODEC_H_ #define _PYTHON_MULTIBYTECODEC_H_ #ifdef __cplusplus extern "C" { #endif #include "pycore_unicodeobject.h" // _PyUnicodeWriter #ifdef uint16_t typedef uint16_t ucs2_t, DBCHAR; #else typedef unsigned short ucs2_t, DBCHAR; #endif /* * A struct that provides 8 bytes of state for multibyte * codecs. Codecs are free to use this how they want. Note: if you * need to add a new field to this struct, ensure that its byte order * is independent of CPU endianness so that the return value of * getstate doesn't differ between little and big endian CPUs. */ typedef struct { unsigned char c[8]; } MultibyteCodec_State; struct _cjk_mod_state; struct _multibyte_codec; typedef int (*mbcodec_init)(const struct _multibyte_codec *codec); typedef Py_ssize_t (*mbencode_func)(MultibyteCodec_State *state, const struct _multibyte_codec *codec, int kind, const void *data, Py_ssize_t *inpos, Py_ssize_t inlen, unsigned char **outbuf, Py_ssize_t outleft, int flags); typedef int (*mbencodeinit_func)(MultibyteCodec_State *state, const struct _multibyte_codec *codec); typedef Py_ssize_t (*mbencodereset_func)(MultibyteCodec_State *state, const struct _multibyte_codec *codec, unsigned char **outbuf, Py_ssize_t outleft); typedef Py_ssize_t (*mbdecode_func)(MultibyteCodec_State *state, const struct _multibyte_codec *codec, const unsigned char **inbuf, Py_ssize_t inleft, _PyUnicodeWriter *writer); typedef int (*mbdecodeinit_func)(MultibyteCodec_State *state, const struct _multibyte_codec *codec); typedef Py_ssize_t (*mbdecodereset_func)(MultibyteCodec_State *state, const struct _multibyte_codec *codec); typedef struct _multibyte_codec { const char *encoding; const void *config; mbcodec_init codecinit; mbencode_func encode; mbencodeinit_func encinit; mbencodereset_func encreset; mbdecode_func decode; mbdecodeinit_func decinit; mbdecodereset_func decreset; struct _cjk_mod_state *modstate; } MultibyteCodec; typedef struct { PyObject_HEAD const MultibyteCodec *codec; PyObject *cjk_module; } MultibyteCodecObject; #define MultibyteCodec_Check(state, op) Py_IS_TYPE((op), state->multibytecodec_type) #define _MultibyteStatefulCodec_HEAD \ PyObject_HEAD \ const MultibyteCodec *codec; \ MultibyteCodec_State state; \ PyObject *errors; typedef struct { _MultibyteStatefulCodec_HEAD } MultibyteStatefulCodecContext; #define MAXENCPENDING 2 #define _MultibyteStatefulEncoder_HEAD \ _MultibyteStatefulCodec_HEAD \ PyObject *pending; typedef struct { _MultibyteStatefulEncoder_HEAD } MultibyteStatefulEncoderContext; #define MAXDECPENDING 8 #define _MultibyteStatefulDecoder_HEAD \ _MultibyteStatefulCodec_HEAD \ unsigned char pending[MAXDECPENDING]; \ Py_ssize_t pendingsize; typedef struct { _MultibyteStatefulDecoder_HEAD } MultibyteStatefulDecoderContext; typedef struct { _MultibyteStatefulEncoder_HEAD } MultibyteIncrementalEncoderObject; typedef struct { _MultibyteStatefulDecoder_HEAD } MultibyteIncrementalDecoderObject; typedef struct { _MultibyteStatefulDecoder_HEAD PyObject *stream; } MultibyteStreamReaderObject; typedef struct { _MultibyteStatefulEncoder_HEAD PyObject *stream; } MultibyteStreamWriterObject; /* positive values for illegal sequences */ #define MBERR_TOOSMALL (-1) /* insufficient output buffer space */ #define MBERR_TOOFEW (-2) /* incomplete input buffer */ #define MBERR_INTERNAL (-3) /* internal runtime error */ #define MBERR_EXCEPTION (-4) /* an exception has been raised */ #define ERROR_STRICT (PyObject *)(1) #define ERROR_IGNORE (PyObject *)(2) #define ERROR_REPLACE (PyObject *)(3) #define ERROR_ISCUSTOM(p) ((p) < ERROR_STRICT || ERROR_REPLACE < (p)) #define ERROR_DECREF(p) \ do { \ if (p != NULL && ERROR_ISCUSTOM(p)) \ Py_DECREF(p); \ } while (0); #define MBENC_FLUSH 0x0001 /* encode all characters encodable */ #define MBENC_MAX MBENC_FLUSH typedef struct { const MultibyteCodec *codec; PyObject *cjk_module; } codec_capsule; #define MAP_CAPSULE "multibytecodec.map" #define CODEC_CAPSULE "multibytecodec.codec" #ifdef __cplusplus } #endif #endif