/* ------------------------------------------------------------------------ unicodedata -- Provides access to the Unicode 3.0 data base. Data was extracted from the Unicode 3.0 UnicodeData.txt file. Written by Marc-Andre Lemburg (mal@lemburg.com). (c) Copyright CNRI, All Rights Reserved. NO WARRANTY. ------------------------------------------------------------------------ */ #include "Python.h" #include "unicodedatabase.h" /* --- Helpers ------------------------------------------------------------ */ static const _PyUnicode_DatabaseRecord *unicode_db(register int i) { register int page = i >> 12; if (page < sizeof(_PyUnicode_Database)) return &_PyUnicode_Database[page][i & 0x0fff]; return &_PyUnicode_Database[0][0]; } /* --- Module API --------------------------------------------------------- */ static PyObject * unicodedata_decimal(PyObject *self, PyObject *args) { PyUnicodeObject *v; PyObject *defobj = NULL; long rc; if (!PyArg_ParseTuple(args, "O!|O:decimal", &PyUnicode_Type, &v, &defobj)) goto onError; if (PyUnicode_GET_SIZE(v) != 1) { PyErr_SetString(PyExc_TypeError, "need a single Unicode character as parameter"); goto onError; } rc = Py_UNICODE_TODECIMAL(*PyUnicode_AS_UNICODE(v)); if (rc < 0) { if (defobj == NULL) { PyErr_SetString(PyExc_ValueError, "not a decimal"); goto onError; } else { Py_INCREF(defobj); return defobj; } } return PyInt_FromLong(rc); onError: return NULL; } static PyObject * unicodedata_digit(PyObject *self, PyObject *args) { PyUnicodeObject *v; PyObject *defobj = NULL; long rc; if (!PyArg_ParseTuple(args, "O!|O:digit", &PyUnicode_Type, &v, &defobj)) goto onError; if (PyUnicode_GET_SIZE(v) != 1) { PyErr_SetString(PyExc_TypeError, "need a single Unicode character as parameter"); goto onError; } rc = Py_UNICODE_TODIGIT(*PyUnicode_AS_UNICODE(v)); if (rc < 0) { if (defobj == NULL) { PyErr_SetString(PyExc_ValueError, "not a digit"); goto onError; } else { Py_INCREF(defobj); return defobj; } } return PyInt_FromLong(rc); onError: return NULL; } static PyObject * unicodedata_numeric(PyObject *self, PyObject *args) { PyUnicodeObject *v; PyObject *defobj = NULL; double rc; if (!PyArg_ParseTuple(args, "O!|O:numeric", &PyUnicode_Type, &v, &defobj)) goto onError; if (PyUnicode_GET_SIZE(v) != 1) { PyErr_SetString(PyExc_TypeError, "need a single Unicode character as parameter"); goto onError; } rc = Py_UNICODE_TONUMERIC(*PyUnicode_AS_UNICODE(v)); if (rc < 0) { if (defobj == NULL) { PyErr_SetString(PyExc_ValueError, "not a numeric character"); goto onError; } else { Py_INCREF(defobj); return defobj; } } return PyFloat_FromDouble(rc); onError: return NULL; } static PyObject * unicodedata_category(PyObject *self, PyObject *args) { PyUnicodeObject *v; int index; if (!PyArg_ParseTuple(args, "O!:category", &PyUnicode_Type, &v)) goto onError; if (PyUnicode_GET_SIZE(v) != 1) { PyErr_SetString(PyExc_TypeError, "need a single Unicode character as parameter"); goto onError; } index = (int)unicode_db((int)*PyUnicode_AS_UNICODE(v))->category; if (index < 0 || index > sizeof(_PyUnicode_CategoryNames) / sizeof(_PyUnicode_CategoryNames[0])) { PyErr_Format(PyExc_SystemError, "category index out of range: %i", index); goto onError; } return PyString_FromString(_PyUnicode_CategoryNames[index]); onError: return NULL; } static PyObject * unicodedata_bidirectional(PyObject *self, PyObject *args) { PyUnicodeObject *v; int index; if (!PyArg_ParseTuple(args, "O!:bidirectional", &PyUnicode_Type, &v)) goto onError; if (PyUnicode_GET_SIZE(v) != 1) { PyErr_SetString(PyExc_TypeError, "need a single Unicode character as parameter"); goto onError; } index = (int)unicode_db((int)*PyUnicode_AS_UNICODE(v))->bidirectional; if (index < 0 || index > sizeof(_PyUnicode_CategoryNames) / sizeof(_PyUnicode_CategoryNames[0])) { PyErr_Format(PyExc_SystemError, "bidirectional index out of range: %i", index); goto onError; } return PyString_FromString(_PyUnicode_BidirectionalNames[index]); onError: return NULL; } static PyObject * unicodedata_combining(PyObject *self, PyObject *args) { PyUnicodeObject *v; int value; if (!PyArg_ParseTuple(args, "O!:combining", &PyUnicode_Type, &v)) goto onError; if (PyUnicode_GET_SIZE(v) != 1) { PyErr_SetString(PyExc_TypeError, "need a single Unicode character as parameter"); goto onError; } value = (int)unicode_db((int)*PyUnicode_AS_UNICODE(v))->combining; return PyInt_FromLong(value); onError: return NULL; } static PyObject * unicodedata_mirrored(PyObject *self, PyObject *args) { PyUnicodeObject *v; int value; if (!PyArg_ParseTuple(args, "O!:mirrored", &PyUnicode_Type, &v)) goto onError; if (PyUnicode_GET_SIZE(v) != 1) { PyErr_SetString(PyExc_TypeError, "need a single Unicode character as parameter"); goto onError; } value = (int)unicode_db((int)*PyUnicode_AS_UNICODE(v))->mirrored; return PyInt_FromLong(value); onError: return NULL; } static PyObject * unicodedata_decomposition(PyObject *self, PyObject *args) { PyUnicodeObject *v; const char *value; if (!PyArg_ParseTuple(args, "O!:decomposition", &PyUnicode_Type, &v)) goto onError; if (PyUnicode_GET_SIZE(v) != 1) { PyErr_SetString(PyExc_TypeError, "need a single Unicode character as parameter"); goto onError; } value = unicode_db((int)*PyUnicode_AS_UNICODE(v))->decomposition; if (value == NULL) return PyString_FromString(""); else return PyString_FromString(value); onError: return NULL; } /* XXX Add doc strings. */ static PyMethodDef unicodedata_functions[] = { {"decimal", unicodedata_decimal, 1}, {"digit", unicodedata_digit, 1}, {"numeric", unicodedata_numeric, 1}, {"category", unicodedata_category, 1}, {"bidirectional", unicodedata_bidirectional, 1}, {"combining", unicodedata_combining, 1}, {"mirrored", unicodedata_mirrored, 1}, {"decomposition", unicodedata_decomposition, 1}, {NULL, NULL} /* sentinel */ }; DL_EXPORT(void) initunicodedata() { Py_InitModule("unicodedata", unicodedata_functions); }