summaryrefslogtreecommitdiffstats
path: root/Modules/ucnhash.c
diff options
context:
space:
mode:
authorFredrik Lundh <fredrik@pythonware.com>2001-01-19 09:45:02 (GMT)
committerFredrik Lundh <fredrik@pythonware.com>2001-01-19 09:45:02 (GMT)
commit0fdb90cafe596a03a5c3005a21e8fa2a230803e5 (patch)
treeb336a6167a1df4af3cf4ed184d68f7842dd19807 /Modules/ucnhash.c
parenta2bf2709b39b7848e4f887bc60289b64e2562f36 (diff)
downloadcpython-0fdb90cafe596a03a5c3005a21e8fa2a230803e5.zip
cpython-0fdb90cafe596a03a5c3005a21e8fa2a230803e5.tar.gz
cpython-0fdb90cafe596a03a5c3005a21e8fa2a230803e5.tar.bz2
refactored the unicodeobject/ucnhash interface, to hide the
implementation details inside the ucnhash module. also cleaned up the unicode copyright blurb a little; Secret Labs' internal revision history isn't that interesting...
Diffstat (limited to 'Modules/ucnhash.c')
-rw-r--r--Modules/ucnhash.c155
1 files changed, 74 insertions, 81 deletions
diff --git a/Modules/ucnhash.c b/Modules/ucnhash.c
index e5a9bad..67a8895 100644
--- a/Modules/ucnhash.c
+++ b/Modules/ucnhash.c
@@ -1,5 +1,13 @@
+#include "Python.h"
#include "ucnhash.h"
+/* Modified for Python 2.1 by Fredrik Lundh (fredrik@pythonware.com) */
+
+typedef struct {
+ const char* pszUCN;
+ Py_UCS4 value;
+}_Py_UnicodeCharacterName;
+
/*
* The hash is produced using the algorithm described in
* "Optimal algorithms for minimal perfect hashing",
@@ -14,11 +22,11 @@
* Generated on: Fri Jul 14 08:00:58 2000
*/
+#define cKeys 10538
#define k_cHashElements 18836
#define k_cchMaxKey 83
#define k_cKeys 10538
-
staticforward const unsigned short G[k_cHashElements];
staticforward const _Py_UnicodeCharacterName aucn[k_cKeys];
@@ -34,8 +42,7 @@ static long f1(const char *key, unsigned int cch)
while (--len >= 0)
{
/* (1000003 * x) ^ toupper(*(p++))
- * translated to handle > 32 bit longs
- */
+ * translated to handle > 32 bit longs */
x = (0xf4243 * x);
x = x & 0xFFFFFFFF;
x = x ^ toupper(*(p++));
@@ -98,110 +105,96 @@ static long f2(const char *key, unsigned int cch)
}
-static unsigned long hash(const char *key, unsigned int cch)
+static unsigned long
+hash(const char *key, unsigned int cch)
{
return ((unsigned long)(G[ f1(key, cch) ]) + (unsigned long)(G[ f2(key, cch) ]) ) % k_cHashElements;
}
-const void *getValue(unsigned long iKey)
+const _Py_UnicodeCharacterName *
+getValue(unsigned long iKey)
{
- return &aucn[iKey];
+ return (_Py_UnicodeCharacterName *) &aucn[iKey];
}
-/* Helper for adding objects to dictionaries. Check for errors with
- PyErr_Occurred() */
-static
-void insobj(PyObject *dict,
- char *name,
- PyObject *v)
+static int
+mystrnicmp(const char *s1, const char *s2, size_t count)
{
- PyDict_SetItemString(dict, name, v);
- Py_XDECREF(v);
+ char c1, c2;
+
+ if (count) {
+ do {
+ c1 = tolower(*(s1++));
+ c2 = tolower(*(s2++));
+ } while (--count && c1 == c2);
+ return c1 - c2;
+ }
+
+ return 0;
}
-static const _Py_UCNHashAPI hashAPI =
+/* bindings for the new API */
+
+static int
+ucnhash_getname(Py_UCS4 code, char* buffer, int buflen)
{
- k_cKeys,
- k_cchMaxKey,
- &hash,
- &getValue,
+ return 0;
+}
+
+static int
+ucnhash_getcode(const char* name, int namelen, Py_UCS4* code)
+{
+ unsigned long j;
+
+ j = hash(name, namelen);
+
+ if (j > cKeys || mystrnicmp(name, getValue(j)->pszUCN, namelen) != 0)
+ return 0;
+
+ *code = getValue(j)->value;
+
+ return 1;
+}
+
+static const _PyUnicode_Name_CAPI hashAPI =
+{
+ sizeof(_PyUnicode_Name_CAPI),
+ ucnhash_getname,
+ ucnhash_getcode
};
static
-PyMethodDef Module_methods[] =
+PyMethodDef ucnhash_methods[] =
{
{NULL, NULL},
};
-static char *Module_docstring = "ucnhash hash function module";
-
-/* Error reporting for module init functions */
-
-#define Py_ReportModuleInitError(modname) { \
- PyObject *exc_type, *exc_value, *exc_tb; \
- PyObject *str_type, *str_value; \
- \
- /* Fetch error objects and convert them to strings */ \
- PyErr_Fetch(&exc_type, &exc_value, &exc_tb); \
- if (exc_type && exc_value) { \
- str_type = PyObject_Str(exc_type); \
- str_value = PyObject_Str(exc_value); \
- } \
- else { \
- str_type = NULL; \
- str_value = NULL; \
- } \
- /* Try to format a more informative error message using the \
- original error */ \
- if (str_type && str_value && \
- PyString_Check(str_type) && PyString_Check(str_value)) \
- PyErr_Format( \
- PyExc_ImportError, \
- "initialization of module "modname" failed " \
- "(%s:%s)", \
- PyString_AS_STRING(str_type), \
- PyString_AS_STRING(str_value)); \
- else \
- PyErr_SetString( \
- PyExc_ImportError, \
- "initialization of module "modname" failed"); \
- Py_XDECREF(str_type); \
- Py_XDECREF(str_value); \
- Py_XDECREF(exc_type); \
- Py_XDECREF(exc_value); \
- Py_XDECREF(exc_tb); \
-}
+static char *ucnhash_docstring = "ucnhash hash function module";
/* Create PyMethodObjects and register them in the module's dict */
DL_EXPORT(void)
initucnhash(void)
{
- PyObject *module, *moddict;
- /* Create module */
- module = Py_InitModule4("ucnhash", /* Module name */
- Module_methods, /* Method list */
- Module_docstring, /* Module doc-string */
- (PyObject *)NULL, /* always pass this as *self */
- PYTHON_API_VERSION); /* API Version */
- if (module == NULL)
- goto onError;
- /* Add some constants to the module's dict */
- moddict = PyModule_GetDict(module);
- if (moddict == NULL)
- goto onError;
+ PyObject *m, *d, *v;
+
+ m = Py_InitModule4(
+ "ucnhash", /* Module name */
+ ucnhash_methods, /* Method list */
+ ucnhash_docstring, /* Module doc-string */
+ (PyObject *)NULL, /* always pass this as *self */
+ PYTHON_API_VERSION); /* API Version */
+ if (!m)
+ return;
+
+ d = PyModule_GetDict(m);
+ if (!d)
+ return;
/* Export C API */
- insobj(
- moddict,
- "ucnhashAPI",
- PyCObject_FromVoidPtr((void *)&hashAPI, NULL));
-
-onError:
- /* Check for errors and report them */
- if (PyErr_Occurred())
- Py_ReportModuleInitError("ucnhash");
- return;
+ v = PyCObject_FromVoidPtr((void *) &hashAPI, NULL);
+ PyDict_SetItemString(d, "Unicode_Names_CAPI", v);
+ Py_XDECREF(v);
}
static const unsigned short G[] =