Fix character names for control characters not being read from the Unicode database

Also allow unicode_names.c to be compiled with Python 2 so I can re-use it in calibre.
2018-05-01 10:13:22 +05:30 · 2018-05-01 10:13:22 +05:30 · f7001ea068
commit f7001ea068
parent aa93c3fb66
6 changed files with 15978 additions and 15966 deletions
--- a/gen-wcwidth.py
+++ b/gen-wcwidth.py
@ -55,7 +55,9 @@ def parse_ucd():
    for line in get_data('ucd/UnicodeData.txt'):
        parts = [x.strip() for x in line.split(';')]
        codepoint = int(parts[0], 16)
-        name = parts[1]
+        name = parts[1] or parts[10]
+        if name == '<control>':
+            name = parts[10]
        if name:
            name_map[codepoint] = name
            for word in name.lower().split():
--- a/kittens/unicode_input/names.h
+++ b/kittens/unicode_input/names.h
--- a/kittens/unicode_input/unicode_names.c
+++ b/kittens/unicode_input/unicode_names.c
@ -85,12 +85,13 @@ nfc(PyObject *self UNUSED, PyObject *args) {
 }

 static PyMethodDef module_methods[] = {
-    METHODB(all_words, METH_NOARGS),
+    {"all_words", (PyCFunction)all_words, METH_NOARGS, ""},
    {"codepoints_for_word", (PyCFunction)cfw, METH_VARARGS, ""},
    {"name_for_codepoint", (PyCFunction)nfc, METH_VARARGS, ""},
    {NULL, NULL, 0, NULL}        /* Sentinel */
 };

+#if PY_VERSION_HEX >= 0x03000000
 static struct PyModuleDef module = {
   .m_base = PyModuleDef_HEAD_INIT,
   .m_name = "unicode_names",   /* name of module */
@ -108,3 +109,13 @@ PyInit_unicode_names(void) {
    if (m == NULL) return NULL;
    return m;
 }
+#else
+EXPORTED
+initunicode_names(void) {
+    PyObject *m;
+    m = Py_InitModule3("unicode_names", module_methods,
+    ""
+    );
+    if (m == NULL) return;
+}
+#endif
--- a/kitty/emoji.h
+++ b/kitty/emoji.h
@ -1,4 +1,4 @@
-// unicode data, built from the unicode standard on: 2018-04-24
+// unicode data, built from the unicode standard on: 2018-05-01
 // see gen-wcwidth.py
 #pragma once
 #include "data-types.h"
--- a/kitty/unicode-data.c
+++ b/kitty/unicode-data.c
@ -1,4 +1,4 @@
-// unicode data, built from the unicode standard on: 2018-04-24
+// unicode data, built from the unicode standard on: 2018-05-01
 // see gen-wcwidth.py
 #include "data-types.h"

--- a/kitty/wcwidth-std.h
+++ b/kitty/wcwidth-std.h
@ -1,4 +1,4 @@
-// unicode data, built from the unicode standard on: 2018-04-24
+// unicode data, built from the unicode standard on: 2018-05-01
 // see gen-wcwidth.py
 #pragma once
 #include "data-types.h"