compress unicode decomposition tables (this saves another 55k)

commit: 7b7dd107b3654926fb75215805d6c0c8a15bf89e [log] [tgz]
author: Fredrik Lundh <fredrik@pythonware.com> Sun Jan 21 22:41:08 2001 +0000
committer: Fredrik Lundh <fredrik@pythonware.com> Sun Jan 21 22:41:08 2001 +0000
tree: 13b2631ae40737b8f28e2466e0a64e1278564220
parent: f75c9d94b4cb9f11f0ed046aa775478e559b4081 [diff] [blame]
diff --git a/Modules/ucnhash.c b/Modules/ucnhash.c
index 248300e..bdcdab1 100644
--- a/Modules/ucnhash.c
+++ b/Modules/ucnhash.c

@@ -38,7 +38,7 @@
 
     /* get offset into phrasebook */
     offset = phrasebook_offset1[(code>>phrasebook_shift)];
-    offset = phrasebook_offset2[(offset<<phrasebook_shift)+
+    offset = phrasebook_offset2[(offset<<phrasebook_shift) +
                                (code&((1<<phrasebook_shift)-1))];
     if (!offset)
         return 0;
@@ -47,13 +47,12 @@
 
     for (;;) {
         /* get word index */
-        if (phrasebook[offset] & 128) {
-            word = phrasebook[offset] & 127;
-            offset++;
-        } else {
-            word = (phrasebook[offset]<<8) + phrasebook[offset+1];
-            offset+=2;
-        }
+        word = phrasebook[offset] - phrasebook_short;
+        if (word >= 0) {
+            word = (word << 8) + phrasebook[offset+1];
+            offset += 2;
+        } else
+            word = phrasebook[offset++];
         if (i) {
             if (i > buflen)
                 return 0; /* buffer overflow */
commit	7b7dd107b3654926fb75215805d6c0c8a15bf89e	[log] [tgz]
author	Fredrik Lundh <fredrik@pythonware.com>	Sun Jan 21 22:41:08 2001 +0000
committer	Fredrik Lundh <fredrik@pythonware.com>	Sun Jan 21 22:41:08 2001 +0000
tree	13b2631ae40737b8f28e2466e0a64e1278564220
parent	f75c9d94b4cb9f11f0ed046aa775478e559b4081 [diff] [blame]