summary refs log tree commit diff stats
path: root/lib/pure/unidecode/gen.py
diff options
context:
space:
mode:
Diffstat (limited to 'lib/pure/unidecode/gen.py')
-rw-r--r-- lib/pure/unidecode/gen.py 30
1 files changed, 30 insertions, 0 deletions
diff --git a/lib/pure/unidecode/gen.py b/lib/pure/unidecode/gen.py
new file mode 100644
index 000000000..2fb69f7b2
--- /dev/null
+++ b/lib/pure/unidecode/gen.py
@@ -0,0 +1,30 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+
+# Generates the unidecode.dat data file
+# (c) 2010 Andreas Rumpf
+
+from unidecode import unidecode
+try:
+  import warnings
+  warnings.simplefilter("ignore")  # suppress every warning raised while the table is generated
+except ImportError:
+  pass  # warnings module unavailable: carry on with warnings left as they are
+
+def main():
+  f = open("unidecode.dat", "wb+")
+  for x in range(128, 0xffff + 1):
+    u = eval("u'\\u%04x'" % x)
+
+    val = unidecode(u)
+
+    # f.write("%x | " % x)
+    if x == 0x2028: # U+2028 = LINE SEPARATOR
+      val = ""
+    elif x == 0x2029: # U+2029 = PARAGRAPH SEPARATOR
+      val = ""
+    f.write("%s\n" % val)
+
+  f.close()
+
+main()  # unconditional call: runs on import as well as when executed as a script