1 files changed, 193 insertions, 0 deletions
diff --git a/util/import_unicode.py b/util/import_unicode.py
new file mode 100644
index 0000000..08f8059
--- /dev/null
+++ b/util/import_unicode.py
@@ -0,0 +1,193 @@
+#*
+#*  GRUB  --  GRand Unified Bootloader
+#*  Copyright (C) 2010  Free Software Foundation, Inc.
+#*
+#*  GRUB is free software: you can redistribute it and/or modify
+#*  it under the terms of the GNU General Public License as published by
+#*  the Free Software Foundation, either version 3 of the License, or
+#*  (at your option) any later version.
+#*
+#*  GRUB is distributed in the hope that it will be useful,
+#*  but WITHOUT ANY WARRANTY; without even the implied warranty of
+#*  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+#*  GNU General Public License for more details.
+#*
+#*  You should have received a copy of the GNU General Public License
+#*  along with GRUB.  If not, see <http://www.gnu.org/licenses/>.
+#*
+
+import re
+import sys
+
+if len (sys.argv) < 3:
+    print ("Usage: %s SOURCE DESTINATION" % sys.argv[0])
+    exit (0)
+infile = open (sys.argv[3], "r")
+joining = {}
+for line in infile:
+    line = re.sub ("#.*$", "", line)
+    line = line.replace ("\n", "")
+    line = line.replace (" ", "")
+    if len (line) == 0 or line[0] == '\n':
+        continue
+    sp = line.split (";")
+    curcode = int (sp[0], 16)
+    if sp[2] == "U":
+        joining[curcode] = "NONJOINING"
+    elif sp[2] == "L":
+        joining[curcode] = "LEFT"
+    elif sp[2] == "R":
+        joining[curcode] = "RIGHT"
+    elif sp[2] == "D":
+        joining[curcode] = "DUAL"
+    elif sp[2] == "C":
+        joining[curcode] = "CAUSING"
+    else:
+        print ("Unknown joining type '%s'" % sp[2])
+        exit (1)
+infile.close ()
+
+infile = open (sys.argv[1], "r")
+outfile = open (sys.argv[4], "w")
+outfile.write ("#include <grub/unicode.h>\n")
+outfile.write ("\n")
+outfile.write ("struct grub_unicode_compact_range grub_unicode_compact[] = {\n")
+
+begincode = -2
+lastcode = -2
+lastbiditype = "X"
+lastmirrortype = False
+lastcombtype = -1
+arabicsubst = {}
+for line in infile:
+    sp = line.split (";")
+    curcode = int (sp[0], 16)
+    curcombtype = int (sp[3], 10)
+    curbiditype = sp[4]
+    curmirrortype = (sp[9] == "Y")
+    if curcombtype <= 255 and curcombtype >= 253:
+        print ("UnicodeData.txt uses combination type %d. Conflict." \
+                   % curcombtype)
+        raise
+    if sp[2] != "Lu" and sp[2] != "Ll" and sp[2] != "Lt" and sp[2] != "Lm" \
+            and sp[2] != "Lo"\
+            and sp[2] != "Me" and sp[2] != "Mc" and sp[2] != "Mn" \
+            and sp[2] != "Nd" and sp[2] != "Nl" and sp[2] != "No" \
+            and sp[2] != "Pc" and sp[2] != "Pd" and sp[2] != "Ps" \
+            and sp[2] != "Pe" and sp[2] != "Pi" and sp[2] != "Pf" \
+            and sp[2] != "Po" \
+            and sp[2] != "Sm" and sp[2] != "Sc" and sp[2] != "Sk" \
+            and sp[2] != "So"\
+            and sp[2] != "Zs" and sp[2] != "Zl" and sp[2] != "Zp" \
+            and sp[2] != "Cc" and sp[2] != "Cf" and sp[2] != "Cs" \
+            and sp[2] != "Co":
+        print ("WARNING: Unknown type %s" % sp[2])
+    if curcombtype == 0 and sp[2] == "Me":
+        curcombtype = 253
+    if curcombtype == 0 and sp[2] == "Mc":
+        curcombtype = 254
+    if curcombtype == 0 and sp[2] == "Mn":
+        curcombtype = 255
+    if (curcombtype >= 2 and curcombtype <= 6) \
+            or (curcombtype >= 37 and curcombtype != 84 and curcombtype != 91  and curcombtype != 103 and curcombtype != 107 and curcombtype != 118 and curcombtype != 122 and curcombtype != 129 and curcombtype != 130 and curcombtype != 132 and curcombtype != 202 and \
+                curcombtype != 214 and curcombtype != 216 and \
+                curcombtype != 218 and curcombtype != 220 and \
+                curcombtype != 222 and curcombtype != 224 and curcombtype != 226 and curcombtype != 228 and \
+                curcombtype != 230 and curcombtype != 232 and curcombtype != 233 and \
+                curcombtype != 234 and \
+                curcombtype != 240 and curcombtype != 253 and \
+                curcombtype != 254 and curcombtype != 255):
+        print ("WARNING: Unknown combining type %d" % curcombtype)
+    if curcode in joining:
+        curjoin = joining[curcode]
+    elif sp[2] == "Me" or sp[2] == "Mn" or sp[2] == "Cf":
+        curjoin = "TRANSPARENT"
+    else:
+        curjoin = "NONJOINING"
+    if sp[1].startswith ("ARABIC LETTER "):
+        arabname = sp[1][len ("ARABIC LETTER "):]
+        form = 0
+        if arabname.endswith (" ISOLATED FORM"):
+            arabname = arabname[0:len (arabname) - len (" ISOLATED FORM")]
+            form = 1
+        if arabname.endswith (" FINAL FORM"):
+            arabname = arabname[0:len (arabname) - len (" FINAL FORM")]
+            form = 2
+        if arabname.endswith (" MEDIAL FORM"):
+            arabname = arabname[0:len (arabname) - len (" MEDIAL FORM")]
+            form = 3
+        if arabname.endswith (" INITIAL FORM"):
+            arabname = arabname[0:len (arabname) - len (" INITIAL FORM")]
+            form = 4
+        if arabname not in arabicsubst:
+            arabicsubst[arabname]={}
+        arabicsubst[arabname][form] = curcode;
+        if form == 0:
+            arabicsubst[arabname]['join'] = curjoin
+    if lastcode + 1 != curcode or curbiditype != lastbiditype \
+            or curcombtype != lastcombtype or curmirrortype != lastmirrortype \
+            or curjoin != lastjoin:
+        if begincode != -2 and (lastbiditype != "L" or lastcombtype != 0 or \
+                                    lastmirrortype):
+            outfile.write (("{0x%x, 0x%x, GRUB_BIDI_TYPE_%s, %d, %d, GRUB_JOIN_TYPE_%s},\n" \
+                                % (begincode, lastcode - begincode + 1, \
+                                       lastbiditype, \
+                                       lastcombtype, lastmirrortype, \
+                                       lastjoin)))
+            if lastcode - begincode + 1 >= 0x200:
+                print ("Too long range")
+                raise
+        begincode = curcode
+    lastcode = curcode
+    lastjoin = curjoin
+    lastbiditype = curbiditype
+    lastcombtype = curcombtype
+    lastmirrortype = curmirrortype
+if lastbiditype != "L" or lastcombtype != 0 or lastmirrortype:
+    outfile.write (("{0x%x, 0x%x, GRUB_BIDI_TYPE_%s, %d, %d, GRUB_JOIN_TYPE_%s},\n" \
+                        % (begincode, lastcode, lastbiditype, lastcombtype, \
+                               lastmirrortype, lastjoin)))
+outfile.write ("{0, 0, 0, 0, 0, 0},\n")
+
+outfile.write ("};\n")
+
+infile.close ()
+
+infile = open (sys.argv[2], "r")
+
+outfile.write ("struct grub_unicode_bidi_pair grub_unicode_bidi_pairs[] = {\n")
+
+for line in infile:
+    line = re.sub ("#.*$", "", line)
+    line = line.replace ("\n", "")
+    line = line.replace (" ", "")
+    if len (line) == 0 or line[0] == '\n':
+        continue
+    sp = line.split (";")
+    code1 = int (sp[0], 16)
+    code2 = int (sp[1], 16)
+    outfile.write ("{0x%x, 0x%x},\n" % (code1, code2))
+outfile.write ("{0, 0},\n")
+outfile.write ("};\n")
+
+infile.close ()
+
+outfile.write ("struct grub_unicode_arabic_shape grub_unicode_arabic_shapes[] = {\n ")
+
+for x in arabicsubst:
+    try:
+        if arabicsubst[x]['join'] == "DUAL":
+            outfile.write ("{0x%x, 0x%x, 0x%x, 0x%x, 0x%x},\n " % (arabicsubst[x][0], arabicsubst[x][1], arabicsubst[x][2], arabicsubst[x][3], arabicsubst[x][4]))
+        elif arabicsubst[x]['join'] == "RIGHT":
+            outfile.write ("{0x%x, 0x%x, 0x%x, 0x%x, 0x%x},\n " % (arabicsubst[x][0], arabicsubst[x][1], arabicsubst[x][2], 0, 0))
+        elif arabicsubst[x]['join'] == "LEFT":
+            outfile.write ("{0x%x, 0x%x, 0x%x, 0x%x, 0x%x},\n " % (arabicsubst[x][0], arabicsubst[x][1], 0, 0, arabicsubst[x][4]))
+    except:
+        pass
+
+outfile.write ("{0, 0, 0, 0, 0},\n")
+outfile.write ("};\n")
+
+
+outfile.close ()
+