]> git.cameronkatri.com Git - mandoc.git/blobdiff - chars.in
Start fixing issues that beck@ helped find:
[mandoc.git] / chars.in
index c2ac4c16046f2425718b41e9b75badc33d8f13bb..098504fa164838d1880529f1bddc00be448f62a0 100644 (file)
--- a/chars.in
+++ b/chars.in
@@ -1,6 +1,7 @@
-/*     $Id: chars.in,v 1.19 2009/11/05 07:21:02 kristaps Exp $ */
+/*     $Id: chars.in,v 1.46 2014/04/20 16:46:04 schwarze Exp $ */
 /*
- * Copyright (c) 2009 Kristaps Dzonsons <kristaps@kth.se>
+ * Copyright (c) 2009, 2010, 2011 Kristaps Dzonsons <kristaps@bsd.lv>
+ * Copyright (c) 2014 Ingo Schwarze <schwarze@openbsd.org>
  *
  * Permission to use, copy, modify, and distribute this software for any
  * purpose with or without fee is hereby granted, provided that the above
  */
 
 /*
- * The ASCII translation tables.  STRING corresponds to predefined
- * strings (cf. mdoc_samples.7 and tmac/mdoc/doc-nroff).  CHAR
- * corresponds to special characters (cf. groff_char.7).  BOTH contains
- * sequences that are equivalent in both STRING and CHAR.
+ * The ASCII translation tables.
  *
- * Either way, the left-hand side corresponds to the input sequence (\x,
- * \(xx, \*(xx and so on) whose length is listed second element.  The
- * right-hand side is what's produced by the front-end, with the fourth
- * element being its length.
+ * The left-hand side corresponds to the input sequence (\x, \(xx, \*(xx
+ * and so on) whose length is listed second element.  The right-hand
+ * side is what's produced by the front-end, with the fourth element
+ * being its length.
  *
  * XXX - C-escape strings!
  * XXX - update LINES_MAX if adding more!
  */
 
-/* Non-breaking, non-collapsing space uses unit separator. */
-static const char ascii_nbrsp[2] = { 31, 0 };
+/* Special break control characters. */
+static const char ascii_nbrsp[2] = { ASCII_NBRSP, '\0' };
+static const char ascii_break[2] = { ASCII_BREAK, '\0' };
 
 CHAR_TBL_START
 
 /* Spacing. */
-CHAR("c",                      1,      "",             0,      "",             0)
-CHAR("0",                      1,      " ",            1,      "&#8194;",      7)
-CHAR(" ",                      1,      " ",            1,      "&#8194;",      7)
-CHAR("~",                      1,      ascii_nbrsp,    1,      "&#160;",       6)
-CHAR("%",                      1,      "",             0,      "",             0)
-CHAR("&",                      1,      "",             0,      "",             0)
-CHAR("^",                      1,      "",             0,      "",             0)
-CHAR("|",                      1,      "",             0,      "",             0)
+CHAR(" ",                      ascii_nbrsp,    160)
+CHAR("~",                      ascii_nbrsp,    160)
+CHAR("0",                      " ",            8194)
+CHAR("|",                      "",             0)
+CHAR("^",                      "",             0)
+CHAR("&",                      "",             0)
+CHAR("%",                      "",             0)
+CHAR(":",                      ascii_break,    0)
+/* XXX The following three do not really belong into this file. */
+CHAR("t",                      "",             0)
+CHAR("c",                      "",             0)
+CHAR("}",                      "",             0)
 
 /* Accents. */
-CHAR("a\"",                    2,      "\"",           1,      "&#779;",       6)
-CHAR("a-",                     2,      "-",            1,      "&#175;",       6)
-CHAR("a.",                     2,      ".",            1,      "&#729;",       6)
-CHAR("a^",                     2,      "^",            1,      "&#770;",       6)
-CHAR("\'",                     1,      "\'",           1,      "&#769;",       6)
-BOTH("aa",                     2,      "\'",           1,      "&#769;",       6)
-BOTH("ga",                     2,      "`",            1,      "&#768;",       6)
-CHAR("`",                      1,      "`",            1,      "&#768;",       6)
-CHAR("ab",                     2,      "`",            1,      "&#774;",       6)
-CHAR("ac",                     2,      ",",            1,      "&#807;",       6)
-CHAR("ad",                     2,      "\"",           1,      "&#776;",       6)
-CHAR("ah",                     2,      "v",            1,      "&#711;",       6)
-CHAR("ao",                     2,      "o",            1,      "&#730;",       6)
-CHAR("a~",                     2,      "~",            1,      "&#771;",       6)
-CHAR("ho",                     2,      ",",            1,      "&#808;",       6)
-CHAR("ha",                     2,      "^",            1,      "^",            1)
-CHAR("ti",                     2,      "~",            1,      "~",            1)
+CHAR("a\"",                    "\"",           733)
+CHAR("a-",                     "-",            175)
+CHAR("a.",                     ".",            729)
+CHAR("a^",                     "^",            94)
+CHAR("\'",                     "\'",           180)
+CHAR("aa",                     "\'",           180)
+CHAR("ga",                     "`",            96)
+CHAR("`",                      "`",            96)
+CHAR("ab",                     "`",            728)
+CHAR("ac",                     ",",            184)
+CHAR("ad",                     "\"",           168)
+CHAR("ah",                     "v",            711)
+CHAR("ao",                     "o",            730)
+CHAR("a~",                     "~",            126)
+CHAR("ho",                     ",",            731)
+CHAR("ha",                     "^",            94)
+CHAR("ti",                     "~",            126)
 
 /* Quotes. */
-CHAR("Bq",                     2,      ",,",           2,      "&#8222;",      7)
-CHAR("bq",                     2,      ",",            1,      "&#8218;",      7)
-BOTH("lq",                     2,      "``",           2,      "&#8220;",      7)
-BOTH("rq",                     2,      "\'\'",         2,      "&#8221;",      7)
-CHAR("oq",                     2,      "`",            1,      "&#8216;",      7)
-CHAR("cq",                     2,      "\'",           1,      "&#8217;",      7)
-CHAR("aq",                     2,      "\'",           1,      "\'",           1)
-CHAR("dq",                     2,      "\"",           1,      "\"",           1)
-CHAR("Fo",                     2,      "<<",           2,      "&#171;",       6)
-CHAR("Fc",                     2,      ">>",           2,      "&#187;",       6)
-CHAR("fo",                     2,      "<",            1,      "&#8249;",      7)
-CHAR("fc",                     2,      ">",            1,      "&#8250;",      7)
+CHAR("Bq",                     ",,",           8222)
+CHAR("bq",                     ",",            8218)
+CHAR("lq",                     "``",           8220)
+CHAR("rq",                     "\'\'",         8221)
+CHAR("oq",                     "`",            8216)
+CHAR("cq",                     "\'",           8217)
+CHAR("aq",                     "\'",           39)
+CHAR("dq",                     "\"",           34)
+CHAR("Fo",                     "<<",           171)
+CHAR("Fc",                     ">>",           187)
+CHAR("fo",                     "<",            8249)
+CHAR("fc",                     ">",            8250)
 
 /* Brackets. */
-CHAR("lB",                     2,      "[",            1,      "[",            1)
-CHAR("rB",                     2,      "]",            1,      "]",            1)
-CHAR("lC",                     2,      "{",            1,      "{",            1)
-CHAR("rC",                     2,      "}",            1,      "}",            1)
-CHAR("la",                     2,      "<",            1,      "&#10216;",     8)
-CHAR("ra",                     2,      ">",            1,      "&#10217;",     8)
-CHAR("bv",                     2,      "|",            1,      "&#9130;",      7)
-CHAR("braceex",                        7,      "|",            1,      "&#9130;",      7)
-CHAR("bracketlefttp",          13,     "|",            1,      "&#9121;",      7)
-CHAR("bracketleftbp",          13,     "|",            1,      "&#9123;",      7)
-CHAR("bracketleftex",          13,     "|",            1,      "&#9122;",      7)
-CHAR("bracketrighttp",         14,     "|",            1,      "&#9124;",      7)
-CHAR("bracketrightbp",         14,     "|",            1,      "&#9126;",      7)
-CHAR("bracketrightex",         14,     "|",            1,      "&#9125;",      7)
-CHAR("lt",                     2,      ",-",           2,      "&#9127;",      7)
-CHAR("bracelefttp",            11,     ",-",           2,      "&#9127;",      7)
-CHAR("lk",                     2,      "{",            1,      "&#9128;",      7)
-CHAR("braceleftmid",           12,     "{",            1,      "&#9128;",      7)
-CHAR("lb",                     2,      ",-",           2,      "&#9129;",      7)
-CHAR("braceleftbp",            11,     "`-",           2,      "&#9129;",      7)
-CHAR("braceleftex",            11,     "|",            1,      "&#9130;",      7)
-CHAR("rt",                     2,      "-.",           2,      "&#9131;",      7)
-CHAR("bracerighttp",           12,     "-.",           2,      "&#9131;",      7)
-CHAR("rk",                     2,      "}",            1,      "&#9132;",      7)
-CHAR("bracerightmid",          13,     "}",            1,      "&#9132;",      7)
-CHAR("rb",                     2,      "-\'",          2,      "&#9133;",      7)
-CHAR("bracerightbp",           12,     "-\'",          2,      "&#9133;",      7)
-CHAR("bracerightex",           12,     "|",            1,      "&#9130;",      7)
-CHAR("parenlefttp",            11,     "/",            1,      "&#9115;",      7)
-CHAR("parenleftbp",            11,     "\\",           1,      "&#9117;",      7)
-CHAR("parenleftex",            11,     "|",            1,      "&#9116;",      7)
-CHAR("parenrighttp",           12,     "\\",           1,      "&#9118;",      7)
-CHAR("parenrightbp",           12,     "/",            1,      "&#9120;",      7)
-CHAR("parenrightex",           12,     "|",            1,      "&#9119;",      7)
+CHAR("lB",                     "[",            91)
+CHAR("rB",                     "]",            93)
+CHAR("lC",                     "{",            123)
+CHAR("rC",                     "}",            125)
+CHAR("la",                     "<",            60)
+CHAR("ra",                     ">",            62)
+CHAR("bv",                     "|",            9130)
+CHAR("braceex",                        "|",            9130)
+CHAR("bracketlefttp",          "|",            9121)
+CHAR("bracketleftbp",          "|",            9123)
+CHAR("bracketleftex",          "|",            9122)
+CHAR("bracketrighttp",         "|",            9124)
+CHAR("bracketrightbp",         "|",            9126)
+CHAR("bracketrightex",         "|",            9125)
+CHAR("lt",                     ",-",           9127)
+CHAR("bracelefttp",            ",-",           9127)
+CHAR("lk",                     "{",            9128)
+CHAR("braceleftmid",           "{",            9128)
+CHAR("lb",                     ",-",           9129)
+CHAR("braceleftbp",            "`-",           9129)
+CHAR("braceleftex",            "|",            9130)
+CHAR("rt",                     "-.",           9131)
+CHAR("bracerighttp",           "-.",           9131)
+CHAR("rk",                     "}",            9132)
+CHAR("bracerightmid",          "}",            9132)
+CHAR("rb",                     "-\'",          9133)
+CHAR("bracerightbp",           "-\'",          9133)
+CHAR("bracerightex",           "|",            9130)
+CHAR("parenlefttp",            "/",            9115)
+CHAR("parenleftbp",            "\\",           9117)
+CHAR("parenleftex",            "|",            9116)
+CHAR("parenrighttp",           "\\",           9118)
+CHAR("parenrightbp",           "/",            9120)
+CHAR("parenrightex",           "|",            9119)
 
 /* Greek characters. */
-CHAR("*A",                     2,      "A",            1,      "&#913;",       6)
-CHAR("*B",                     2,      "B",            1,      "&#914;",       6)
-CHAR("*G",                     2,      "|",            1,      "&#915;",       6)
-CHAR("*D",                     2,      "/\\",          2,      "&#916;",       6)
-CHAR("*E",                     2,      "E",            1,      "&#917;",       6)
-CHAR("*Z",                     2,      "Z",            1,      "&#918;",       6)
-CHAR("*Y",                     2,      "H",            1,      "&#919;",       6)
-CHAR("*H",                     2,      "O",            1,      "&#920;",       6)
-CHAR("*I",                     2,      "I",            1,      "&#921;",       6)
-CHAR("*K",                     2,      "K",            1,      "&#922;",       6)
-CHAR("*L",                     2,      "/\\",          2,      "&#923;",       6)
-CHAR("*M",                     2,      "M",            1,      "&#924;",       6)
-CHAR("*N",                     2,      "N",            1,      "&#925;",       6)
-CHAR("*C",                     2,      "H",            1,      "&#926;",       6)
-CHAR("*O",                     2,      "O",            1,      "&#927;",       6)
-CHAR("*P",                     2,      "TT",           2,      "&#928;",       6)
-CHAR("*R",                     2,      "P",            1,      "&#929;",       6)
-CHAR("*S",                     2,      ">",            1,      "&#931;",       6)
-CHAR("*T",                     2,      "T",            1,      "&#932;",       6)
-CHAR("*U",                     2,      "Y",            1,      "&#933;",       6)
-CHAR("*F",                     2,      "O_",           1,      "&#934;",       6)
-CHAR("*X",                     2,      "X",            1,      "&#935;",       6)
-CHAR("*Q",                     2,      "Y",            1,      "&#936;",       6)
-CHAR("*W",                     2,      "O",            1,      "&#937;",       6)
-CHAR("*a",                     2,      "a",            1,      "&#945;",       6)
-CHAR("*b",                     2,      "B",            1,      "&#946;",       6)
-CHAR("*g",                     2,      "y",            1,      "&#947;",       6)
-CHAR("*d",                     2,      "d",            1,      "&#948;",       6)
-CHAR("*e",                     2,      "e",            1,      "&#949;",       6)
-CHAR("*z",                     2,      "C",            1,      "&#950;",       6)
-CHAR("*y",                     2,      "n",            1,      "&#951;",       6)
-CHAR("*h",                     2,      "0",            1,      "&#952;",       6)
-CHAR("*i",                     2,      "i",            1,      "&#953;",       6)
-CHAR("*k",                     2,      "k",            1,      "&#954;",       6)
-CHAR("*l",                     2,      "\\",           1,      "&#955;",       6)
-CHAR("*m",                     2,      "u",            1,      "&#956;",       6)
-CHAR("*n",                     2,      "v",            1,      "&#957;",       6)
-CHAR("*c",                     2,      "E",            1,      "&#958;",       6)
-CHAR("*o",                     2,      "o",            1,      "&#959;",       6)
-CHAR("*p",                     2,      "n",            1,      "&#960;",       6)
-CHAR("*r",                     2,      "p",            1,      "&#961;",       6)
-CHAR("*s",                     2,      "o",            1,      "&#963;",       6)
-CHAR("*t",                     2,      "t",            1,      "&#964;",       6)
-CHAR("*u",                     2,      "u",            1,      "&#965;",       6)
-CHAR("*f",                     2,      "o",            1,      "&#981;",       6)
-CHAR("*x",                     2,      "x",            1,      "&#967;",       6)
-CHAR("*q",                     2,      "u",            1,      "&#968;",       6)
-CHAR("*w",                     2,      "w",            1,      "&#969;",       6)
-CHAR("+h",                     2,      "0",            1,      "&#977;",       6)
-CHAR("+f",                     2,      "o",            1,      "&#966;",       6)
-CHAR("+p",                     2,      "w",            1,      "&#982;",       6)
-CHAR("+e",                     2,      "e",            1,      "&#1013;",      7)
-CHAR("ts",                     2,      "s",            1,      "&#962;",       6)
+CHAR("*A",                     "A",            913)
+CHAR("*B",                     "B",            914)
+CHAR("*G",                     "|",            915)
+CHAR("*D",                     "/\\",          916)
+CHAR("*E",                     "E",            917)
+CHAR("*Z",                     "Z",            918)
+CHAR("*Y",                     "H",            919)
+CHAR("*H",                     "O",            920)
+CHAR("*I",                     "I",            921)
+CHAR("*K",                     "K",            922)
+CHAR("*L",                     "/\\",          923)
+CHAR("*M",                     "M",            924)
+CHAR("*N",                     "N",            925)
+CHAR("*C",                     "H",            926)
+CHAR("*O",                     "O",            927)
+CHAR("*P",                     "TT",           928)
+CHAR("*R",                     "P",            929)
+CHAR("*S",                     ">",            931)
+CHAR("*T",                     "T",            932)
+CHAR("*U",                     "Y",            933)
+CHAR("*F",                     "O_",           934)
+CHAR("*X",                     "X",            935)
+CHAR("*Q",                     "Y",            936)
+CHAR("*W",                     "O",            937)
+CHAR("*a",                     "a",            945)
+CHAR("*b",                     "B",            946)
+CHAR("*g",                     "y",            947)
+CHAR("*d",                     "d",            948)
+CHAR("*e",                     "e",            949)
+CHAR("*z",                     "C",            950)
+CHAR("*y",                     "n",            951)
+CHAR("*h",                     "0",            952)
+CHAR("*i",                     "i",            953)
+CHAR("*k",                     "k",            954)
+CHAR("*l",                     "\\",           955)
+CHAR("*m",                     "u",            956)
+CHAR("*n",                     "v",            957)
+CHAR("*c",                     "E",            958)
+CHAR("*o",                     "o",            959)
+CHAR("*p",                     "n",            960)
+CHAR("*r",                     "p",            961)
+CHAR("*s",                     "o",            963)
+CHAR("*t",                     "t",            964)
+CHAR("*u",                     "u",            965)
+CHAR("*f",                     "o",            981)
+CHAR("*x",                     "x",            967)
+CHAR("*q",                     "u",            968)
+CHAR("*w",                     "w",            969)
+CHAR("+h",                     "0",            977)
+CHAR("+f",                     "o",            966)
+CHAR("+p",                     "w",            982)
+CHAR("+e",                     "e",            1013)
+CHAR("ts",                     "s",            962)
 
 /* Accented letters. */
-CHAR(",C",                     2,      "C",            1,      "&#199;",       6)
-CHAR(",c",                     2,      "c",            1,      "&#231;",       6)
-CHAR("/L",                     2,      "L",            1,      "&#321;",       6)
-CHAR("/O",                     2,      "O",            1,      "&#216;",       6)
-CHAR("/l",                     2,      "l",            1,      "&#322;",       6)
-CHAR("/o",                     2,      "o",            1,      "&#248;",       6)
-CHAR("oA",                     2,      "A",            1,      "&#197;",       6)
-CHAR("oa",                     2,      "a",            1,      "&#229;",       6)
-CHAR(":A",                     2,      "A",            1,      "&#196;",       6)
-CHAR(":E",                     2,      "E",            1,      "&#203;",       6)
-CHAR(":I",                     2,      "I",            1,      "&#207;",       6)
-CHAR(":O",                     2,      "O",            1,      "&#214;",       6)
-CHAR(":U",                     2,      "U",            1,      "&#220;",       6)
-CHAR(":a",                     2,      "a",            1,      "&#228;",       6)
-CHAR(":e",                     2,      "e",            1,      "&#235;",       6)
-CHAR(":i",                     2,      "i",            1,      "&#239;",       6)
-CHAR(":o",                     2,      "o",            1,      "&#245;",       6)
-CHAR(":u",                     2,      "u",            1,      "&#252;",       6)
-CHAR(":y",                     2,      "y",            1,      "&#255;",       6)
-CHAR("\'A",                    2,      "A",            1,      "&#193;",       6)
-CHAR("\'E",                    2,      "E",            1,      "&#201;",       6)
-CHAR("\'I",                    2,      "I",            1,      "&#205;",       6)
-CHAR("\'O",                    2,      "O",            1,      "&#211;",       6)
-CHAR("\'U",                    2,      "U",            1,      "&#218;",       6)
-CHAR("\'a",                    2,      "a",            1,      "&#225;",       6)
-CHAR("\'e",                    2,      "e",            1,      "&#233;",       6)
-CHAR("\'i",                    2,      "i",            1,      "&#237;",       6)
-CHAR("\'o",                    2,      "o",            1,      "&#243;",       6)
-CHAR("\'u",                    2,      "u",            1,      "&#250;",       6)
-CHAR("^A",                     2,      "A",            1,      "&#194;",       6)
-CHAR("^E",                     2,      "E",            1,      "&#202;",       6)
-CHAR("^I",                     2,      "I",            1,      "&#206;",       6)
-CHAR("^O",                     2,      "O",            1,      "&#212;",       6)
-CHAR("^U",                     2,      "U",            1,      "&#219;",       6)
-CHAR("^a",                     2,      "a",            1,      "&#226;",       6)
-CHAR("^e",                     2,      "e",            1,      "&#234;",       6)
-CHAR("^i",                     2,      "i",            1,      "&#238;",       6)
-CHAR("^o",                     2,      "o",            1,      "&#244;",       6)
-CHAR("^u",                     2,      "u",            1,      "&#251;",       6)
-CHAR("`A",                     2,      "A",            1,      "&#192;",       6)
-CHAR("`E",                     2,      "E",            1,      "&#200;",       6)
-CHAR("`I",                     2,      "I",            1,      "&#204;",       6)
-CHAR("`O",                     2,      "O",            1,      "&#210;",       6)
-CHAR("`U",                     2,      "U",            1,      "&#217;",       6)
-CHAR("`a",                     2,      "a",            1,      "&#224;",       6)
-CHAR("`e",                     2,      "e",            1,      "&#232;",       6)
-CHAR("`i",                     2,      "i",            1,      "&#236;",       6)
-CHAR("`o",                     2,      "o",            1,      "&#242;",       6)
-CHAR("`u",                     2,      "u",            1,      "&#249;",       6)
-CHAR("~A",                     2,      "A",            1,      "&#195;",       6)
-CHAR("~N",                     2,      "N",            1,      "&#209;",       6)
-CHAR("~O",                     2,      "O",            1,      "&#213;",       6)
-CHAR("~a",                     2,      "a",            1,      "&#227;",       6)
-CHAR("~n",                     2,      "n",            1,      "&#241;",       6)
-CHAR("~o",                     2,      "o",            1,      "&#245;",       6)
+CHAR(",C",                     "C",            199)
+CHAR(",c",                     "c",            231)
+CHAR("/L",                     "L",            321)
+CHAR("/O",                     "O",            216)
+CHAR("/l",                     "l",            322)
+CHAR("/o",                     "o",            248)
+CHAR("oA",                     "A",            197)
+CHAR("oa",                     "a",            229)
+CHAR(":A",                     "A",            196)
+CHAR(":E",                     "E",            203)
+CHAR(":I",                     "I",            207)
+CHAR(":O",                     "O",            214)
+CHAR(":U",                     "U",            220)
+CHAR(":a",                     "a",            228)
+CHAR(":e",                     "e",            235)
+CHAR(":i",                     "i",            239)
+CHAR(":o",                     "o",            246)
+CHAR(":u",                     "u",            252)
+CHAR(":y",                     "y",            255)
+CHAR("\'A",                    "A",            193)
+CHAR("\'E",                    "E",            201)
+CHAR("\'I",                    "I",            205)
+CHAR("\'O",                    "O",            211)
+CHAR("\'U",                    "U",            218)
+CHAR("\'a",                    "a",            225)
+CHAR("\'e",                    "e",            233)
+CHAR("\'i",                    "i",            237)
+CHAR("\'o",                    "o",            243)
+CHAR("\'u",                    "u",            250)
+CHAR("^A",                     "A",            194)
+CHAR("^E",                     "E",            202)
+CHAR("^I",                     "I",            206)
+CHAR("^O",                     "O",            212)
+CHAR("^U",                     "U",            219)
+CHAR("^a",                     "a",            226)
+CHAR("^e",                     "e",            234)
+CHAR("^i",                     "i",            238)
+CHAR("^o",                     "o",            244)
+CHAR("^u",                     "u",            251)
+CHAR("`A",                     "A",            192)
+CHAR("`E",                     "E",            200)
+CHAR("`I",                     "I",            204)
+CHAR("`O",                     "O",            210)
+CHAR("`U",                     "U",            217)
+CHAR("`a",                     "a",            224)
+CHAR("`e",                     "e",            232)
+CHAR("`i",                     "i",            236)
+CHAR("`o",                     "o",            242)
+CHAR("`u",                     "u",            249)
+CHAR("~A",                     "A",            195)
+CHAR("~N",                     "N",            209)
+CHAR("~O",                     "O",            213)
+CHAR("~a",                     "a",            227)
+CHAR("~n",                     "n",            241)
+CHAR("~o",                     "o",            245)
 
 /* Arrows and lines. */
-CHAR("<-",                     2,      "<-",           2,      "&#8592;",      7)
-CHAR("->",                     2,      "->",           2,      "&#8594;",      7)
-CHAR("<>",                     2,      "<>",           2,      "&#8596;",      7)
-CHAR("da",                     2,      "v",            1,      "&#8595;",      7)
-BOTH("ua",                     2,      "^",            1,      "&#8593;",      7)
-BOTH("va",                     2,      "^v",           2,      "&#8597;",      7)
-CHAR("lA",                     2,      "<=",           2,      "&#8656;",      7)
-CHAR("rA",                     2,      "=>",           2,      "&#8658;",      7)
-CHAR("hA",                     2,      "<=>",          3,      "&#8660;",      7)
-CHAR("dA",                     2,      "v",            1,      "&#8659;",      7)
-CHAR("uA",                     2,      "^",            1,      "&#8657;",      7)
-CHAR("vA",                     2,      "^=v",          3,      "&#8661;",      7)
+CHAR("<-",                     "<-",           8592)
+CHAR("->",                     "->",           8594)
+CHAR("<>",                     "<>",           8596)
+CHAR("da",                     "v",            8595)
+CHAR("ua",                     "^",            8593)
+CHAR("va",                     "^v",           8597)
+CHAR("lA",                     "<=",           8656)
+CHAR("rA",                     "=>",           8658)
+CHAR("hA",                     "<=>",          8660)
+CHAR("dA",                     "v",            8659)
+CHAR("uA",                     "^",            8657)
+CHAR("vA",                     "^=v",          8661)
 
 /* Logic. */
-CHAR("AN",                     2,      "^",            1,      "&#8743;",      7)
-CHAR("OR",                     2,      "v",            1,      "&#8744;",      7)
-CHAR("no",                     2,      "~",            1,      "&#172;",       6)
-CHAR("tno",                    3,      "~",            1,      "&#172;",       6)
-CHAR("te",                     2,      "3",            1,      "&#8707;",      7)
-CHAR("fa",                     2,      "V",            1,      "&#8704;",      7)
-CHAR("st",                     2,      "-)",           2,      "&#8715;",      7)
-CHAR("tf",                     2,      ".:.",          3,      "&#8756;",      7)
-CHAR("3d",                     2,      ".:.",          3,      "&#8756;",      7)
-CHAR("or",                     2,      "|",            1,      "|",            1)
+CHAR("AN",                     "^",            8743)
+CHAR("OR",                     "v",            8744)
+CHAR("no",                     "~",            172)
+CHAR("tno",                    "~",            172)
+CHAR("te",                     "3",            8707)
+CHAR("fa",                     "V",            8704)
+CHAR("st",                     "-)",           8715)
+CHAR("tf",                     ".:.",          8756)
+CHAR("3d",                     ".:.",          8756)
+CHAR("or",                     "|",            124)
 
 /* Mathematicals. */
-CHAR("pl",                     2,      "+",            1,      "&#43;",        5)
-CHAR("mi",                     2,      "-",            1,      "&#8722;",      7)
-CHAR("-",                      1,      "-",            1,      "-",            1)
-CHAR("-+",                     2,      "-+",           2,      "&#8723;",      7)
-CHAR("+-",                     2,      "+-",           2,      "&#177;",       6)
-CHAR("t+-",                    3,      "+-",           2,      "&#177;",       6)
-CHAR("pc",                     2,      ".",            1,      "&#183;",       6)
-CHAR("md",                     2,      ".",            1,      "&#8901;",      7)
-CHAR("mu",                     2,      "x",            1,      "&#215;",       6)
-CHAR("tmu",                    3,      "x",            1,      "&#215;",       6)
-CHAR("c*",                     2,      "x",            1,      "&#8855;",      7)
-CHAR("c+",                     2,      "+",            1,      "&#8853;",      7)
-CHAR("di",                     2,      "-:-",          3,      "&#247;",       6)
-CHAR("tdi",                    3,      "-:-",          3,      "&#247;",       6)
-CHAR("f/",                     2,      "/",            1,      "&#8260;",      7)
-CHAR("**",                     2,      "*",            1,      "&#8727;",      7)
-BOTH("<=",                     2,      "<=",           2,      "&#8804;",      7)
-BOTH(">=",                     2,      ">=",           2,      "&#8805;",      7)
-CHAR("<<",                     2,      "<<",           2,      "&#8810;",      7)
-CHAR(">>",                     2,      ">>",           2,      "&#8811;",      7)
-CHAR("eq",                     2,      "=",            1,      "&#61;",        5)
-CHAR("!=",                     2,      "!=",           2,      "&#8800;",      7)
-CHAR("==",                     2,      "==",           2,      "&#8801;",      7)
-CHAR("ne",                     2,      "!==",          3,      "&#8802;",      7)
-CHAR("=~",                     2,      "=~",           2,      "&#8773;",      7)
-CHAR("-~",                     2,      "-~",           2,      "&#8771;",      7)
-CHAR("ap",                     2,      "~",            1,      "&#8764;",      7)
-CHAR("~~",                     2,      "~~",           2,      "&#8776;",      7)
-CHAR("~=",                     2,      "~=",           2,      "&#8780;",      7)
-CHAR("pt",                     2,      "oc",           2,      "&#8733;",      7)
-CHAR("es",                     2,      "{}",           2,      "&#8709;",      7)
-CHAR("mo",                     2,      "E",            1,      "&#8712;",      7)
-CHAR("nm",                     2,      "!E",           2,      "&#8713;",      7)
-CHAR("sb",                     2,      "(=",           2,      "&#8834;",      7)
-CHAR("nb",                     2,      "(!=",          3,      "&#8836;",      7)
-CHAR("sp",                     2,      "=)",           2,      "&#8835;",      7)
-CHAR("nc",                     2,      "!=)",          3,      "&#8837;",      7)
-CHAR("ib",                     2,      "(=",           2,      "&#8838;",      7)
-CHAR("ip",                     2,      "=)",           2,      "&#8839;",      7)
-CHAR("ca",                     2,      "(^)",          3,      "&#8745;",      7)
-CHAR("cu",                     2,      "U",            1,      "&#8746;",      7)
-CHAR("/_",                     2,      "/_",           2,      "&#8736;",      7)
-CHAR("pp",                     2,      "_|_",          3,      "&#8869;",      7)
-CHAR("is",                     2,      "I",            1,      "&#8747;",      7)
-CHAR("integral",               8,      "I",            1,      "&#8747;",      7)
-CHAR("sum",                    3,      "E",            1,      "&#8721;",      7)
-CHAR("product",                        7,      "TT",           2,      "&#8719;",      7)
-CHAR("coproduct",              9,      "U",            1,      "&#8720;",      7)
-CHAR("gr",                     2,      "V",            1,      "&#8711;",      7)
-CHAR("sr",                     2,      "\\/",          2,      "&#8730;",      7)
-CHAR("sqrt",                   4,      "\\/",          2,      "&#8730;",      7)
-CHAR("lc",                     2,      "|~",           2,      "&#8968;",      7)
-CHAR("rc",                     2,      "~|",           2,      "&#8969;",      7)
-CHAR("lf",                     2,      "|_",           2,      "&#8970;",      7)
-CHAR("rf",                     2,      "_|",           2,      "&#8971;",      7)
-CHAR("if",                     2,      "oo",           2,      "&#8734;",      7)
-CHAR("Ah",                     2,      "N",            1,      "&#8501;",      7)
-CHAR("Im",                     2,      "I",            1,      "&#8465;",      7)
-CHAR("Re",                     2,      "R",            1,      "&#8476;",      7)
-CHAR("pd",                     2,      "a",            1,      "&#8706;",      7)
-CHAR("-h",                     2,      "/h",           2,      "&#8463;",      7)
+CHAR("pl",                     "+",            43)
+CHAR("mi",                     "-",            8722)
+CHAR("-",                      "-",            45)
+CHAR("-+",                     "-+",           8723)
+CHAR("+-",                     "+-",           177)
+CHAR("t+-",                    "+-",           177)
+CHAR("pc",                     ".",            183)
+CHAR("md",                     ".",            8901)
+CHAR("mu",                     "x",            215)
+CHAR("tmu",                    "x",            215)
+CHAR("c*",                     "x",            8855)
+CHAR("c+",                     "+",            8853)
+CHAR("di",                     "-:-",          247)
+CHAR("tdi",                    "-:-",          247)
+CHAR("f/",                     "/",            8260)
+CHAR("**",                     "*",            8727)
+CHAR("<=",                     "<=",           8804)
+CHAR(">=",                     ">=",           8805)
+CHAR("<<",                     "<<",           8810)
+CHAR(">>",                     ">>",           8811)
+CHAR("eq",                     "=",            61)
+CHAR("!=",                     "!=",           8800)
+CHAR("==",                     "==",           8801)
+CHAR("ne",                     "!==",          8802)
+CHAR("=~",                     "=~",           8773)
+CHAR("-~",                     "-~",           8771)
+CHAR("ap",                     "~",            8764)
+CHAR("~~",                     "~~",           8776)
+CHAR("~=",                     "~=",           8780)
+CHAR("pt",                     "oc",           8733)
+CHAR("es",                     "{}",           8709)
+CHAR("mo",                     "E",            8712)
+CHAR("nm",                     "!E",           8713)
+CHAR("sb",                     "(=",           8834)
+CHAR("nb",                     "(!=",          8836)
+CHAR("sp",                     "=)",           8835)
+CHAR("nc",                     "!=)",          8837)
+CHAR("ib",                     "(=",           8838)
+CHAR("ip",                     "=)",           8839)
+CHAR("ca",                     "(^)",          8745)
+CHAR("cu",                     "U",            8746)
+CHAR("/_",                     "/_",           8736)
+CHAR("pp",                     "_|_",          8869)
+CHAR("is",                     "I",            8747)
+CHAR("integral",               "I",            8747)
+CHAR("sum",                    "E",            8721)
+CHAR("product",                        "TT",           8719)
+CHAR("coproduct",              "U",            8720)
+CHAR("gr",                     "V",            8711)
+CHAR("sr",                     "\\/",          8730)
+CHAR("sqrt",                   "\\/",          8730)
+CHAR("lc",                     "|~",           8968)
+CHAR("rc",                     "~|",           8969)
+CHAR("lf",                     "|_",           8970)
+CHAR("rf",                     "_|",           8971)
+CHAR("if",                     "oo",           8734)
+CHAR("Ah",                     "N",            8501)
+CHAR("Im",                     "I",            8465)
+CHAR("Re",                     "R",            8476)
+CHAR("pd",                     "a",            8706)
+CHAR("-h",                     "/h",           8463)
+CHAR("12",                     "1/2",          189)
+CHAR("14",                     "1/4",          188)
+CHAR("34",                     "3/4",          190)
 
 /* Ligatures. */
-CHAR("ff",                     2,      "ff",           2,      "&#64256;",     8)
-CHAR("fi",                     2,      "fi",           2,      "&#64257;",     8)
-CHAR("fl",                     2,      "fl",           2,      "&#64258;",     8)
-CHAR("Fi",                     2,      "ffi",          3,      "&#64259;",     8)
-CHAR("Fl",                     2,      "ffl",          3,      "&#64260;",     8)
-CHAR("AE",                     2,      "AE",           2,      "&#198;",       6)
-CHAR("ae",                     2,      "ae",           2,      "&#230;",       6)
-CHAR("OE",                     2,      "OE",           2,      "&#338;",       6)
-CHAR("oe",                     2,      "oe",           2,      "&#339;",       6)
-CHAR("ss",                     2,      "ss",           2,      "&#223;",       6)
-CHAR("IJ",                     2,      "IJ",           2,      "&#306;",       6)
-CHAR("ij",                     2,      "ij",           2,      "&#307;",       6)
+CHAR("ff",                     "ff",           64256)
+CHAR("fi",                     "fi",           64257)
+CHAR("fl",                     "fl",           64258)
+CHAR("Fi",                     "ffi",          64259)
+CHAR("Fl",                     "ffl",          64260)
+CHAR("AE",                     "AE",           198)
+CHAR("ae",                     "ae",           230)
+CHAR("OE",                     "OE",           338)
+CHAR("oe",                     "oe",           339)
+CHAR("ss",                     "ss",           223)
+CHAR("IJ",                     "IJ",           306)
+CHAR("ij",                     "ij",           307)
 
 /* Special letters. */
-CHAR("-D",                     2,      "D",            1,      "&#208;",       6)
-CHAR("Sd",                     2,      "o",            1,      "&#240;",       6)
-CHAR("TP",                     2,      "b",            1,      "&#222;",       6)
-CHAR("Tp",                     2,      "b",            1,      "&#254;",       6)
-CHAR(".i",                     2,      "i",            1,      "&#305;",       6)
-CHAR(".j",                     2,      "j",            1,      "&#567;",       6)
+CHAR("-D",                     "D",            208)
+CHAR("Sd",                     "o",            240)
+CHAR("TP",                     "b",            222)
+CHAR("Tp",                     "b",            254)
+CHAR(".i",                     "i",            305)
+CHAR(".j",                     "j",            567)
 
 /* Currency. */
-CHAR("Do",                     2,      "$",            1,      "$",            1)
-CHAR("ct",                     2,      "c",            1,      "&#162;",       6)
-CHAR("Eu",                     2,      "EUR",          3,      "&#8364;",      7)
-CHAR("eu",                     2,      "EUR",          3,      "&#8364;",      7)
-CHAR("Ye",                     2,      "Y",            1,      "&#165;",       6)
-CHAR("Po",                     2,      "L",            1,      "&#163;",       6)
-CHAR("Cs",                     2,      "x",            1,      "&#164;",       6)
-CHAR("Fn",                     2,      "f",            1,      "&#402;",       6)
-
-/* Old style. */
-STRING("Am",                   2,      "&",            1,      "&amp;",        5)
-STRING("Ba",                   2,      "|",            1,      "|",            1)
-STRING("Ge",                   2,      ">=",           2,      "&#8805;",      7)
-STRING("Gt",                   2,      ">",            1,      "&gt;",         4)
-STRING("If",                   2,      "infinity",     8,      "infinity",     8)
-STRING("Le",                   2,      "<=",           2,      "&#8804;",      7)
-STRING("Lq",                   2,      "``",           2,      "&#8220;",      7)
-STRING("Lt",                   2,      "<",            1,      "&lt;",         4)
-STRING("Na",                   2,      "NaN",          3,      "NaN",          3)
-STRING("Ne",                   2,      "!=",           2,      "&#8800;",      7)
-STRING("Pi",                   2,      "pi",           2,      "&#960;",       6)
-STRING("Pm",                   2,      "+-",           2,      "&#177;",       6)
-STRING("R",                    1,      "(R)",          3,      "&#174;",       6)
-STRING("Rq",                   2,      "\'\'",         2,      "&#8221;",      7)
-STRING("Tm",                   2,      "tm",           2,      "&#8482;",      7)
-STRING("left-bracket",         12,     "[",            1,      "[",            1)
-STRING("left-parenthesis",     16,     "(",            1,      "(",            1)
-STRING("left-singlequote",     16,     "`",            1,      "&#8216;",      7)
-STRING("lp",                   2,      "(",            1,      "(",            1)
-STRING("q",                    1,      "\"",           1,      "&quot;",       6)
-STRING("quote-left",           10,     "`",            1,      "&#8216;",      7)
-STRING("quote-right",          11,     "\'",           1,      "&#8217;",      7)
-STRING("right-bracket",                13,     "]",            1,      "]",            1)
-STRING("right-parenthesis",    17,     ")",            1,      ")",            1)
-STRING("right-singlequote",    17,     "\'",           1,      "&#8217;",      7)
-STRING("rp",                   2,      ")",            1,      ")",            1)
+CHAR("Do",                     "$",            36)
+CHAR("ct",                     "c",            162)
+CHAR("Eu",                     "EUR",          8364)
+CHAR("eu",                     "EUR",          8364)
+CHAR("Ye",                     "Y",            165)
+CHAR("Po",                     "L",            163)
+CHAR("Cs",                     "x",            164)
+CHAR("Fn",                     "f",            402)
 
 /* Lines. */
-CHAR("ba",                     2,      "|",            1,      "&#124;",       6)
-CHAR("br",                     2,      "|",            1,      "&#9474;",      7)
-CHAR("ul",                     2,      "_",            1,      "&#95;",        5)
-CHAR("rl",                     2,      "-",            1,      "&#8254;",      7)
-CHAR("bb",                     2,      "|",            1,      "&#166;",       6)
-CHAR("sl",                     2,      "/",            1,      "&#47;",        5)
-CHAR("rs",                     2,      "\\",           1,      "&#92;",        5)
+CHAR("ba",                     "|",            124)
+CHAR("br",                     "|",            9474)
+CHAR("ul",                     "_",            95)
+CHAR("rl",                     "-",            8254)
+CHAR("bb",                     "|",            166)
+CHAR("sl",                     "/",            47)
+CHAR("rs",                     "\\",           92)
 
 /* Text markers. */
-CHAR("ci",                     2,      "o",            1,      "&#9675;",      7)
-CHAR("bu",                     2,      "o",            1,      "&#8226;",      7)
-CHAR("dd",                     2,      "=",            1,      "&#8225;",      7)
-CHAR("dg",                     2,      "-",            1,      "&#8224;",      7)
-CHAR("lz",                     2,      "<>",           2,      "&#9674;",      7)
-CHAR("sq",                     2,      "[]",           2,      "&#9633;",      7)
-CHAR("ps",                     2,      "9|",           2,      "&#182;",       6)
-CHAR("sc",                     2,      "S",            1,      "&#167;",       6)
-CHAR("lh",                     2,      "<=",           2,      "&#9756;",      7)
-CHAR("rh",                     2,      "=>",           2,      "&#9758;",      7)
-CHAR("at",                     2,      "@",            1,      "&#64;",        5)
-CHAR("sh",                     2,      "#",            1,      "&#35;",        5)
-CHAR("CR",                     2,      "_|",           2,      "&#8629;",      7)
-CHAR("OK",                     2,      "\\/",          2,      "&#10003;",     8)
+CHAR("ci",                     "o",            9675)
+CHAR("bu",                     "o",            8226)
+CHAR("dd",                     "=",            8225)
+CHAR("dg",                     "-",            8224)
+CHAR("lz",                     "<>",           9674)
+CHAR("sq",                     "[]",           9633)
+CHAR("ps",                     "9|",           182)
+CHAR("sc",                     "S",            167)
+CHAR("lh",                     "<=",           9756)
+CHAR("rh",                     "=>",           9758)
+CHAR("at",                     "@",            64)
+CHAR("sh",                     "#",            35)
+CHAR("CR",                     "_|",           8629)
+CHAR("OK",                     "\\/",          10003)
 
 /* Legal symbols. */
-CHAR("co",                     2,      "(C)",          3,      "&#169;",       6)
-CHAR("rg",                     2,      "(R)",          3,      "&#174;",       6)
-CHAR("tm",                     2,      "tm",           2,      "&#8482;",      7)
+CHAR("co",                     "(C)",          169)
+CHAR("rg",                     "(R)",          174)
+CHAR("tm",                     "tm",           8482)
 
 /* Punctuation. */
-CHAR(".",                      1,      ".",            1,      ".",            1)
-CHAR("r!",                     2,      "i",            1,      "&#161;",       6)
-CHAR("r?",                     2,      "c",            1,      "&#191;",       6)
-CHAR("em",                     2,      "--",           2,      "&#8212;",      7)
-CHAR("en",                     2,      "-",            1,      "&#8211;",      7)
-CHAR("hy",                     2,      "-",            1,      "&#8208;",      7)
-CHAR("\\",                     1,      "\\",           1,      "\\",           1)
-CHAR("e",                      1,      "\\",           1,      "\\",           1)
+CHAR(".",                      ".",            46)
+CHAR("r!",                     "i",            161)
+CHAR("r?",                     "c",            191)
+CHAR("em",                     "--",           8212)
+CHAR("en",                     "-",            8211)
+CHAR("hy",                     "-",            8208)
+CHAR("e",                      "\\",           92)
 
 /* Units. */
-CHAR("de",                     2,      "o",            1,      "&#176;",       6)
-CHAR("%0",                     2,      "%o",           2,      "&#8240;",      7)
-CHAR("fm",                     2,      "\'",           1,      "&#8242;",      7)
-CHAR("sd",                     2,      "\"",           1,      "&#8243;",      7)
-CHAR("mc",                     2,      "mu",           2,      "&#181;",       6)
+CHAR("de",                     "o",            176)
+CHAR("%0",                     "%o",           8240)
+CHAR("fm",                     "\'",           8242)
+CHAR("sd",                     "\"",           8243)
+CHAR("mc",                     "mu",           181)
 
 CHAR_TBL_END