]> git.cameronkatri.com Git - mandoc.git/blobdiff - chars.c
In the fallback code to look for manual pages without using mandoc.db(5),
[mandoc.git] / chars.c
diff --git a/chars.c b/chars.c
index f1f5d5d78ca8c322f26b7a9995c5754e402ffd82..d54fc458aea2c05aab00491b805de18394c81dea 100644 (file)
--- a/chars.c
+++ b/chars.c
@@ -1,7 +1,8 @@
-/*     $Id: chars.c,v 1.69 2017/02/17 18:28:06 schwarze Exp $ */
+/*     $Id: chars.c,v 1.79 2020/02/13 16:18:29 schwarze Exp $ */
 /*
  * Copyright (c) 2009, 2010, 2011 Kristaps Dzonsons <kristaps@bsd.lv>
- * Copyright (c) 2011, 2014, 2015 Ingo Schwarze <schwarze@openbsd.org>
+ * Copyright (c) 2011, 2014, 2015, 2017, 2018, 2020
+ *               Ingo Schwarze <schwarze@openbsd.org>
  *
  * Permission to use, copy, modify, and distribute this software for any
  * purpose with or without fee is hereby granted, provided that the above
@@ -23,6 +24,7 @@
 #include <ctype.h>
 #include <stddef.h>
 #include <stdint.h>
+#include <stdio.h>
 #include <stdlib.h>
 #include <string.h>
 
@@ -46,21 +48,15 @@ static struct ln lines[] = {
        /* Spacing. */
        { " ",                  ascii_nbrsp,    0x00a0  },
        { "~",                  ascii_nbrsp,    0x00a0  },
-       { "0",                  " ",            0x2002  },
-       { "|",                  "",             0       },
-       { "^",                  "",             0       },
-       { "&",                  "",             0       },
-       { "%",                  "",             0       },
+       { "0",                  ascii_nbrsp,    0x00a0  },
        { ":",                  ascii_break,    0       },
-       /* XXX The following three do not really belong here. */
-       { "t",                  "",             0       },
-       { "c",                  "",             0       },
-       { "}",                  "",             0       },
 
        /* Lines. */
        { "ba",                 "|",            0x007c  },
        { "br",                 "|",            0x2502  },
        { "ul",                 "_",            0x005f  },
+       { "_",                  "_",            0x005f  },
+       { "ru",                 "_",            0x005f  },
        { "rn",                 "-",            0x203e  },
        { "bb",                 "|",            0x00a6  },
        { "sl",                 "/",            0x002f  },
@@ -69,18 +65,22 @@ static struct ln lines[] = {
        /* Text markers. */
        { "ci",                 "O",            0x25cb  },
        { "bu",                 "+\bo",         0x2022  },
-       { "dd",                 "|\b=",         0x2021  },
-       { "dg",                 "|\b-",         0x2020  },
+       { "dd",                 "<**>",         0x2021  },
+       { "dg",                 "<*>",          0x2020  },
        { "lz",                 "<>",           0x25ca  },
        { "sq",                 "[]",           0x25a1  },
-       { "ps",                 "<par>",        0x00b6  },
-       { "sc",                 "<sec>",        0x00a7  },
+       { "ps",                 "<paragraph>",  0x00b6  },
+       { "sc",                 "<section>",    0x00a7  },
        { "lh",                 "<=",           0x261c  },
        { "rh",                 "=>",           0x261e  },
        { "at",                 "@",            0x0040  },
        { "sh",                 "#",            0x0023  },
-       { "CR",                 "_|",           0x21b5  },
+       { "CR",                 "<cr>",         0x21b5  },
        { "OK",                 "\\/",          0x2713  },
+       { "CL",                 "C",            0x2663  },
+       { "SP",                 "S",            0x2660  },
+       { "HE",                 "H",            0x2665  },
+       { "DI",                 "D",            0x2666  },
 
        /* Legal symbols. */
        { "co",                 "(C)",          0x00a9  },
@@ -161,17 +161,18 @@ static struct ln lines[] = {
        { "uA",                 "=\b^",         0x21d1  },
        { "dA",                 "=\bv",         0x21d3  },
        { "vA",                 "^=v",          0x21d5  },
+       { "an",                 "-",            0x23af  },
 
        /* Logic. */
        { "AN",                 "^",            0x2227  },
        { "OR",                 "v",            0x2228  },
        { "no",                 "~",            0x00ac  },
        { "tno",                "~",            0x00ac  },
-       { "te",                 "3",            0x2203  },
-       { "fa",                 "-\bV",         0x2200  },
-       { "st",                 "-)",           0x220b  },
-       { "tf",                 ".:.",          0x2234  },
-       { "3d",                 ".:.",          0x2234  },
+       { "te",                 "<there\037exists>", 0x2203 },
+       { "fa",                 "<for\037all>", 0x2200  },
+       { "st",                 "<such\037that>", 0x220b },
+       { "tf",                 "<therefore>",  0x2234  },
+       { "3d",                 "<therefore>",  0x2234  },
        { "or",                 "|",            0x007c  },
 
        /* Mathematicals. */
@@ -187,8 +188,8 @@ static struct ln lines[] = {
        { "tmu",                "x",            0x00d7  },
        { "c*",                 "O\bx",         0x2297  },
        { "c+",                 "O\b+",         0x2295  },
-       { "di",                 "-:-",          0x00f7  },
-       { "tdi",                "-:-",          0x00f7  },
+       { "di",                 "/",            0x00f7  },
+       { "tdi",                "/",            0x00f7  },
        { "f/",                 "/",            0x2044  },
        { "**",                 "*",            0x2217  },
        { "<=",                 "<=",           0x2264  },
@@ -204,41 +205,50 @@ static struct ln lines[] = {
        { "=~",                 "=~",           0x2245  },
        { "~~",                 "~~",           0x2248  },
        { "~=",                 "~=",           0x2248  },
-       { "pt",                 "oc",           0x221d  },
+       { "pt",                 "<proportional\037to>", 0x221d },
        { "es",                 "{}",           0x2205  },
-       { "mo",                 "E",            0x2208  },
-       { "nm",                 "!E",           0x2209  },
-       { "sb",                 "(=",           0x2282  },
-       { "nb",                 "(!=",          0x2284  },
-       { "sp",                 "=)",           0x2283  },
-       { "nc",                 "!=)",          0x2285  },
-       { "ib",                 "(=\b_",        0x2286  },
-       { "ip",                 "=\b_)",        0x2287  },
-       { "ca",                 "(^)",          0x2229  },
-       { "cu",                 "U",            0x222a  },
-       { "/_",                 "_\b/",         0x2220  },
-       { "pp",                 "_\b|",         0x22a5  },
-       { "is",                 "'\b,\bI",      0x222b  },
-       { "integral",           "'\b,\bI",      0x222b  },
-       { "sum",                "E",            0x2211  },
-       { "product",            "TT",           0x220f  },
-       { "coproduct",          "U",            0x2210  },
-       { "gr",                 "V",            0x2207  },
-       { "sr",                 "\\/",          0x221a  },
-       { "sqrt",               "\\/",          0x221a  },
+       { "mo",                 "<element\037of>", 0x2208 },
+       { "nm",                 "<not\037element\037of>", 0x2209 },
+       { "sb",                 "<proper\037subset>", 0x2282 },
+       { "nb",                 "<not\037subset>", 0x2284 },
+       { "sp",                 "<proper\037superset>", 0x2283 },
+       { "nc",                 "<not\037superset>", 0x2285 },
+       { "ib",                 "<subset\037or\037equal>", 0x2286 },
+       { "ip",                 "<superset\037or\037equal>", 0x2287 },
+       { "ca",                 "<intersection>", 0x2229 },
+       { "cu",                 "<union>",      0x222a  },
+       { "/_",                 "<angle>",      0x2220  },
+       { "pp",                 "<perpendicular>", 0x22a5 },
+       { "is",                 "<integral>",   0x222b  },
+       { "integral",           "<integral>",   0x222b  },
+       { "sum",                "<sum>",        0x2211  },
+       { "product",            "<product>",    0x220f  },
+       { "coproduct",          "<coproduct>",  0x2210  },
+       { "gr",                 "<nabla>",      0x2207  },
+       { "sr",                 "<sqrt>",       0x221a  },
+       { "sqrt",               "<sqrt>",       0x221a  },
        { "lc",                 "|~",           0x2308  },
        { "rc",                 "~|",           0x2309  },
        { "lf",                 "|_",           0x230a  },
        { "rf",                 "_|",           0x230b  },
-       { "if",                 "oo",           0x221e  },
-       { "Ah",                 "N",            0x2135  },
-       { "Im",                 "I",            0x2111  },
-       { "Re",                 "R",            0x211c  },
-       { "pd",                 "a",            0x2202  },
+       { "if",                 "<infinity>",   0x221e  },
+       { "Ah",                 "<Aleph>",      0x2135  },
+       { "Im",                 "<Im>",         0x2111  },
+       { "Re",                 "<Re>",         0x211c  },
+       { "wp",                 "p",            0x2118  },
+       { "pd",                 "<del>",        0x2202  },
        { "-h",                 "/h",           0x210f  },
+       { "hbar",               "/h",           0x210f  },
        { "12",                 "1/2",          0x00bd  },
        { "14",                 "1/4",          0x00bc  },
        { "34",                 "3/4",          0x00be  },
+       { "18",                 "1/8",          0x215B  },
+       { "38",                 "3/8",          0x215C  },
+       { "58",                 "5/8",          0x215D  },
+       { "78",                 "7/8",          0x215E  },
+       { "S1",                 "^1",           0x00B9  },
+       { "S2",                 "^2",           0x00B2  },
+       { "S3",                 "^3",           0x00B3  },
 
        /* Ligatures. */
        { "ff",                 "ff",           0xfb00  },
@@ -272,6 +282,7 @@ static struct ln lines[] = {
        { "ho",                 ",",            0x02db  },
        { "ha",                 "^",            0x005e  },
        { "ti",                 "~",            0x007e  },
+       { "u02DC",              "~",            0x02dc  },
 
        /* Accented letters. */
        { "'A",                 "'\bA",         0x00c1  },
@@ -279,11 +290,13 @@ static struct ln lines[] = {
        { "'I",                 "'\bI",         0x00cd  },
        { "'O",                 "'\bO",         0x00d3  },
        { "'U",                 "'\bU",         0x00da  },
+       { "'Y",                 "'\bY",         0x00dd  },
        { "'a",                 "'\ba",         0x00e1  },
        { "'e",                 "'\be",         0x00e9  },
        { "'i",                 "'\bi",         0x00ed  },
        { "'o",                 "'\bo",         0x00f3  },
        { "'u",                 "'\bu",         0x00fa  },
+       { "'y",                 "'\by",         0x00fd  },
        { "`A",                 "`\bA",         0x00c0  },
        { "`E",                 "`\bE",         0x00c8  },
        { "`I",                 "`\bI",         0x00cc  },
@@ -331,8 +344,8 @@ static struct ln lines[] = {
        { "oa",                 "o\ba",         0x00e5  },
 
        /* Special letters. */
-       { "-D",                 "-\bD",         0x00d0  },
-       { "Sd",                 "d",            0x00f0  },
+       { "-D",                 "Dh",           0x00d0  },
+       { "Sd",                 "dh",           0x00f0  },
        { "TP",                 "Th",           0x00de  },
        { "Tp",                 "th",           0x00fe  },
        { ".i",                 "i",            0x0131  },
@@ -344,71 +357,73 @@ static struct ln lines[] = {
        { "Eu",                 "EUR",          0x20ac  },
        { "eu",                 "EUR",          0x20ac  },
        { "Ye",                 "=\bY",         0x00a5  },
-       { "Po",                 "GBP",          0x00a3  },
+       { "Po",                 "-\bL",         0x00a3  },
        { "Cs",                 "o\bx",         0x00a4  },
        { "Fn",                 ",\bf",         0x0192  },
 
        /* Units. */
-       { "de",                 "<deg>",        0x00b0  },
-       { "%0",                 "%o",           0x2030  },
+       { "de",                 "<degree>",     0x00b0  },
+       { "%0",                 "<permille>",   0x2030  },
        { "fm",                 "\'",           0x2032  },
        { "sd",                 "''",           0x2033  },
-       { "mc",                 ",\bu",         0x00b5  },
+       { "mc",                 "<micro>",      0x00b5  },
+       { "Of",                 "_\ba",         0x00aa  },
+       { "Om",                 "_\bo",         0x00ba  },
 
        /* Greek characters. */
        { "*A",                 "A",            0x0391  },
        { "*B",                 "B",            0x0392  },
-       { "*G",                 "G",            0x0393  },
-       { "*D",                 "_\b/_\b\\",    0x0394  },
+       { "*G",                 "<Gamma>",      0x0393  },
+       { "*D",                 "<Delta>",      0x0394  },
        { "*E",                 "E",            0x0395  },
        { "*Z",                 "Z",            0x0396  },
        { "*Y",                 "H",            0x0397  },
-       { "*H",                 "-\bO",         0x0398  },
+       { "*H",                 "<Theta>",      0x0398  },
        { "*I",                 "I",            0x0399  },
        { "*K",                 "K",            0x039a  },
-       { "*L",                 "/\\",          0x039b  },
+       { "*L",                 "<Lambda>",     0x039b  },
        { "*M",                 "M",            0x039c  },
        { "*N",                 "N",            0x039d  },
-       { "*C",                 "_\bH",         0x039e  },
+       { "*C",                 "<Xi>",         0x039e  },
        { "*O",                 "O",            0x039f  },
-       { "*P",                 "TT",           0x03a0  },
+       { "*P",                 "<Pi>",         0x03a0  },
        { "*R",                 "P",            0x03a1  },
-       { "*S",                 "S",            0x03a3  },
+       { "*S",                 "<Sigma>",      0x03a3  },
        { "*T",                 "T",            0x03a4  },
        { "*U",                 "Y",            0x03a5  },
-       { "*F",                 "I\bO",         0x03a6  },
+       { "*F",                 "<Phi>",        0x03a6  },
        { "*X",                 "X",            0x03a7  },
-       { "*Q",                 "I\bY",         0x03a8  },
-       { "*W",                 "_\bO",         0x03a9  },
-       { "*a",                 "a",            0x03b1  },
-       { "*b",                 "B",            0x03b2  },
-       { "*g",                 "y",            0x03b3  },
-       { "*d",                 "d",            0x03b4  },
-       { "*e",                 "e",            0x03b5  },
-       { "*z",                 ",\bC",         0x03b6  },
-       { "*y",                 "n",            0x03b7  },
-       { "*h",                 "-\b0",         0x03b8  },
-       { "*i",                 "i",            0x03b9  },
-       { "*k",                 "k",            0x03ba  },
-       { "*l",                 ">\b\\",        0x03bb  },
-       { "*m",                 ",\bu",         0x03bc  },
-       { "*n",                 "v",            0x03bd  },
-       { "*c",                 ",\bE",         0x03be  },
+       { "*Q",                 "<Psi>",        0x03a8  },
+       { "*W",                 "<Omega>",      0x03a9  },
+       { "*a",                 "<alpha>",      0x03b1  },
+       { "*b",                 "<beta>",       0x03b2  },
+       { "*g",                 "<gamma>",      0x03b3  },
+       { "*d",                 "<delta>",      0x03b4  },
+       { "*e",                 "<epsilon>",    0x03b5  },
+       { "*z",                 "<zeta>",       0x03b6  },
+       { "*y",                 "<eta>",        0x03b7  },
+       { "*h",                 "<theta>",      0x03b8  },
+       { "*i",                 "<iota>",       0x03b9  },
+       { "*k",                 "<kappa>",      0x03ba  },
+       { "*l",                 "<lambda>",     0x03bb  },
+       { "*m",                 "<mu>",         0x03bc  },
+       { "*n",                 "<nu>",         0x03bd  },
+       { "*c",                 "<xi>",         0x03be  },
        { "*o",                 "o",            0x03bf  },
-       { "*p",                 "-\bn",         0x03c0  },
-       { "*r",                 "p",            0x03c1  },
-       { "*s",                 "-\bo",         0x03c3  },
-       { "*t",                 "~\bt",         0x03c4  },
-       { "*u",                 "u",            0x03c5  },
-       { "*f",                 "|\bo",         0x03d5  },
-       { "*x",                 "x",            0x03c7  },
-       { "*q",                 "|\bu",         0x03c8  },
-       { "*w",                 "w",            0x03c9  },
-       { "+h",                 "-\b0",         0x03d1  },
-       { "+f",                 "|\bo",         0x03c6  },
-       { "+p",                 "-\bw",         0x03d6  },
-       { "+e",                 "e",            0x03f5  },
-       { "ts",                 "s",            0x03c2  },
+       { "*p",                 "<pi>",         0x03c0  },
+       { "*r",                 "<rho>",        0x03c1  },
+       { "*s",                 "<sigma>",      0x03c3  },
+       { "*t",                 "<tau>",        0x03c4  },
+       { "*u",                 "<upsilon>",    0x03c5  },
+       { "*f",                 "<phi>",        0x03d5  },
+       { "*x",                 "<chi>",        0x03c7  },
+       { "*q",                 "<psi>",        0x03c8  },
+       { "*w",                 "<omega>",      0x03c9  },
+       { "+h",                 "<theta>",      0x03d1  },
+       { "+f",                 "<phi>",        0x03c6  },
+       { "+p",                 "<pi>",         0x03d6  },
+       { "+e",                 "<epsilon>",    0x03f5  },
+       { "ts",                 "<sigma>",      0x03c2  },
 };
 
 static struct ohash      mchars;
@@ -443,7 +458,7 @@ mchars_spec2cp(const char *p, size_t sz)
 
        end = p + sz;
        ln = ohash_find(&mchars, ohash_qlookupi(&mchars, p, &end));
-       return ln != NULL ? ln->unicode : sz == 1 ? (unsigned char)*p : -1;
+       return ln != NULL ? ln->unicode : -1;
 }
 
 int
@@ -473,10 +488,8 @@ mchars_spec2str(const char *p, size_t sz, size_t *rsz)
 
        end = p + sz;
        ln = ohash_find(&mchars, ohash_qlookupi(&mchars, p, &end));
-       if (ln == NULL) {
-               *rsz = 1;
-               return sz == 1 ? p : NULL;
-       }
+       if (ln == NULL)
+               return NULL;
 
        *rsz = strlen(ln->ascii);
        return ln->ascii;