git.cameronkatri.com Git - mandoc.git/blobdiff - mdoc_validate.c
The .Dd and .TH macros must interrupt .ce, too;
[mandoc.git] / mdoc_validate.c
index da9be6d113589f7b2285a5ba077bb82197dbb73e..e968c7ec91508ffa6ab9b08c52b4b4e4ad4bbc7b 100644 (file)
@@ -1,4 +1,4 @@
-/*     $Id: mdoc_validate.c,v 1.342 2017/06/24 18:58:33 schwarze Exp $ */
+/*     $Id: mdoc_validate.c,v 1.348 2017/07/03 17:33:06 schwarze Exp $ */
 /*
  * Copyright (c) 2008-2012 Kristaps Dzonsons <kristaps@bsd.lv>
  * Copyright (c) 2010-2017 Ingo Schwarze <schwarze@openbsd.org>
@@ -33,6 +33,7 @@
 
 #include "mandoc_aux.h"
 #include "mandoc.h"
+#include "mandoc_xr.h"
 #include "roff.h"
 #include "mdoc.h"
 #include "libmandoc.h"
@@ -60,6 +61,7 @@ static        void     check_toptext(struct roff_man *, int, int, const char *);
 static int      child_an(const struct roff_node *);
 static size_t          macro2len(enum roff_tok);
 static void     rewrite_macro2len(struct roff_man *, char **);
+static int      similar(const char *, const char *);
 
 static void     post_an(POST_ARGS);
 static void     post_an_norm(POST_ARGS);
@@ -76,6 +78,7 @@ static        void     post_defaults(POST_ARGS);
 static void     post_display(POST_ARGS);
 static void     post_dd(POST_ARGS);
 static void     post_delim(POST_ARGS);
+static void     post_delim_nb(POST_ARGS);
 static void     post_dt(POST_ARGS);
 static void     post_en(POST_ARGS);
 static void     post_es(POST_ARGS);
@@ -107,6 +110,7 @@ static      void     post_sh_authors(POST_ARGS);
 static void     post_sm(POST_ARGS);
 static void     post_st(POST_ARGS);
 static void     post_std(POST_ARGS);
+static void     post_sx(POST_ARGS);
 static void     post_useless(POST_ARGS);
 static void     post_xr(POST_ARGS);
 static void     post_xx(POST_ARGS);
@@ -125,33 +129,33 @@ static    const v_post __mdoc_valids[MDOC_MAX - MDOC_Dd] = {
        post_bl,        /* Bl */
        NULL,           /* El */
        post_it,        /* It */
-       post_delim,     /* Ad */
+       post_delim_nb,  /* Ad */
        post_an,        /* An */
        NULL,           /* Ap */
        post_defaults,  /* Ar */
        NULL,           /* Cd */
-       post_delim,     /* Cm */
-       post_delim,     /* Dv */
-       post_delim,     /* Er */
-       post_delim,     /* Ev */
+       post_delim_nb,  /* Cm */
+       post_delim_nb,  /* Dv */
+       post_delim_nb,  /* Er */
+       post_delim_nb,  /* Ev */
        post_ex,        /* Ex */
        post_fa,        /* Fa */
        NULL,           /* Fd */
-       post_delim,     /* Fl */
+       post_delim_nb,  /* Fl */
        post_fn,        /* Fn */
-       post_delim,     /* Ft */
-       post_delim,     /* Ic */
-       post_delim,     /* In */
+       post_delim_nb,  /* Ft */
+       post_delim_nb,  /* Ic */
+       post_delim_nb,  /* In */
        post_defaults,  /* Li */
        post_nd,        /* Nd */
        post_nm,        /* Nm */
-       post_delim,     /* Op */
+       post_delim_nb,  /* Op */
        post_obsolete,  /* Ot */
        post_defaults,  /* Pa */
        post_rv,        /* Rv */
        post_st,        /* St */
-       post_delim,     /* Va */
-       post_delim,     /* Vt */
+       post_delim_nb,  /* Va */
+       post_delim_nb,  /* Vt */
        post_xr,        /* Xr */
        NULL,           /* %A */
        post_hyph,      /* %B */ /* FIXME: can be used outside Rs/Re. */
@@ -165,12 +169,12 @@ static    const v_post __mdoc_valids[MDOC_MAX - MDOC_Dd] = {
        post_hyph,      /* %T */ /* FIXME: can be used outside Rs/Re. */
        NULL,           /* %V */
        NULL,           /* Ac */
-       post_delim,     /* Ao */
-       post_delim,     /* Aq */
+       post_delim_nb,  /* Ao */
+       post_delim_nb,  /* Aq */
        post_at,        /* At */
        NULL,           /* Bc */
        post_bf,        /* Bf */
-       post_delim,     /* Bo */
+       post_delim_nb,  /* Bo */
        NULL,           /* Bq */
        post_xx,        /* Bsx */
        post_bx,        /* Bx */
@@ -180,37 +184,37 @@ static    const v_post __mdoc_valids[MDOC_MAX - MDOC_Dd] = {
        NULL,           /* Dq */
        NULL,           /* Ec */
        NULL,           /* Ef */
-       post_delim,     /* Em */
+       post_delim_nb,  /* Em */
        NULL,           /* Eo */
        post_xx,        /* Fx */
-       post_delim,     /* Ms */
+       post_delim_nb,  /* Ms */
        NULL,           /* No */
        post_ns,        /* Ns */
        post_xx,        /* Nx */
        post_xx,        /* Ox */
        NULL,           /* Pc */
        NULL,           /* Pf */
-       post_delim,     /* Po */
-       post_delim,     /* Pq */
+       post_delim_nb,  /* Po */
+       post_delim_nb,  /* Pq */
        NULL,           /* Qc */
-       post_delim,     /* Ql */
-       post_delim,     /* Qo */
-       post_delim,     /* Qq */
+       post_delim_nb,  /* Ql */
+       post_delim_nb,  /* Qo */
+       post_delim_nb,  /* Qq */
        NULL,           /* Re */
        post_rs,        /* Rs */
        NULL,           /* Sc */
-       post_delim,     /* So */
-       post_delim,     /* Sq */
+       post_delim_nb,  /* So */
+       post_delim_nb,  /* Sq */
        post_sm,        /* Sm */
-       post_hyph,      /* Sx */
-       post_delim,     /* Sy */
+       post_sx,        /* Sx */
+       post_delim_nb,  /* Sy */
        post_useless,   /* Tn */
        post_xx,        /* Ux */
        NULL,           /* Xc */
        NULL,           /* Xo */
        post_fo,        /* Fo */
        NULL,           /* Fc */
-       post_delim,     /* Oo */
+       post_delim_nb,  /* Oo */
        NULL,           /* Oc */
        post_bk,        /* Bk */
        NULL,           /* Ek */
@@ -220,10 +224,10 @@ static    const v_post __mdoc_valids[MDOC_MAX - MDOC_Dd] = {
        post_eoln,      /* Ud */
        post_lb,        /* Lb */
        post_par,       /* Lp */
-       post_delim,     /* Lk */
+       post_delim_nb,  /* Lk */
        post_defaults,  /* Mt */
-       post_delim,     /* Brq */
-       post_delim,     /* Bro */
+       post_delim_nb,  /* Brq */
+       post_delim_nb,  /* Bro */
        NULL,           /* Brc */
        NULL,           /* %C */
        post_es,        /* Es */
@@ -427,6 +431,34 @@ check_toptext(struct roff_man *mdoc, int ln, int pos, const char *p)
 
 static void
 post_delim(POST_ARGS)
+{
+       const struct roff_node  *nch;
+       const char              *lc;
+       enum mdelim              delim;
+       enum roff_tok            tok;
+
+       tok = mdoc->last->tok;
+       nch = mdoc->last->last;
+       if (nch == NULL || nch->type != ROFFT_TEXT)
+               return;
+       lc = strchr(nch->string, '\0') - 1;
+       if (lc < nch->string)
+               return;
+       delim = mdoc_isdelim(lc);
+       if (delim == DELIM_NONE || delim == DELIM_OPEN)
+               return;
+       if (*lc == ')' && (tok == MDOC_Nd || tok == MDOC_Sh ||
+           tok == MDOC_Ss || tok == MDOC_Fo))
+               return;
+
+       mandoc_vmsg(MANDOCERR_DELIM, mdoc->parse,
+           nch->line, nch->pos + (lc - nch->string),
+           "%s%s %s", roff_name[tok],
+           nch == mdoc->last->child ? "" : " ...", nch->string);
+}
+
+static void
+post_delim_nb(POST_ARGS)
 {
        const struct roff_node  *nch;
        const char              *lc, *cp;
@@ -514,7 +546,7 @@ post_delim(POST_ARGS)
                }
        }
 
-       mandoc_vmsg(MANDOCERR_DELIM, mdoc->parse,
+       mandoc_vmsg(MANDOCERR_DELIM_NB, mdoc->parse,
            nch->line, nch->pos + (lc - nch->string),
            "%s%s %s", roff_name[tok],
            nch == mdoc->last->child ? "" : " ...", nch->string);
@@ -895,7 +927,7 @@ post_lb(POST_ARGS)
        struct roff_node        *n;
        const char              *p;
 
-       post_delim(mdoc);
+       post_delim_nb(mdoc);
 
        n = mdoc->last;
        assert(n->child->type == ROFFT_TEXT);
@@ -966,6 +998,8 @@ post_std(POST_ARGS)
 {
        struct roff_node *n;
 
+       post_delim(mdoc);
+
        n = mdoc->last;
        if (n->args && n->args->argc == 1)
                if (n->args->argv[0].arg == MDOC_Std)
@@ -1102,6 +1136,8 @@ post_fname(POST_ARGS)
        if ( ! (cp[0] == '\0' || (cp[0] == '(' && cp[1] == '*')))
                mandoc_msg(MANDOCERR_FN_PAREN, mdoc->parse,
                    n->line, n->pos + pos, n->string);
+       if (n->sec == SEC_SYNOPSIS && mdoc->meta.msec != NULL)
+               mandoc_xr_add(mdoc->meta.msec, n->string, -1, -1);
 }
 
 static void
@@ -1133,7 +1169,8 @@ post_fo(POST_ARGS)
                    "Fo ... %s", n->child->next->string);
                while (n->child != n->last)
                        roff_node_delete(mdoc, n->last);
-       }
+       } else
+               post_delim(mdoc);
 
        post_fname(mdoc);
 }
@@ -1157,7 +1194,7 @@ post_fa(POST_ARGS)
                        break;
                }
        }
-       post_delim(mdoc);
+       post_delim_nb(mdoc);
 }
 
 static void
@@ -1167,6 +1204,11 @@ post_nm(POST_ARGS)
 
        n = mdoc->last;
 
+       if ((n->sec == SEC_NAME || n->sec == SEC_SYNOPSIS) &&
+           n->child != NULL && n->child->type == ROFFT_TEXT &&
+           mdoc->meta.msec != NULL)
+               mandoc_xr_add(mdoc->meta.msec, n->child->string, -1, -1);
+
        if (n->last != NULL &&
            (n->last->tok == MDOC_Pp ||
             n->last->tok == MDOC_Lp))
@@ -1180,11 +1222,18 @@ post_nm(POST_ARGS)
                mandoc_msg(MANDOCERR_NM_NONAME, mdoc->parse,
                    n->line, n->pos, "Nm");
 
-       if (n->type == ROFFT_ELEM)
+       switch (n->type) {
+       case ROFFT_ELEM:
+               post_delim_nb(mdoc);
+               break;
+       case ROFFT_HEAD:
                post_delim(mdoc);
+               break;
+       default:
+               return;
+       }
 
-       if ((n->type != ROFFT_ELEM && n->type != ROFFT_HEAD) ||
-           (n->child != NULL && n->child->type == ROFFT_TEXT) ||
+       if ((n->child != NULL && n->child->type == ROFFT_TEXT) ||
            mdoc->meta.name == NULL)
                return;
 
@@ -1198,7 +1247,6 @@ static void
 post_nd(POST_ARGS)
 {
        struct roff_node        *n;
-       size_t                   sz;
 
        n = mdoc->last;
 
@@ -1212,11 +1260,8 @@ post_nd(POST_ARGS)
        if (n->child == NULL)
                mandoc_msg(MANDOCERR_ND_EMPTY, mdoc->parse,
                    n->line, n->pos, "Nd");
-       else if (n->last->type == ROFFT_TEXT &&
-           (sz = strlen(n->last->string)) != 0 &&
-           n->last->string[sz - 1] == '.')
-               mandoc_msg(MANDOCERR_ND_DOT, mdoc->parse,
-                   n->last->line, n->last->pos + sz - 1, NULL);
+       else
+               post_delim(mdoc);
 
        post_hyph(mdoc);
 }
@@ -1274,7 +1319,7 @@ post_defaults(POST_ARGS)
        struct roff_node *nn;
 
        if (mdoc->last->child != NULL) {
-               post_delim(mdoc);
+               post_delim_nb(mdoc);
                return;
        }
 
@@ -1349,7 +1394,7 @@ post_an(POST_ARGS)
                        mandoc_msg(MANDOCERR_MACRO_EMPTY, mdoc->parse,
                            np->line, np->pos, "An");
                else
-                       post_delim(mdoc);
+                       post_delim_nb(mdoc);
        } else if (nch != NULL)
                mandoc_vmsg(MANDOCERR_ARG_EXCESS, mdoc->parse,
                    nch->line, nch->pos, "An ... %s", nch->string);
@@ -1378,7 +1423,7 @@ post_xx(POST_ARGS)
        struct roff_node        *n;
        const char              *os;
 
-       post_delim(mdoc);
+       post_delim_nb(mdoc);
 
        n = mdoc->last;
        switch (n->tok) {
@@ -1459,15 +1504,30 @@ post_it(POST_ARGS)
 
                assert(nit->head->child == NULL);
 
-               i = 0;
-               for (nch = nit->child; nch != NULL; nch = nch->next)
-                       if (nch->type == ROFFT_BODY)
-                               i++;
+               if (nit->head->next->child == NULL &&
+                   nit->head->next->next == NULL) {
+                       mandoc_msg(MANDOCERR_MACRO_EMPTY, mdoc->parse,
+                           nit->line, nit->pos, "It");
+                       roff_node_delete(mdoc, nit);
+                       break;
+               }
 
+               i = 0;
+               for (nch = nit->child; nch != NULL; nch = nch->next) {
+                       if (nch->type != ROFFT_BODY)
+                               continue;
+                       if (i++ && nch->flags & NODE_LINE)
+                               mandoc_msg(MANDOCERR_TA_LINE, mdoc->parse,
+                                   nch->line, nch->pos, "Ta");
+               }
                if (i < cols || i > cols + 1)
                        mandoc_vmsg(MANDOCERR_BL_COL,
                            mdoc->parse, nit->line, nit->pos,
                            "%d columns, %d cells", cols, i);
+               else if (nit->head->next->child != NULL &&
+                   nit->head->next->child->line > nit->line)
+                       mandoc_msg(MANDOCERR_IT_NOARG, mdoc->parse,
+                           nit->line, nit->pos, "Bl -column It");
                break;
        default:
                abort();
@@ -1982,10 +2042,20 @@ post_hyph(POST_ARGS)
 static void
 post_ns(POST_ARGS)
 {
+       struct roff_node        *n;
 
-       if (mdoc->last->flags & NODE_LINE)
+       n = mdoc->last;
+       if (n->flags & NODE_LINE ||
+           (n->next != NULL && n->next->flags & NODE_DELIMC))
                mandoc_msg(MANDOCERR_NS_SKIP, mdoc->parse,
-                   mdoc->last->line, mdoc->last->pos, NULL);
+                   n->line, n->pos, NULL);
+}
+
+static void
+post_sx(POST_ARGS)
+{
+       post_delim(mdoc);
+       post_hyph(mdoc);
 }
 
 static void
@@ -2148,11 +2218,54 @@ post_sh_authors(POST_ARGS)
                    mdoc->last->line, mdoc->last->pos, NULL);
 }
 
+/*
+ * Return an upper bound for the string distance (allowing
+ * transpositions).  Not a full Levenshtein implementation
+ * because Levenshtein is quadratic in the string length
+ * and this function is called for every standard name,
+ * so the check for each custom name would be cubic.
+ * The following crude heuristic is linear, resulting
+ * in quadratic behaviour for checking one custom name,
+ * which does not cause measurable slowdown.
+ */
+static int
+similar(const char *s1, const char *s2)
+{
+       const int       maxdist = 3;
+       int             dist = 0;
+
+       while (s1[0] != '\0' && s2[0] != '\0') {
+               if (s1[0] == s2[0]) {
+                       s1++;
+                       s2++;
+                       continue;
+               }
+               if (++dist > maxdist)
+                       return INT_MAX;
+               if (s1[1] == s2[1]) {  /* replacement */
+                       s1++;
+                       s2++;
+               } else if (s1[0] == s2[1] && s1[1] == s2[0]) {
+                       s1 += 2;        /* transposition */
+                       s2 += 2;
+               } else if (s1[0] == s2[1])  /* insertion */
+                       s2++;
+               else if (s1[1] == s2[0])  /* deletion */
+                       s1++;
+               else
+                       return INT_MAX;
+       }
+       dist += strlen(s1) + strlen(s2);
+       return dist > maxdist ? INT_MAX : dist;
+}
+
 static void
 post_sh_head(POST_ARGS)
 {
        struct roff_node        *nch;
        const char              *goodsec;
+       const char *const       *testsec;
+       int                      dist, mindist;
        enum roff_sec            sec;
 
        /*
@@ -2190,8 +2303,25 @@ post_sh_head(POST_ARGS)
 
        /* We don't care about custom sections after this. */
 
-       if (sec == SEC_CUSTOM)
+       if (sec == SEC_CUSTOM) {
+               if ((nch = mdoc->last->child) == NULL ||
+                   nch->type != ROFFT_TEXT || nch->next != NULL)
+                       return;
+               goodsec = NULL;
+               mindist = INT_MAX;
+               for (testsec = secnames + 1; *testsec != NULL; testsec++) {
+                       dist = similar(nch->string, *testsec);
+                       if (dist < mindist) {
+                               goodsec = *testsec;
+                               mindist = dist;
+                       }
+               }
+               if (goodsec != NULL)
+                       mandoc_vmsg(MANDOCERR_SEC_TYPO, mdoc->parse,
+                           nch->line, nch->pos, "Sh %s instead of %s",
+                           nch->string, goodsec);
                return;
+       }
 
        /*
         * Check whether our non-custom section is being repeated or is
@@ -2257,9 +2387,15 @@ post_xr(POST_ARGS)
        if (nch->next == NULL) {
                mandoc_vmsg(MANDOCERR_XR_NOSEC, mdoc->parse,
                    n->line, n->pos, "Xr %s", nch->string);
-       } else
+       } else {
                assert(nch->next == n->last);
-       post_delim(mdoc);
+               if(mandoc_xr_add(nch->next->string, nch->string,
+                   nch->line, nch->pos))
+                       mandoc_vmsg(MANDOCERR_XR_SELF, mdoc->parse,
+                           nch->line, nch->pos, "Xr %s %s",
+                           nch->string, nch->next->string);
+       }
+       post_delim_nb(mdoc);
 }
 
 static void
@@ -2272,6 +2408,7 @@ post_ignpar(POST_ARGS)
                post_prevpar(mdoc);
                return;
        case ROFFT_HEAD:
+               post_delim(mdoc);
                post_hyph(mdoc);
                return;
        case ROFFT_BODY:
@@ -2508,7 +2645,7 @@ post_bx(POST_ARGS)
        struct roff_node        *n, *nch;
        const char              *macro;
 
-       post_delim(mdoc);
+       post_delim_nb(mdoc);
 
        n = mdoc->last;
        nch = n->child;
@@ -2574,6 +2711,8 @@ post_os(POST_ARGS)
                mandoc_msg(MANDOCERR_PROLOG_LATE, mdoc->parse,
                    n->line, n->pos, "Os");
 
+       post_delim(mdoc);
+
        /*
         * Set the operating system by way of the `Os' macro.
         * The order of precedence is: