git.cameronkatri.com Git - mandoc.git/blobdiff - man_html.c
In HTML output, avoid printing a newline right after <pre>
[mandoc.git] / man_html.c
index 0eb482b0e55c27b6e4c8a23a1c433969679b5b1a..147c20e46443118f00cbacd8609b713254452b48 100644 (file)
@@ -1,7 +1,7 @@
-/*     $Id: man_html.c,v 1.165 2019/01/05 21:55:11 schwarze Exp $ */
+/* $Id: man_html.c,v 1.179 2020/10/16 17:22:43 schwarze Exp $ */
 /*
+ * Copyright (c) 2013-2015, 2017-2020 Ingo Schwarze <schwarze@openbsd.org>
  * Copyright (c) 2008-2012, 2014 Kristaps Dzonsons <kristaps@bsd.lv>
- * Copyright (c) 2013-2015, 2017-2019 Ingo Schwarze <schwarze@openbsd.org>
  *
  * Permission to use, copy, modify, and distribute this software for any
  * purpose with or without fee is hereby granted, provided that the above
@@ -14,6 +14,8 @@
  * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
  * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
  * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
+ *
+ * HTML formatter for man(7) used by mandoc(1).
  */
 #include "config.h"
 
@@ -34,7 +36,7 @@
 #include "main.h"
 
 #define        MAN_ARGS          const struct roff_meta *man, \
-                         const struct roff_node *n, \
+                         struct roff_node *n, \
                          struct html *h
 
 struct man_html_act {
@@ -42,14 +44,13 @@ struct      man_html_act {
        int             (*post)(MAN_ARGS);
 };
 
-static void              print_bvspace(struct html *,
-                               const struct roff_node *);
 static void              print_man_head(const struct roff_meta *,
                                struct html *);
 static void              print_man_nodelist(MAN_ARGS);
 static void              print_man_node(MAN_ARGS);
+static char              list_continues(const struct roff_node *,
+                               const struct roff_node *);
 static int               man_B_pre(MAN_ARGS);
-static int               man_HP_pre(MAN_ARGS);
 static int               man_IP_pre(MAN_ARGS);
 static int               man_I_pre(MAN_ARGS);
 static int               man_OP_pre(MAN_ARGS);
@@ -57,7 +58,6 @@ static        int               man_PP_pre(MAN_ARGS);
 static int               man_RS_pre(MAN_ARGS);
 static int               man_SH_pre(MAN_ARGS);
 static int               man_SM_pre(MAN_ARGS);
-static int               man_SS_pre(MAN_ARGS);
 static int               man_SY_pre(MAN_ARGS);
 static int               man_UR_pre(MAN_ARGS);
 static int               man_abort_pre(MAN_ARGS);
@@ -72,14 +72,14 @@ static      void              man_root_pre(const struct roff_meta *,
 static const struct man_html_act man_html_acts[MAN_MAX - MAN_TH] = {
        { NULL, NULL }, /* TH */
        { man_SH_pre, NULL }, /* SH */
-       { man_SS_pre, NULL }, /* SS */
+       { man_SH_pre, NULL }, /* SS */
        { man_IP_pre, NULL }, /* TP */
        { man_IP_pre, NULL }, /* TQ */
        { man_abort_pre, NULL }, /* LP */
        { man_PP_pre, NULL }, /* PP */
        { man_abort_pre, NULL }, /* P */
        { man_IP_pre, NULL }, /* IP */
-       { man_HP_pre, NULL }, /* HP */
+       { man_PP_pre, NULL }, /* HP */
        { man_SM_pre, NULL }, /* SM */
        { man_SM_pre, NULL }, /* SB */
        { man_alt_pre, NULL }, /* BI */
@@ -110,27 +110,6 @@ static     const struct man_html_act man_html_acts[MAN_MAX - MAN_TH] = {
 };
 
 
-/*
- * Printing leading vertical space before a block.
- * This is used for the paragraph macros.
- * The rules are pretty simple, since there's very little nesting going
- * on here.  Basically, if we're the first within another block (SS/SH),
- * then don't emit vertical space.  If we are (RS), then do.  If not the
- * first, print it.
- */
-static void
-print_bvspace(struct html *h, const struct roff_node *n)
-{
-       if (n->body != NULL && n->body->child != NULL &&
-           n->body->child->type == ROFFT_TBL)
-               return;
-
-       if (n->prev == NULL && n->parent->tok != MAN_RS)
-               return;
-
-       print_paragraph(h);
-}
-
 void
 html_man(void *arg, const struct roff_meta *man)
 {
@@ -144,7 +123,7 @@ html_man(void *arg, const struct roff_meta *man)
        if ((h->oflags & HTML_FRAGMENT) == 0) {
                print_gen_decls(h);
                print_otag(h, TAG_HTML, "");
-               if (n->type == ROFFT_COMMENT)
+               if (n != NULL && n->type == ROFFT_COMMENT)
                        print_gen_comment(h, n);
                t = print_otag(h, TAG_HEAD, "");
                print_man_head(man, h);
@@ -187,7 +166,15 @@ print_man_node(MAN_ARGS)
        struct tag      *t;
        int              child;
 
-       html_fillmode(h, n->flags & NODE_NOFILL ? ROFF_nf : ROFF_fi);
+       if (n->type == ROFFT_COMMENT || n->flags & NODE_NOPRT)
+               return;
+
+       if ((n->flags & NODE_NOFILL) == 0)
+               html_fillmode(h, ROFF_fi);
+       else if (html_fillmode(h, ROFF_nf) == ROFF_nf &&
+           n->tok != ROFF_fi && n->flags & NODE_LINE &&
+           (n->prev == NULL || n->prev->tok != MAN_YS))
+               print_endline(h);
 
        child = 1;
        switch (n->type) {
@@ -196,18 +183,18 @@ print_man_node(MAN_ARGS)
                        print_endline(h);
                        return;
                }
-               t = h->tag;
                if (*n->string == ' ' && n->flags & NODE_LINE &&
                    (h->flags & HTML_NONEWLINE) == 0)
-                       print_endline(h);
+                       print_otag(h, TAG_BR, "");
                else if (n->flags & NODE_DELIMC)
                        h->flags |= HTML_NOSPACE;
+               t = h->tag;
+               t->refcnt++;
                print_text(h, n->string);
                break;
-       case ROFFT_COMMENT:
-               return;
        case ROFFT_EQN:
                t = h->tag;
+               t->refcnt++;
                print_eqn(h, n->eqn);
                break;
        case ROFFT_TBL:
@@ -223,9 +210,9 @@ print_man_node(MAN_ARGS)
                 * Close out scope of font prior to opening a macro
                 * scope.
                 */
-               if (HTMLFONT_NONE != h->metac) {
+               if (h->metac != ESCAPE_FONTROMAN) {
                        h->metal = h->metac;
-                       h->metac = HTMLFONT_NONE;
+                       h->metac = ESCAPE_FONTROMAN;
                }
 
                /*
@@ -235,14 +222,14 @@ print_man_node(MAN_ARGS)
                 */
                if (h->tblt != NULL)
                        print_tblclose(h);
-
                t = h->tag;
+               t->refcnt++;
                if (n->tok < ROFF_MAX) {
                        roff_html_pre(h, n);
+                       t->refcnt--;
                        print_stagq(h, t);
                        return;
                }
-
                assert(n->tok >= MAN_TH && n->tok < MAN_MAX);
                if (man_html_acts[n->tok - MAN_TH].pre != NULL)
                        child = (*man_html_acts[n->tok - MAN_TH].pre)(man,
@@ -254,14 +241,23 @@ print_man_node(MAN_ARGS)
                print_man_nodelist(man, n->child, h);
 
        /* This will automatically close out any font scope. */
-       print_stagq(h, t);
-
-       if (n->flags & NODE_NOFILL && n->tok != MAN_YS &&
-           (n->next != NULL && n->next->flags & NODE_LINE)) {
-               /* In .nf = <pre>, print even empty lines. */
-               h->col++;
-               print_endline(h);
+       t->refcnt--;
+       if (n->type == ROFFT_BLOCK &&
+           (n->tok == MAN_IP || n->tok == MAN_TP || n->tok == MAN_TQ)) {
+               t = h->tag;
+               while (t->tag != TAG_DL && t->tag != TAG_UL)
+                       t = t->next;
+               /*
+                * Close the list if no further item of the same type
+                * follows; otherwise, close the item only.
+                */
+               if (list_continues(n, roff_node_next(n)) == '\0') {
+                       print_tagq(h, t);
+                       t = NULL;
+               }
        }
+       if (t != NULL)
+               print_stagq(h, t);
 }
 
 static void
@@ -313,13 +309,28 @@ man_root_post(const struct roff_meta *man, struct html *h)
 static int
 man_SH_pre(MAN_ARGS)
 {
-       char    *id;
-
-       if (n->type == ROFFT_HEAD) {
-               id = html_make_id(n, 1);
-               print_otag(h, TAG_H1, "cTi", "Sh", id);
-               if (id != NULL)
-                       print_otag(h, TAG_A, "chR", "permalink", id);
+       const char      *class;
+       enum htmltag     tag;
+
+       if (n->tok == MAN_SH) {
+               tag = TAG_H1;
+               class = "Sh";
+       } else {
+               tag = TAG_H2;
+               class = "Ss";
+       }
+       switch (n->type) {
+       case ROFFT_BLOCK:
+               html_close_paragraph(h);
+               print_otag(h, TAG_SECTION, "c", class);
+               break;
+       case ROFFT_HEAD:
+               print_otag_id(h, tag, class, n);
+               break;
+       case ROFFT_BODY:
+               break;
+       default:
+               abort();
        }
        return 1;
 }
@@ -380,45 +391,108 @@ man_SM_pre(MAN_ARGS)
 }
 
 static int
-man_SS_pre(MAN_ARGS)
+man_PP_pre(MAN_ARGS)
 {
-       char    *id;
-
-       if (n->type == ROFFT_HEAD) {
-               id = html_make_id(n, 1);
-               print_otag(h, TAG_H2, "cTi", "Ss", id);
-               if (id != NULL)
-                       print_otag(h, TAG_A, "chR", "permalink", id);
+       switch (n->type) {
+       case ROFFT_BLOCK:
+               html_close_paragraph(h);
+               break;
+       case ROFFT_HEAD:
+               return 0;
+       case ROFFT_BODY:
+               if (n->child != NULL &&
+                   (n->child->flags & NODE_NOFILL) == 0)
+                       print_otag(h, TAG_P, "c",
+                           n->tok == MAN_PP ? "Pp" : "Pp HP");
+               break;
+       default:
+               abort();
        }
        return 1;
 }
 
-static int
-man_PP_pre(MAN_ARGS)
+static char
+list_continues(const struct roff_node *n1, const struct roff_node *n2)
 {
-       if (n->type == ROFFT_HEAD)
-               return 0;
-       else if (n->type == ROFFT_BLOCK)
-               print_bvspace(h, n);
-
-       return 1;
+       const char *s1, *s2;
+       char c1, c2;
+
+       if (n1 == NULL || n1->type != ROFFT_BLOCK ||
+           n2 == NULL || n2->type != ROFFT_BLOCK)
+               return '\0';
+       if ((n1->tok == MAN_TP || n1->tok == MAN_TQ) &&
+           (n2->tok == MAN_TP || n2->tok == MAN_TQ))
+               return ' ';
+       if (n1->tok != MAN_IP || n2->tok != MAN_IP)
+               return '\0';
+       n1 = n1->head->child;
+       n2 = n2->head->child;
+       s1 = n1 == NULL ? "" : n1->string;
+       s2 = n2 == NULL ? "" : n2->string;
+       c1 = strcmp(s1, "*") == 0 ? '*' :
+            strcmp(s1, "\\-") == 0 ? '-' :
+            strcmp(s1, "\\(bu") == 0 ? 'b' : ' ';
+       c2 = strcmp(s2, "*") == 0 ? '*' :
+            strcmp(s2, "\\-") == 0 ? '-' :
+            strcmp(s2, "\\(bu") == 0 ? 'b' : ' ';
+       return c1 != c2 ? '\0' : c1 == 'b' ? '*' : c1;
 }
 
 static int
 man_IP_pre(MAN_ARGS)
 {
-       const struct roff_node  *nn;
+       struct roff_node        *nn;
+       const char              *list_class;
+       enum htmltag             list_elem, body_elem;
+       char                     list_type;
+
+       nn = n->type == ROFFT_BLOCK ? n : n->parent;
+       list_type = list_continues(roff_node_prev(nn), nn);
+       if (list_type == '\0') {
+               /* Start a new list. */
+               list_type = list_continues(nn, roff_node_next(nn));
+               if (list_type == '\0')
+                       list_type = ' ';
+               switch (list_type) {
+               case ' ':
+                       list_class = "Bl-tag";
+                       list_elem = TAG_DL;
+                       break;
+               case '*':
+                       list_class = "Bl-bullet";
+                       list_elem = TAG_UL;
+                       break;
+               case '-':
+                       list_class = "Bl-dash";
+                       list_elem = TAG_UL;
+                       break;
+               default:
+                       abort();
+               }
+       } else {
+               /* Continue a list that was started earlier. */
+               list_class = NULL;
+               list_elem = TAG_MAX;
+       }
+       body_elem = list_type == ' ' ? TAG_DD : TAG_LI;
 
-       if (n->type == ROFFT_BODY) {
-               print_otag(h, TAG_DD, "");
+       switch (n->type) {
+       case ROFFT_BLOCK:
+               html_close_paragraph(h);
+               if (list_elem != TAG_MAX)
+                       print_otag(h, list_elem, "c", list_class);
                return 1;
-       } else if (n->type != ROFFT_HEAD) {
-               print_otag(h, TAG_DL, "c", "Bl-tag");
+       case ROFFT_HEAD:
+               if (body_elem == TAG_LI)
+                       return 0;
+               print_otag_id(h, TAG_DT, NULL, n);
+               break;
+       case ROFFT_BODY:
+               print_otag(h, body_elem, "");
                return 1;
+       default:
+               abort();
        }
-
-       print_otag(h, TAG_DT, "");
-
        switch(n->tok) {
        case MAN_IP:  /* Only print the first header element. */
                if (n->child != NULL)
@@ -440,19 +514,6 @@ man_IP_pre(MAN_ARGS)
        return 0;
 }
 
-static int
-man_HP_pre(MAN_ARGS)
-{
-       if (n->type == ROFFT_HEAD)
-               return 0;
-
-       if (n->type == ROFFT_BLOCK) {
-               print_bvspace(h, n);
-               print_otag(h, TAG_DIV, "c", "HP");
-       }
-       return 1;
-}
-
 static int
 man_OP_pre(MAN_ARGS)
 {
@@ -510,10 +571,18 @@ man_ign_pre(MAN_ARGS)
 static int
 man_RS_pre(MAN_ARGS)
 {
-       if (n->type == ROFFT_HEAD)
+       switch (n->type) {
+       case ROFFT_BLOCK:
+               html_close_paragraph(h);
+               break;
+       case ROFFT_HEAD:
                return 0;
-       if (n->type == ROFFT_BLOCK)
+       case ROFFT_BODY:
                print_otag(h, TAG_DIV, "c", "Bd-indent");
+               break;
+       default:
+               abort();
+       }
        return 1;
 }
 
@@ -522,12 +591,13 @@ man_SY_pre(MAN_ARGS)
 {
        switch (n->type) {
        case ROFFT_BLOCK:
+               html_close_paragraph(h);
                print_otag(h, TAG_TABLE, "c", "Nm");
                print_otag(h, TAG_TR, "");
                break;
        case ROFFT_HEAD:
                print_otag(h, TAG_TD, "");
-               print_otag(h, TAG_CODE, "cT", "Nm");
+               print_otag(h, TAG_CODE, "c", "Nm");
                break;
        case ROFFT_BODY:
                print_otag(h, TAG_TD, "");
@@ -549,10 +619,10 @@ man_UR_pre(MAN_ARGS)
                assert(n->child->type == ROFFT_TEXT);
                if (n->tok == MAN_MT) {
                        mandoc_asprintf(&cp, "mailto:%s", n->child->string);
-                       print_otag(h, TAG_A, "cTh", "Mt", cp);
+                       print_otag(h, TAG_A, "ch", "Mt", cp);
                        free(cp);
                } else
-                       print_otag(h, TAG_A, "cTh", "Lk", n->child->string);
+                       print_otag(h, TAG_A, "ch", "Lk", n->child->string);
        }
 
        assert(n->next->type == ROFFT_BODY);