-/* $Id: term.c,v 1.12 2009/02/23 15:19:47 kristaps Exp $ */
+/* $Id: term.c,v 1.167 2010/08/20 01:02:07 schwarze Exp $ */
/*
- * Copyright (c) 2009 Kristaps Dzonsons <kristaps@kth.se>
+ * Copyright (c) 2008, 2009, 2010 Kristaps Dzonsons <kristaps@bsd.lv>
+ * Copyright (c) 2010 Ingo Schwarze <schwarze@openbsd.org>
*
* Permission to use, copy, modify, and distribute this software for any
- * purpose with or without fee is hereby granted, provided that the
- * above copyright notice and this permission notice appear in all
- * copies.
+ * purpose with or without fee is hereby granted, provided that the above
+ * copyright notice and this permission notice appear in all copies.
*
- * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL
- * WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED
- * WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE
- * AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL
- * DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR
- * PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER
- * TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
- * PERFORMANCE OF THIS SOFTWARE.
+ * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
+ * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
+ * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
+ * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
+ * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
+ * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
+ * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
*/
+#ifdef HAVE_CONFIG_H
+#include "config.h"
+#endif
+
+#include <sys/types.h>
+
#include <assert.h>
+#include <ctype.h>
+#include <stdint.h>
+#include <stdio.h>
#include <stdlib.h>
#include <string.h>
+#include "mandoc.h"
+#include "chars.h"
+#include "out.h"
#include "term.h"
+#include "main.h"
-#define INDENT 4
-
-/*
- * Performs actions on nodes of the abstract syntax tree. Both pre- and
- * post-fix operations are defined here.
- */
-
-/* FIXME: indent/tab. */
-/* FIXME: handle nested lists. */
-
-#define TTYPE_PROG 0
-#define TTYPE_CMD_FLAG 1
-#define TTYPE_CMD_ARG 2
-#define TTYPE_SECTION 3
-#define TTYPE_FUNC_DECL 4
-#define TTYPE_VAR_DECL 5
-#define TTYPE_FUNC_TYPE 6
-#define TTYPE_FUNC_NAME 7
-#define TTYPE_FUNC_ARG 8
-#define TTYPE_LINK 9
-#define TTYPE_SSECTION 10
-#define TTYPE_FILE 11
-#define TTYPE_EMPH 12
-#define TTYPE_NMAX 13
-
-/*
- * These define "styles" for element types, like command arguments or
- * executable names. This is useful when multiple macros must decorate
- * the same thing (like .Ex -std cmd and .Nm cmd).
- */
-
-const int ttypes[TTYPE_NMAX] = {
- TERMP_BOLD, /* TTYPE_PROG */
- TERMP_BOLD, /* TTYPE_CMD_FLAG */
- TERMP_UNDERLINE, /* TTYPE_CMD_ARG */
- TERMP_BOLD, /* TTYPE_SECTION */
- TERMP_BOLD, /* TTYPE_FUNC_DECL */
- TERMP_UNDERLINE, /* TTYPE_VAR_DECL */
- TERMP_UNDERLINE, /* TTYPE_FUNC_TYPE */
- TERMP_BOLD, /* TTYPE_FUNC_NAME */
- TERMP_UNDERLINE, /* TTYPE_FUNC_ARG */
- TERMP_UNDERLINE, /* TTYPE_LINK */
- TERMP_BOLD, /* TTYPE_SSECTION */
- TERMP_UNDERLINE, /* TTYPE_FILE */
- TERMP_UNDERLINE /* TTYPE_EMPH */
-};
-
-static int arg_hasattr(int, size_t,
- const struct mdoc_arg *);
-static int arg_getattr(int, size_t,
- const struct mdoc_arg *);
-static size_t arg_offset(const struct mdoc_arg *);
-static size_t arg_width(const struct mdoc_arg *);
-
-/*
- * What follows describes prefix and postfix operations for the abstract
- * syntax tree descent.
- */
-
-#define DECL_ARGS \
- struct termp *p, \
- const struct mdoc_meta *meta, \
- const struct mdoc_node *node
-
-#define DECL_PRE(name) \
-static int name##_pre(DECL_ARGS)
-#define DECL_POST(name) \
-static void name##_post(DECL_ARGS)
-#define DECL_PREPOST(name) \
-DECL_PRE(name); \
-DECL_POST(name);
-
-DECL_PREPOST(termp_aq);
-DECL_PREPOST(termp_ar);
-DECL_PREPOST(termp_bd);
-DECL_PREPOST(termp_d1);
-DECL_PREPOST(termp_dq);
-DECL_PREPOST(termp_em);
-DECL_PREPOST(termp_fa);
-DECL_PREPOST(termp_fd);
-DECL_PREPOST(termp_fl);
-DECL_PREPOST(termp_fn);
-DECL_PREPOST(termp_ft);
-DECL_PREPOST(termp_it);
-DECL_PREPOST(termp_nm);
-DECL_PREPOST(termp_op);
-DECL_PREPOST(termp_pa);
-DECL_PREPOST(termp_pf);
-DECL_PREPOST(termp_qo);
-DECL_PREPOST(termp_qq);
-DECL_PREPOST(termp_sh);
-DECL_PREPOST(termp_ss);
-DECL_PREPOST(termp_sq);
-DECL_PREPOST(termp_sx);
-DECL_PREPOST(termp_va);
-DECL_PREPOST(termp_vt);
-
-DECL_PRE(termp_bx);
-DECL_PRE(termp_ex);
-DECL_PRE(termp_nd);
-DECL_PRE(termp_ns);
-DECL_PRE(termp_nx);
-DECL_PRE(termp_ox);
-DECL_PRE(termp_pp);
-DECL_PRE(termp_ud);
-DECL_PRE(termp_xr);
-
-DECL_POST(termp_bl);
-
-const struct termact __termacts[MDOC_MAX] = {
- { NULL, NULL }, /* \" */
- { NULL, NULL }, /* Dd */
- { NULL, NULL }, /* Dt */
- { NULL, NULL }, /* Os */
- { termp_sh_pre, termp_sh_post }, /* Sh */
- { termp_ss_pre, termp_ss_post }, /* Ss */
- { termp_pp_pre, NULL }, /* Pp */
- { termp_d1_pre, termp_d1_post }, /* D1 */
- { NULL, NULL }, /* Dl */
- { termp_bd_pre, termp_bd_post }, /* Bd */
- { NULL, NULL }, /* Ed */
- { NULL, termp_bl_post }, /* Bl */
- { NULL, NULL }, /* El */
- { termp_it_pre, termp_it_post }, /* It */
- { NULL, NULL }, /* Ad */
- { NULL, NULL }, /* An */
- { termp_ar_pre, termp_ar_post }, /* Ar */
- { NULL, NULL }, /* Cd */
- { NULL, NULL }, /* Cm */
- { NULL, NULL }, /* Dv */
- { NULL, NULL }, /* Er */
- { NULL, NULL }, /* Ev */
- { termp_ex_pre, NULL }, /* Ex */
- { termp_fa_pre, termp_fa_post }, /* Fa */
- { termp_fd_pre, termp_fd_post }, /* Fd */
- { termp_fl_pre, termp_fl_post }, /* Fl */
- { termp_fn_pre, termp_fn_post }, /* Fn */
- { termp_ft_pre, termp_ft_post }, /* Ft */
- { NULL, NULL }, /* Ic */
- { NULL, NULL }, /* In */
- { NULL, NULL }, /* Li */
- { termp_nd_pre, NULL }, /* Nd */
- { termp_nm_pre, termp_nm_post }, /* Nm */
- { termp_op_pre, termp_op_post }, /* Op */
- { NULL, NULL }, /* Ot */
- { termp_pa_pre, termp_pa_post }, /* Pa */
- { NULL, NULL }, /* Rv */
- { NULL, NULL }, /* St */
- { termp_va_pre, termp_va_post }, /* Va */
- { termp_vt_pre, termp_vt_post }, /* Vt */
- { termp_xr_pre, NULL }, /* Xr */
- { NULL, NULL }, /* %A */
- { NULL, NULL }, /* %B */
- { NULL, NULL }, /* %D */
- { NULL, NULL }, /* %I */
- { NULL, NULL }, /* %J */
- { NULL, NULL }, /* %N */
- { NULL, NULL }, /* %O */
- { NULL, NULL }, /* %P */
- { NULL, NULL }, /* %R */
- { NULL, NULL }, /* %T */
- { NULL, NULL }, /* %V */
- { NULL, NULL }, /* Ac */
- { NULL, NULL }, /* Ao */
- { termp_aq_pre, termp_aq_post }, /* Aq */
- { NULL, NULL }, /* At */
- { NULL, NULL }, /* Bc */
- { NULL, NULL }, /* Bf */
- { NULL, NULL }, /* Bo */
- { NULL, NULL }, /* Bq */
- { NULL, NULL }, /* Bsx */
- { termp_bx_pre, NULL }, /* Bx */
- { NULL, NULL }, /* Db */
- { NULL, NULL }, /* Dc */
- { NULL, NULL }, /* Do */
- { termp_dq_pre, termp_dq_post }, /* Dq */
- { NULL, NULL }, /* Ec */
- { NULL, NULL }, /* Ef */
- { termp_em_pre, termp_em_post }, /* Em */
- { NULL, NULL }, /* Eo */
- { NULL, NULL }, /* Fx */
- { NULL, NULL }, /* Ms */
- { NULL, NULL }, /* No */
- { termp_ns_pre, NULL }, /* Ns */
- { termp_nx_pre, NULL }, /* Nx */
- { termp_ox_pre, NULL }, /* Ox */
- { NULL, NULL }, /* Pc */
- { termp_pf_pre, termp_pf_post }, /* Pf */
- { NULL, NULL }, /* Po */
- { NULL, NULL }, /* Pq */
- { NULL, NULL }, /* Qc */
- { NULL, NULL }, /* Ql */
- { termp_qo_pre, termp_qo_post }, /* Qo */
- { termp_qq_pre, termp_qq_post }, /* Qq */
- { NULL, NULL }, /* Re */
- { NULL, NULL }, /* Rs */
- { NULL, NULL }, /* Sc */
- { NULL, NULL }, /* So */
- { termp_sq_pre, termp_sq_post }, /* Sq */
- { NULL, NULL }, /* Sm */
- { termp_sx_pre, termp_sx_post }, /* Sx */
- { NULL, NULL }, /* Sy */
- { NULL, NULL }, /* Tn */
- { NULL, NULL }, /* Ux */
- { NULL, NULL }, /* Xc */
- { NULL, NULL }, /* Xo */
- { NULL, NULL }, /* Fo */
- { NULL, NULL }, /* Fc */
- { NULL, NULL }, /* Oo */
- { NULL, NULL }, /* Oc */
- { NULL, NULL }, /* Bk */
- { NULL, NULL }, /* Ek */
- { NULL, NULL }, /* Bt */
- { NULL, NULL }, /* Hf */
- { NULL, NULL }, /* Fr */
- { termp_ud_pre, NULL }, /* Ud */
-};
-
-const struct termact *termacts = __termacts;
-
-
-static size_t
-arg_width(const struct mdoc_arg *arg)
-{
-
- /* TODO */
- assert(*arg->value);
- return(strlen(*arg->value));
-}
+static void spec(struct termp *, enum roffdeco,
+ const char *, size_t);
+static void res(struct termp *, const char *, size_t);
+static void bufferc(struct termp *, char);
+static void adjbuf(struct termp *p, size_t);
+static void encode(struct termp *, const char *, size_t);
-static size_t
-arg_offset(const struct mdoc_arg *arg)
+void
+term_free(struct termp *p)
{
- /* TODO */
- assert(*arg->value);
- if (0 == strcmp(*arg->value, "indent"))
- return(INDENT);
- if (0 == strcmp(*arg->value, "indent-two"))
- return(INDENT * 2);
+ if (p->buf)
+ free(p->buf);
+ if (p->symtab)
+ chars_free(p->symtab);
- return(strlen(*arg->value));
+ free(p);
}
-static int
-arg_hasattr(int arg, size_t argc, const struct mdoc_arg *argv)
+void
+term_begin(struct termp *p, term_margin head,
+ term_margin foot, const void *arg)
{
- return(-1 != arg_getattr(arg, argc, argv));
+ p->headf = head;
+ p->footf = foot;
+ p->argf = arg;
+ (*p->begin)(p);
}
-static int
-arg_getattr(int arg, size_t argc, const struct mdoc_arg *argv)
+void
+term_end(struct termp *p)
{
- int i;
- for (i = 0; i < (int)argc; i++)
- if (argv[i].arg == arg)
- return(i);
- return(-1);
+ (*p->end)(p);
}
-/* ARGSUSED */
-static int
-termp_dq_pre(DECL_ARGS)
-{
-
- if (MDOC_BODY != node->type)
- return(1);
-
- word(p, "``");
- p->flags |= TERMP_NOSPACE;
- return(1);
-}
-
-
-/* ARGSUSED */
-static void
-termp_dq_post(DECL_ARGS)
+struct termp *
+term_alloc(enum termenc enc)
{
+ struct termp *p;
- if (MDOC_BODY != node->type)
- return;
+ p = calloc(1, sizeof(struct termp));
+ if (NULL == p) {
+ perror(NULL);
+ exit(MANDOCLEVEL_SYSERR);
+ }
- p->flags |= TERMP_NOSPACE;
- word(p, "''");
+ p->enc = enc;
+ return(p);
}
-/* ARGSUSED */
-static void
-termp_it_post(DECL_ARGS)
-{
- const struct mdoc_node *n, *it;
- const struct mdoc_block *bl;
- int i;
- size_t width, offset;
+/*
+ * Flush a line of text. A "line" is loosely defined as being something
+ * that should be followed by a newline, regardless of whether it's
+ * broken apart by newlines getting there. A line can also be a
+ * fragment of a columnar list (`Bl -tag' or `Bl -column'), which does
+ * not have a trailing newline.
+ *
+ * The following flags may be specified:
+ *
+ * - TERMP_NOLPAD: when beginning to write the line, don't left-pad the
+ * offset value. This is useful when doing columnar lists where the
+ * prior column has right-padded.
+ *
+ * - TERMP_NOBREAK: this is the most important and is used when making
+ * columns. In short: don't print a newline and instead pad to the
+ * right margin. Used in conjunction with TERMP_NOLPAD.
+ *
+ * - TERMP_TWOSPACE: when padding, make sure there are at least two
+ * space characters of padding. Otherwise, rather break the line.
+ *
+ * - TERMP_DANGLE: don't newline when TERMP_NOBREAK is specified and
+ * the line is overrun, and don't pad-right if it's underrun.
+ *
+ * - TERMP_HANG: like TERMP_DANGLE, but doesn't newline when
+ * overrunning; instead, save the position and continue at that point
+ * on the next invocation.
+ *
+ * In-line line breaking:
+ *
+ * If TERMP_NOBREAK is specified and the line overruns the right
+ * margin, it will break and pad-right to the right margin after
+ * writing. If maxrmargin is violated, it will break and continue
+ * writing from the right-margin, which will lead to the above scenario
+ * upon exit. Otherwise, the line will break at the right margin.
+ */
+void
+term_flushln(struct termp *p)
+{
+ int i; /* current input position in p->buf */
+ size_t vis; /* current visual position on output */
+ size_t vbl; /* number of blanks to prepend to output */
+ size_t vend; /* end of word visual position on output */
+ size_t bp; /* visual right border position */
+ int j; /* temporary loop index for p->buf */
+ int jhy; /* last hyph before overflow w/r/t j */
+ size_t maxvis; /* output position of visible boundary */
+ size_t mmax; /* used in calculating bp */
/*
- * This (and termp_it_pre()) are the most complicated functions
- * here. They must account for a considerable number of
- * switches that completely change the output behaviour, like
- * -tag versus -column. Yech.
+ * First, establish the maximum columns of "visible" content.
+ * This is usually the difference between the right-margin and
+ * an indentation, but can be, for tagged lists or columns, a
+ * small set of values.
*/
- switch (node->type) {
- case (MDOC_BODY):
- /* FALLTHROUGH */
- case (MDOC_HEAD):
- break;
- default:
- return;
- }
-
- it = node->parent;
- assert(MDOC_BLOCK == it->type);
- assert(MDOC_It == it->tok);
-
- n = it->parent;
- assert(MDOC_BODY == n->type);
- assert(MDOC_Bl == n->tok);
- n = n->parent;
- bl = &n->data.block;
-
- /* If `-tag', adjust our margins accordingly. */
-
- if (arg_hasattr(MDOC_Tag, bl->argc, bl->argv)) {
- flushln(p);
-
- /* FIXME: this should auto-size. */
- i = arg_getattr(MDOC_Width, bl->argc, bl->argv);
- width = i >= 0 ? arg_width(&bl->argv[i]) : 10;
+ assert(p->offset < p->rmargin);
- /* FIXME: nesting! Should happen at block. */
- i = arg_getattr(MDOC_Offset, bl->argc, bl->argv);
- offset = i >= 0 ? arg_width(&bl->argv[i]) : 0;
+ maxvis = (int)(p->rmargin - p->offset) - p->overstep < 0 ?
+ /* LINTED */
+ 0 : p->rmargin - p->offset - p->overstep;
+ mmax = (int)(p->maxrmargin - p->offset) - p->overstep < 0 ?
+ /* LINTED */
+ 0 : p->maxrmargin - p->offset - p->overstep;
- if (MDOC_HEAD == node->type) {
- p->rmargin = p->maxrmargin;
- p->offset -= offset;
- p->flags &= ~TERMP_NOBREAK;
- } else {
- p->offset -= width;
- p->flags &= ~TERMP_NOLPAD;
- }
- }
-
- if (arg_hasattr(MDOC_Ohang, bl->argc, bl->argv)) {
- i = arg_getattr(MDOC_Offset, bl->argc, bl->argv);
- offset = i >= 0 ? arg_offset(&bl->argv[i]) : 0;
-
- flushln(p);
- p->offset -= offset;
- return;
- }
-}
-
-
-/* ARGSUSED */
-static int
-termp_it_pre(DECL_ARGS)
-{
- const struct mdoc_node *n, *it;
- const struct mdoc_block *bl;
- int i;
- size_t width, offset;
+ bp = TERMP_NOBREAK & p->flags ? mmax : maxvis;
/*
- * Also see termp_it_post() for general comments.
+ * Indent the first line of a paragraph.
*/
-
- switch (node->type) {
- case (MDOC_BODY):
- /* FALLTHROUGH */
- case (MDOC_HEAD):
- it = node->parent;
- break;
- case (MDOC_BLOCK):
- it = node;
- break;
- default:
- return(1);
- }
-
- assert(MDOC_BLOCK == it->type);
- assert(MDOC_It == it->tok);
-
- n = it->parent;
- assert(MDOC_BODY == n->type);
- assert(MDOC_Bl == n->tok);
- n = n->parent;
- bl = &n->data.block;
-
- /* If `-compact', don't assert vertical space. */
-
- if (MDOC_BLOCK == node->type) {
- if (arg_hasattr(MDOC_Compact, bl->argc, bl->argv))
- newln(p);
- else
- vspace(p);
- return(1);
- }
-
- assert(MDOC_HEAD == node->type
- || MDOC_BODY == node->type);
-
- /* FIXME: see termp_it_post(). */
-
- /* If `-tag', adjust our margins accordingly. */
-
- if (arg_hasattr(MDOC_Tag, bl->argc, bl->argv)) {
- p->flags |= TERMP_NOSPACE;
-
- i = arg_getattr(MDOC_Width, bl->argc, bl->argv);
- width = i >= 0 ? arg_width(&bl->argv[i]) : 10;
-
- i = arg_getattr(MDOC_Offset, bl->argc, bl->argv);
- offset = i >= 0 ? arg_offset(&bl->argv[i]) : 0;
-
- if (MDOC_HEAD == node->type) {
- p->flags |= TERMP_NOBREAK;
- p->offset += offset;
- p->rmargin = p->offset + width;
- } else {
- p->flags |= TERMP_NOSPACE;
- p->flags |= TERMP_NOLPAD;
- p->offset += width;
+ vbl = p->flags & TERMP_NOLPAD ? 0 : p->offset;
+
+ vis = vend = i = 0;
+
+ while (i < (int)p->col) {
+ /*
+ * Handle literal tab characters: collapse all
+ * subsequent tabs into a single huge set of spaces.
+ */
+ for (j = i; j < (int)p->col; j++) {
+ if ('\t' != p->buf[j])
+ break;
+ vend = (vis / p->tabwidth + 1) * p->tabwidth;
+ vbl += vend - vis;
+ vis = vend;
}
- return(1);
- }
- /* If `-ohang', adjust left-margin. */
+ /*
+ * Count up visible word characters. Control sequences
+ * (starting with the CSI) aren't counted. A space
+ * generates a non-printing word, which is valid (the
+ * space is printed according to regular spacing rules).
+ */
+
+ /* LINTED */
+ for (jhy = 0; j < (int)p->col; j++) {
+ if ((j && ' ' == p->buf[j]) || '\t' == p->buf[j])
+ break;
+
+ /* Back over the last printed character. */
+ if (8 == p->buf[j]) {
+ assert(j);
+ vend -= (*p->width)(p, p->buf[j - 1]);
+ continue;
+ }
+
+ /* Regular word. */
+ /* Break at the hyphen point if we overrun. */
+ if (vend > vis && vend < bp &&
+ ASCII_HYPH == p->buf[j])
+ jhy = j;
+
+ vend += (*p->width)(p, p->buf[j]);
+ }
- if (arg_hasattr(MDOC_Ohang, bl->argc, bl->argv)) {
- i = arg_getattr(MDOC_Offset, bl->argc, bl->argv);
- offset = i >= 0 ? arg_offset(&bl->argv[i]) : 0;
+ /*
+ * Find out whether we would exceed the right margin.
+ * If so, break to the next line.
+ */
+ if (vend > bp && 0 == jhy && vis > 0) {
+ vend -= vis;
+ (*p->endline)(p);
+ if (TERMP_NOBREAK & p->flags) {
+ p->viscol = p->rmargin;
+ (*p->advance)(p, p->rmargin);
+ vend += p->rmargin - p->offset;
+ } else {
+ p->viscol = 0;
+ vbl = p->offset;
+ }
+
+ /* Remove the p->overstep width. */
+
+ bp += (int)/* LINTED */
+ p->overstep;
+ p->overstep = 0;
+ }
- p->flags |= TERMP_NOSPACE;
- p->offset += offset;
- return(1);
+ /*
+ * Skip leading tabs, they were handled above.
+ */
+ while (i < (int)p->col && '\t' == p->buf[i])
+ i++;
+
+ /* Write out the [remaining] word. */
+ for ( ; i < (int)p->col; i++) {
+ if (vend > bp && jhy > 0 && i > jhy)
+ break;
+ if ('\t' == p->buf[i])
+ break;
+ if (' ' == p->buf[i]) {
+ j = i;
+ while (' ' == p->buf[i])
+ i++;
+ vbl += (i - j) * (*p->width)(p, ' ');
+ break;
+ }
+ if (ASCII_NBRSP == p->buf[i]) {
+ vbl += (*p->width)(p, ' ');
+ continue;
+ }
+
+ /*
+ * Now we definitely know there will be
+ * printable characters to output,
+ * so write preceding white space now.
+ */
+ if (vbl) {
+ (*p->advance)(p, vbl);
+ p->viscol += vbl;
+ vbl = 0;
+ }
+
+ if (ASCII_HYPH == p->buf[i]) {
+ (*p->letter)(p, '-');
+ p->viscol += (*p->width)(p, '-');
+ } else {
+ (*p->letter)(p, p->buf[i]);
+ p->viscol += (*p->width)(p, p->buf[i]);
+ }
+ }
+ vend += vbl;
+ vis = vend;
}
- return(1);
-}
-
-
-/* ARGSUSED */
-static void
-termp_nm_post(DECL_ARGS)
-{
-
- p->flags &= ~ttypes[TTYPE_PROG];
-}
-
-
-/* ARGSUSED */
-static void
-termp_fl_post(DECL_ARGS)
-{
-
- p->flags &= ~ttypes[TTYPE_CMD_FLAG];
-}
-
+ p->col = 0;
+ p->overstep = 0;
-/* ARGSUSED */
-static int
-termp_ar_pre(DECL_ARGS)
-{
-
- p->flags |= ttypes[TTYPE_CMD_ARG];
- if (NULL == node->child)
- word(p, "...");
- return(1);
-}
-
-
-/* ARGSUSED */
-static int
-termp_nm_pre(DECL_ARGS)
-{
-
- p->flags |= ttypes[TTYPE_PROG];
- if (NULL == node->child)
- word(p, meta->name);
- return(1);
-}
-
-
-/* ARGSUSED */
-static int
-termp_ns_pre(DECL_ARGS)
-{
-
- p->flags |= TERMP_NOSPACE;
- return(1);
-}
-
-
-/* ARGSUSED */
-static int
-termp_pp_pre(DECL_ARGS)
-{
-
- vspace(p);
- return(1);
-}
-
-
-/* ARGSUSED */
-static void
-termp_ar_post(DECL_ARGS)
-{
-
- p->flags &= ~ttypes[TTYPE_CMD_ARG];
-}
-
-
-/* ARGSUSED */
-static int
-termp_ex_pre(DECL_ARGS)
-{
- int i;
-
- i = arg_getattr(MDOC_Std, node->data.elem.argc,
- node->data.elem.argv);
- assert(i >= 0);
-
- word(p, "The");
- p->flags |= ttypes[TTYPE_PROG];
- word(p, *node->data.elem.argv[i].value);
- p->flags &= ~ttypes[TTYPE_PROG];
- word(p, "utility exits 0 on success, and >0 if an error occurs.");
-
- return(1);
-}
-
-
-/* ARGSUSED */
-static int
-termp_nd_pre(DECL_ARGS)
-{
-
- word(p, "\\-");
- return(1);
-}
-
-
-/* ARGSUSED */
-static void
-termp_bl_post(DECL_ARGS)
-{
-
- if (MDOC_BLOCK == node->type)
- newln(p);
-}
-
-
-/* ARGSUSED */
-static void
-termp_op_post(DECL_ARGS)
-{
-
- if (MDOC_BODY != node->type)
+ if ( ! (TERMP_NOBREAK & p->flags)) {
+ p->viscol = 0;
+ (*p->endline)(p);
return;
- p->flags |= TERMP_NOSPACE;
- word(p, "\\(rB");
-}
-
-
-/* ARGSUSED */
-static void
-termp_sh_post(DECL_ARGS)
-{
-
- switch (node->type) {
- case (MDOC_HEAD):
- p->flags &= ~ttypes[TTYPE_SECTION];
- newln(p);
- break;
- case (MDOC_BODY):
- newln(p);
- p->offset = 0;
- break;
- default:
- break;
}
-}
-
-
-/* ARGSUSED */
-static int
-termp_xr_pre(DECL_ARGS)
-{
- const struct mdoc_node *n;
-
- n = node->child;
- assert(n);
-
- assert(MDOC_TEXT == n->type);
- word(p, n->data.text.string);
-
- if (NULL == (n = n->next))
- return(0);
-
- assert(MDOC_TEXT == n->type);
- p->flags |= TERMP_NOSPACE;
- word(p, "(");
- p->flags |= TERMP_NOSPACE;
- word(p, n->data.text.string);
- p->flags |= TERMP_NOSPACE;
- word(p, ")");
-
- return(0);
-}
-
-
-/* ARGSUSED */
-static int
-termp_vt_pre(DECL_ARGS)
-{
-
- /* FIXME: this can be "type name". */
- p->flags |= ttypes[TTYPE_VAR_DECL];
- return(1);
-}
-
-
-/* ARGSUSED */
-static void
-termp_vt_post(DECL_ARGS)
-{
-
- p->flags &= ~ttypes[TTYPE_VAR_DECL];
- if (node->sec == SEC_SYNOPSIS)
- vspace(p);
-}
-
-
-/* ARGSUSED */
-static int
-termp_fd_pre(DECL_ARGS)
-{
-
- /*
- * FIXME: this naming is bad. This value is used, in general,
- * for the #include header or other preprocessor statement.
- */
- p->flags |= ttypes[TTYPE_FUNC_DECL];
- return(1);
-}
-
-
-/* ARGSUSED */
-static void
-termp_fd_post(DECL_ARGS)
-{
-
- p->flags &= ~ttypes[TTYPE_FUNC_DECL];
- if (node->sec == SEC_SYNOPSIS)
- vspace(p);
-
-}
-
-
-/* ARGSUSED */
-static int
-termp_sh_pre(DECL_ARGS)
-{
-
- switch (node->type) {
- case (MDOC_HEAD):
- vspace(p);
- p->flags |= ttypes[TTYPE_SECTION];
- break;
- case (MDOC_BODY):
- p->offset = INDENT;
- break;
- default:
- break;
- }
- return(1);
-}
+ if (TERMP_HANG & p->flags) {
+ /* We need one blank after the tag. */
+ p->overstep = /* LINTED */
+ vis - maxvis + (*p->width)(p, ' ');
+
+ /*
+ * Behave exactly the same way as groff:
+ * If we have overstepped the margin, temporarily move
+ * it to the right and flag the rest of the line to be
+ * shorter.
+ * If we landed right at the margin, be happy.
+ * If we are one step before the margin, temporarily
+ * move it one step LEFT and flag the rest of the line
+ * to be longer.
+ */
+ if (p->overstep >= -1) {
+ assert((int)maxvis + p->overstep >= 0);
+ /* LINTED */
+ maxvis += p->overstep;
+ } else
+ p->overstep = 0;
-/* ARGSUSED */
-static int
-termp_op_pre(DECL_ARGS)
-{
+ } else if (TERMP_DANGLE & p->flags)
+ return;
- switch (node->type) {
- case (MDOC_BODY):
- word(p, "\\(lB");
- p->flags |= TERMP_NOSPACE;
- break;
- default:
- break;
+ /* Right-pad. */
+ if (maxvis > vis + /* LINTED */
+ ((TERMP_TWOSPACE & p->flags) ?
+ (*p->width)(p, ' ') : 0)) {
+ p->viscol += maxvis - vis;
+ (*p->advance)(p, maxvis - vis);
+ vis += (maxvis - vis);
+ } else { /* ...or newline break. */
+ (*p->endline)(p);
+ p->viscol = p->rmargin;
+ (*p->advance)(p, p->rmargin);
}
- return(1);
-}
-
-
-/* ARGSUSED */
-static int
-termp_ud_pre(DECL_ARGS)
-{
-
- word(p, "currently under development.");
- return(1);
}
-/* ARGSUSED */
-static int
-termp_fl_pre(DECL_ARGS)
+/*
+ * A newline only breaks an existing line; it won't assert vertical
+ * space. All data in the output buffer is flushed prior to the newline
+ * assertion.
+ */
+void
+term_newln(struct termp *p)
{
- p->flags |= ttypes[TTYPE_CMD_FLAG];
- word(p, "\\-");
p->flags |= TERMP_NOSPACE;
- return(1);
-}
-
-
-/* ARGSUSED */
-static int
-termp_d1_pre(DECL_ARGS)
-{
-
- if (MDOC_BODY != node->type)
- return(1);
- newln(p);
- p->offset += INDENT;
- return(1);
-}
-
-
-/* ARGSUSED */
-static void
-termp_d1_post(DECL_ARGS)
-{
-
- if (MDOC_BODY != node->type)
+ if (0 == p->col && 0 == p->viscol) {
+ p->flags &= ~TERMP_NOLPAD;
return;
- newln(p);
- p->offset -= INDENT;
+ }
+ term_flushln(p);
+ p->flags &= ~TERMP_NOLPAD;
}
-/* ARGSUSED */
-static int
-termp_aq_pre(DECL_ARGS)
+/*
+ * Asserts a vertical space (a full, empty line-break between lines).
+ * Note that if used twice, this will cause two blank lines, and so on.
+ * All data in the output buffer is flushed prior to the newline
+ * assertion.
+ */
+void
+term_vspace(struct termp *p)
{
- if (MDOC_BODY != node->type)
- return(1);
- word(p, "<");
- p->flags |= TERMP_NOSPACE;
- return(1);
+ term_newln(p);
+ p->viscol = 0;
+ (*p->endline)(p);
}
-/* ARGSUSED */
static void
-termp_aq_post(DECL_ARGS)
+spec(struct termp *p, enum roffdeco d, const char *word, size_t len)
{
+ const char *rhs;
+ size_t sz;
- if (MDOC_BODY != node->type)
- return;
- p->flags |= TERMP_NOSPACE;
- word(p, ">");
+ rhs = chars_spec2str(p->symtab, word, len, &sz);
+ if (rhs)
+ encode(p, rhs, sz);
+ else if (DECO_SSPECIAL == d)
+ encode(p, word, len);
}
-/* ARGSUSED */
-static int
-termp_ft_pre(DECL_ARGS)
-{
-
- p->flags |= ttypes[TTYPE_FUNC_TYPE];
- return(1);
-}
-
-
-/* ARGSUSED */
static void
-termp_ft_post(DECL_ARGS)
-{
-
- p->flags &= ~ttypes[TTYPE_FUNC_TYPE];
- if (node->sec == SEC_SYNOPSIS)
- newln(p);
-
-}
-
-
-/* ARGSUSED */
-static int
-termp_fn_pre(DECL_ARGS)
+res(struct termp *p, const char *word, size_t len)
{
- const struct mdoc_node *n;
-
- assert(node->child);
- assert(MDOC_TEXT == node->child->type);
-
- /* FIXME: can be "type funcname" "type varname"... */
-
- p->flags |= ttypes[TTYPE_FUNC_NAME];
- word(p, node->child->data.text.string);
- p->flags &= ~ttypes[TTYPE_FUNC_NAME];
-
- p->flags |= TERMP_NOSPACE;
- word(p, "(");
-
- p->flags |= TERMP_NOSPACE;
- for (n = node->child->next; n; n = n->next) {
- assert(MDOC_TEXT == n->type);
- p->flags |= ttypes[TTYPE_FUNC_ARG];
- word(p, n->data.text.string);
- p->flags &= ~ttypes[TTYPE_FUNC_ARG];
- if ((n->next))
- word(p, ",");
- }
-
- p->flags |= TERMP_NOSPACE;
- word(p, ")");
-
- if (SEC_SYNOPSIS == node->sec)
- word(p, ";");
+ const char *rhs;
+ size_t sz;
- return(0);
+ rhs = chars_res2str(p->symtab, word, len, &sz);
+ if (rhs)
+ encode(p, rhs, sz);
}
-/* ARGSUSED */
-static void
-termp_fn_post(DECL_ARGS)
+void
+term_fontlast(struct termp *p)
{
+ enum termfont f;
- if (node->sec == SEC_SYNOPSIS)
- vspace(p);
-
+ f = p->fontl;
+ p->fontl = p->fontq[p->fonti];
+ p->fontq[p->fonti] = f;
}
-/* ARGSUSED */
-static int
-termp_sx_pre(DECL_ARGS)
+void
+term_fontrepl(struct termp *p, enum termfont f)
{
- p->flags |= ttypes[TTYPE_LINK];
- return(1);
+ p->fontl = p->fontq[p->fonti];
+ p->fontq[p->fonti] = f;
}
-/* ARGSUSED */
-static void
-termp_sx_post(DECL_ARGS)
+void
+term_fontpush(struct termp *p, enum termfont f)
{
- p->flags &= ~ttypes[TTYPE_LINK];
+ assert(p->fonti + 1 < 10);
+ p->fontl = p->fontq[p->fonti];
+ p->fontq[++p->fonti] = f;
}
-/* ARGSUSED */
-static int
-termp_fa_pre(DECL_ARGS)
+const void *
+term_fontq(struct termp *p)
{
- p->flags |= ttypes[TTYPE_FUNC_ARG];
- return(1);
+ return(&p->fontq[p->fonti]);
}
-/* ARGSUSED */
-static void
-termp_fa_post(DECL_ARGS)
+enum termfont
+term_fonttop(struct termp *p)
{
- p->flags &= ~ttypes[TTYPE_FUNC_ARG];
+ return(p->fontq[p->fonti]);
}
-/* ARGSUSED */
-static int
-termp_va_pre(DECL_ARGS)
+void
+term_fontpopq(struct termp *p, const void *key)
{
- p->flags |= ttypes[TTYPE_VAR_DECL];
- return(1);
+ while (p->fonti >= 0 && key != &p->fontq[p->fonti])
+ p->fonti--;
+ assert(p->fonti >= 0);
}
-/* ARGSUSED */
-static void
-termp_va_post(DECL_ARGS)
+void
+term_fontpop(struct termp *p)
{
- p->flags &= ~ttypes[TTYPE_VAR_DECL];
+ assert(p->fonti);
+ p->fonti--;
}
-/* ARGSUSED */
-static int
-termp_bd_pre(DECL_ARGS)
-{
- const struct mdoc_block *bl;
- const struct mdoc_node *n;
- int i;
-
- if (MDOC_BLOCK == node->type) {
- vspace(p);
- return(1);
- } else if (MDOC_BODY != node->type)
- return(1);
-
- assert(MDOC_BLOCK == node->parent->type);
-
- bl = &node->parent->data.block;
+/*
+ * Handle pwords, partial words, which may be either a single word or a
+ * phrase that cannot be broken down (such as a literal string). This
+ * handles word styling.
+ */
+void
+term_word(struct termp *p, const char *word)
+{
+ const char *sv, *seq;
+ int sz;
+ size_t ssz;
+ enum roffdeco deco;
+
+ sv = word;
+
+ if (word[0] && '\0' == word[1])
+ switch (word[0]) {
+ case('.'):
+ /* FALLTHROUGH */
+ case(','):
+ /* FALLTHROUGH */
+ case(';'):
+ /* FALLTHROUGH */
+ case(':'):
+ /* FALLTHROUGH */
+ case('?'):
+ /* FALLTHROUGH */
+ case('!'):
+ /* FALLTHROUGH */
+ case(')'):
+ /* FALLTHROUGH */
+ case(']'):
+ if ( ! (TERMP_IGNDELIM & p->flags))
+ p->flags |= TERMP_NOSPACE;
+ break;
+ default:
+ break;
+ }
- i = arg_getattr(MDOC_Offset, bl->argc, bl->argv);
- if (-1 != i) {
- assert(1 == bl->argv[i].sz);
- p->offset += arg_offset(&bl->argv[i]);
+ if ( ! (TERMP_NOSPACE & p->flags)) {
+ if ( ! (TERMP_KEEP & p->flags)) {
+ if (TERMP_PREKEEP & p->flags)
+ p->flags |= TERMP_KEEP;
+ bufferc(p, ' ');
+ if (TERMP_SENTENCE & p->flags)
+ bufferc(p, ' ');
+ } else
+ bufferc(p, ASCII_NBRSP);
}
- if ( ! arg_hasattr(MDOC_Literal, bl->argc, bl->argv))
- return(1);
-
- p->flags |= TERMP_LITERAL;
+ if ( ! (p->flags & TERMP_NONOSPACE))
+ p->flags &= ~TERMP_NOSPACE;
+ else
+ p->flags |= TERMP_NOSPACE;
- for (n = node->child; n; n = n->next) {
- assert(MDOC_TEXT == n->type); /* FIXME */
- if ((*n->data.text.string)) {
- word(p, n->data.text.string);
- flushln(p);
- } else
- vspace(p);
+ p->flags &= ~TERMP_SENTENCE;
+
+ while (*word) {
+ if ((ssz = strcspn(word, "\\")) > 0)
+ encode(p, word, ssz);
+
+ word += ssz;
+ if ('\\' != *word)
+ continue;
+
+ seq = ++word;
+ sz = a2roffdeco(&deco, &seq, &ssz);
+
+ switch (deco) {
+ case (DECO_RESERVED):
+ res(p, seq, ssz);
+ break;
+ case (DECO_SPECIAL):
+ /* FALLTHROUGH */
+ case (DECO_SSPECIAL):
+ spec(p, deco, seq, ssz);
+ break;
+ case (DECO_BOLD):
+ term_fontrepl(p, TERMFONT_BOLD);
+ break;
+ case (DECO_ITALIC):
+ term_fontrepl(p, TERMFONT_UNDER);
+ break;
+ case (DECO_ROMAN):
+ term_fontrepl(p, TERMFONT_NONE);
+ break;
+ case (DECO_PREVIOUS):
+ term_fontlast(p);
+ break;
+ default:
+ break;
+ }
+ word += sz;
+ if (DECO_NOSPACE == deco && '\0' == *word)
+ p->flags |= TERMP_NOSPACE;
}
- p->flags &= ~TERMP_LITERAL;
- return(0);
+ /*
+ * Note that we don't process the pipe: the parser sees it as
+ * punctuation, but we don't in terms of typography.
+ */
+ if (sv[0] && '\0' == sv[1])
+ switch (sv[0]) {
+ case('('):
+ /* FALLTHROUGH */
+ case('['):
+ p->flags |= TERMP_NOSPACE;
+ break;
+ default:
+ break;
+ }
}
-/* ARGSUSED */
static void
-termp_bd_post(DECL_ARGS)
+adjbuf(struct termp *p, size_t sz)
{
- int i;
- const struct mdoc_block *bl;
-
- if (MDOC_BODY != node->type)
- return;
- assert(MDOC_BLOCK == node->parent->type);
- bl = &node->parent->data.block;
+ if (0 == p->maxcols)
+ p->maxcols = 1024;
+ while (sz >= p->maxcols)
+ p->maxcols <<= 2;
- i = arg_getattr(MDOC_Offset, bl->argc, bl->argv);
- if (-1 != i) {
- assert(1 == bl->argv[i].sz);
- p->offset -= arg_offset(&bl->argv[i]);
+ p->buf = realloc(p->buf, p->maxcols);
+ if (NULL == p->buf) {
+ perror(NULL);
+ exit(MANDOCLEVEL_SYSERR);
}
}
-/* ARGSUSED */
-static int
-termp_qq_pre(DECL_ARGS)
-{
-
- if (MDOC_BODY != node->type)
- return(1);
- word(p, "\"");
- p->flags |= TERMP_NOSPACE;
- return(1);
-}
-
-
-/* ARGSUSED */
static void
-termp_qq_post(DECL_ARGS)
+bufferc(struct termp *p, char c)
{
- if (MDOC_BODY != node->type)
- return;
- p->flags |= TERMP_NOSPACE;
- word(p, "\"");
-}
-
-
-/* ARGSUSED */
-static int
-termp_bx_pre(DECL_ARGS)
-{
+ if (p->col + 1 >= p->maxcols)
+ adjbuf(p, p->col + 1);
- word(p, "BSD");
- return(1);
+ p->buf[(int)p->col++] = c;
}
-/* ARGSUSED */
-static int
-termp_ox_pre(DECL_ARGS)
+static void
+encode(struct termp *p, const char *word, size_t sz)
{
+ enum termfont f;
+ int i;
- word(p, "OpenBSD");
- return(1);
-}
+ /*
+ * Encode and buffer a string of characters. If the current
+ * font mode is unset, buffer directly, else encode then buffer
+ * character by character.
+ */
+ if (TERMFONT_NONE == (f = term_fonttop(p))) {
+ if (p->col + sz >= p->maxcols)
+ adjbuf(p, p->col + sz);
+ memcpy(&p->buf[(int)p->col], word, sz);
+ p->col += sz;
+ return;
+ }
-/* ARGSUSED */
-static int
-termp_nx_pre(DECL_ARGS)
-{
+ /* Pre-buffer, assuming worst-case. */
- word(p, "NetBSD");
- return(1);
-}
+ if (p->col + 1 + (sz * 3) >= p->maxcols)
+ adjbuf(p, p->col + 1 + (sz * 3));
+ for (i = 0; i < (int)sz; i++) {
+ if ( ! isgraph((u_char)word[i])) {
+ p->buf[(int)p->col++] = word[i];
+ continue;
+ }
-/* ARGSUSED */
-static int
-termp_sq_pre(DECL_ARGS)
-{
+ if (TERMFONT_UNDER == f)
+ p->buf[(int)p->col++] = '_';
+ else
+ p->buf[(int)p->col++] = word[i];
- if (MDOC_BODY != node->type)
- return(1);
- word(p, "`");
- p->flags |= TERMP_NOSPACE;
- return(1);
+ p->buf[(int)p->col++] = 8;
+ p->buf[(int)p->col++] = word[i];
+ }
}
-/* ARGSUSED */
-static void
-termp_sq_post(DECL_ARGS)
+size_t
+term_len(const struct termp *p, size_t sz)
{
- if (MDOC_BODY != node->type)
- return;
- p->flags |= TERMP_NOSPACE;
- word(p, "\'");
+ return((*p->width)(p, ' ') * sz);
}
-/* ARGSUSED */
-static int
-termp_pf_pre(DECL_ARGS)
+size_t
+term_strlen(const struct termp *p, const char *cp)
{
+ size_t sz;
- p->flags |= TERMP_IGNDELIM;
- return(1);
-}
-
+ for (sz = 0; *cp; cp++)
+ sz += (*p->width)(p, *cp);
-/* ARGSUSED */
-static void
-termp_pf_post(DECL_ARGS)
-{
-
- p->flags &= ~TERMP_IGNDELIM;
- p->flags |= TERMP_NOSPACE;
+ return(sz);
}
/* ARGSUSED */
-static int
-termp_ss_pre(DECL_ARGS)
+size_t
+term_vspan(const struct termp *p, const struct roffsu *su)
{
+ double r;
- switch (node->type) {
- case (MDOC_HEAD):
- vspace(p);
- p->flags |= ttypes[TTYPE_SSECTION];
- p->offset = INDENT / 2;
+ switch (su->unit) {
+ case (SCALE_CM):
+ r = su->scale * 2;
break;
- default:
+ case (SCALE_IN):
+ r = su->scale * 6;
break;
- }
-
- return(1);
-}
-
-
-/* ARGSUSED */
-static void
-termp_ss_post(DECL_ARGS)
-{
-
- switch (node->type) {
- case (MDOC_HEAD):
- p->flags &= ~ttypes[TTYPE_SSECTION];
- newln(p);
- p->offset = INDENT;
+ case (SCALE_PC):
+ r = su->scale;
+ break;
+ case (SCALE_PT):
+ r = su->scale / 8;
+ break;
+ case (SCALE_MM):
+ r = su->scale / 1000;
+ break;
+ case (SCALE_VS):
+ r = su->scale;
break;
default:
+ r = su->scale - 1;
break;
}
-}
-
-
-/* ARGSUSED */
-static int
-termp_pa_pre(DECL_ARGS)
-{
- p->flags |= ttypes[TTYPE_FILE];
- return(1);
+ if (r < 0.0)
+ r = 0.0;
+ return(/* LINTED */(size_t)
+ r);
}
-/* ARGSUSED */
-static void
-termp_pa_post(DECL_ARGS)
-{
-
- p->flags &= ~ttypes[TTYPE_FILE];
-}
-
-
-/* ARGSUSED */
-static int
-termp_qo_pre(DECL_ARGS)
-{
-
- if (MDOC_BODY != node->type)
- return(1);
- word(p, "\"");
- p->flags |= TERMP_NOSPACE;
- return(1);
-}
-
-
-/* ARGSUSED */
-static void
-termp_qo_post(DECL_ARGS)
-{
-
- if (MDOC_BODY != node->type)
- return;
- p->flags |= TERMP_NOSPACE;
- word(p, "\"");
-}
-
-
-/* ARGSUSED */
-static int
-termp_em_pre(DECL_ARGS)
-{
-
- p->flags |= ttypes[TTYPE_EMPH];
- return(1);
-}
-
-
-/* ARGSUSED */
-static void
-termp_em_post(DECL_ARGS)
+size_t
+term_hspan(const struct termp *p, const struct roffsu *su)
{
+ double v;
- p->flags &= ~ttypes[TTYPE_EMPH];
+ v = ((*p->hspan)(p, su));
+ if (v < 0.0)
+ v = 0.0;
+ return((size_t) /* LINTED */
+ v);
}