]>
git.cameronkatri.com Git - mandoc.git/blob - mdoc_macro.c
1 /* $Id: mdoc_macro.c,v 1.69 2010/05/26 09:35:35 kristaps Exp $ */
3 * Copyright (c) 2008, 2009 Kristaps Dzonsons <kristaps@kth.se>
5 * Permission to use, copy, modify, and distribute this software for any
6 * purpose with or without fee is hereby granted, provided that the above
7 * copyright notice and this permission notice appear in all copies.
9 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
10 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
11 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
12 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
13 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
14 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
15 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
30 #include "libmandoc.h"
38 static int blk_full(MACRO_PROT_ARGS
);
39 static int blk_exp_close(MACRO_PROT_ARGS
);
40 static int blk_part_exp(MACRO_PROT_ARGS
);
41 static int blk_part_imp(MACRO_PROT_ARGS
);
42 static int ctx_synopsis(MACRO_PROT_ARGS
);
43 static int in_line_eoln(MACRO_PROT_ARGS
);
44 static int in_line_argn(MACRO_PROT_ARGS
);
45 static int in_line(MACRO_PROT_ARGS
);
46 static int obsolete(MACRO_PROT_ARGS
);
48 static int append_delims(struct mdoc
*,
50 static enum mdoct
lookup(enum mdoct
, const char *);
51 static enum mdoct
lookup_raw(const char *);
52 static int phrase(struct mdoc
*, int, int,
53 char *, enum margserr
);
54 static enum mdoct
rew_alt(enum mdoct
);
55 static int rew_dobreak(enum mdoct
,
56 const struct mdoc_node
*);
57 static enum rew
rew_dohalt(enum mdoct
, enum mdoc_type
,
58 const struct mdoc_node
*);
59 static int rew_elem(struct mdoc
*, enum mdoct
);
60 static int rew_last(struct mdoc
*,
61 const struct mdoc_node
*);
62 static int rew_sub(enum mdoc_type
, struct mdoc
*,
63 enum mdoct
, int, int);
64 static int swarn(struct mdoc
*, enum mdoc_type
, int,
65 int, const struct mdoc_node
*);
67 const struct mdoc_macro __mdoc_macros
[MDOC_MAX
] = {
68 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ap */
69 { in_line_eoln
, MDOC_PROLOGUE
}, /* Dd */
70 { in_line_eoln
, MDOC_PROLOGUE
}, /* Dt */
71 { in_line_eoln
, MDOC_PROLOGUE
}, /* Os */
72 { blk_full
, 0 }, /* Sh */
73 { blk_full
, 0 }, /* Ss */
74 { in_line_eoln
, 0 }, /* Pp */
75 { blk_part_imp
, MDOC_PARSED
}, /* D1 */
76 { blk_part_imp
, MDOC_PARSED
}, /* Dl */
77 { blk_full
, MDOC_EXPLICIT
}, /* Bd */
78 { blk_exp_close
, MDOC_EXPLICIT
}, /* Ed */
79 { blk_full
, MDOC_EXPLICIT
}, /* Bl */
80 { blk_exp_close
, MDOC_EXPLICIT
}, /* El */
81 { blk_full
, MDOC_PARSED
}, /* It */
82 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ad */
83 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* An */
84 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ar */
85 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Cd */
86 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Cm */
87 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Dv */
88 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Er */
89 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ev */
90 { in_line_eoln
, 0 }, /* Ex */
91 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Fa */
92 { in_line_eoln
, 0 }, /* Fd */
93 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Fl */
94 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Fn */
95 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ft */
96 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ic */
97 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* In */
98 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Li */
99 { blk_full
, 0 }, /* Nd */
100 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Nm */
101 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Op */
102 { obsolete
, 0 }, /* Ot */
103 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Pa */
104 { in_line_eoln
, 0 }, /* Rv */
105 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* St */
106 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Va */
107 { ctx_synopsis
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Vt */
108 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Xr */
109 { in_line_eoln
, 0 }, /* %A */
110 { in_line_eoln
, 0 }, /* %B */
111 { in_line_eoln
, 0 }, /* %D */
112 { in_line_eoln
, 0 }, /* %I */
113 { in_line_eoln
, 0 }, /* %J */
114 { in_line_eoln
, 0 }, /* %N */
115 { in_line_eoln
, 0 }, /* %O */
116 { in_line_eoln
, 0 }, /* %P */
117 { in_line_eoln
, 0 }, /* %R */
118 { in_line_eoln
, 0 }, /* %T */
119 { in_line_eoln
, 0 }, /* %V */
120 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Ac */
121 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Ao */
122 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Aq */
123 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* At */
124 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Bc */
125 { blk_full
, MDOC_EXPLICIT
}, /* Bf */
126 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Bo */
127 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Bq */
128 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Bsx */
129 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Bx */
130 { in_line_eoln
, 0 }, /* Db */
131 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Dc */
132 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Do */
133 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Dq */
134 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Ec */
135 { blk_exp_close
, MDOC_EXPLICIT
}, /* Ef */
136 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Em */
137 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Eo */
138 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Fx */
139 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ms */
140 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* No */
141 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ns */
142 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Nx */
143 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ox */
144 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Pc */
145 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_IGNDELIM
}, /* Pf */
146 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Po */
147 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Pq */
148 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Qc */
149 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ql */
150 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Qo */
151 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Qq */
152 { blk_exp_close
, MDOC_EXPLICIT
}, /* Re */
153 { blk_full
, MDOC_EXPLICIT
}, /* Rs */
154 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Sc */
155 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* So */
156 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Sq */
157 { in_line_eoln
, 0 }, /* Sm */
158 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Sx */
159 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Sy */
160 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Tn */
161 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ux */
162 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Xc */
163 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Xo */
164 { blk_full
, MDOC_EXPLICIT
| MDOC_CALLABLE
}, /* Fo */
165 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Fc */
166 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Oo */
167 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Oc */
168 { blk_full
, MDOC_EXPLICIT
}, /* Bk */
169 { blk_exp_close
, MDOC_EXPLICIT
}, /* Ek */
170 { in_line_eoln
, 0 }, /* Bt */
171 { in_line_eoln
, 0 }, /* Hf */
172 { obsolete
, 0 }, /* Fr */
173 { in_line_eoln
, 0 }, /* Ud */
174 { in_line
, 0 }, /* Lb */
175 { in_line_eoln
, 0 }, /* Lp */
176 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Lk */
177 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Mt */
178 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Brq */
179 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Bro */
180 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Brc */
181 { in_line_eoln
, 0 }, /* %C */
182 { obsolete
, 0 }, /* Es */
183 { obsolete
, 0 }, /* En */
184 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Dx */
185 { in_line_eoln
, 0 }, /* %Q */
186 { in_line_eoln
, 0 }, /* br */
187 { in_line_eoln
, 0 }, /* sp */
188 { in_line_eoln
, 0 }, /* %U */
191 const struct mdoc_macro
* const mdoc_macros
= __mdoc_macros
;
195 swarn(struct mdoc
*mdoc
, enum mdoc_type type
,
196 int line
, int pos
, const struct mdoc_node
*p
)
198 const char *n
, *t
, *tt
;
217 n
= mdoc_macronames
[p
->tok
];
221 n
= mdoc_macronames
[p
->tok
];
225 n
= mdoc_macronames
[p
->tok
];
232 rc
= mdoc_vmsg(mdoc
, MANDOCERR_SCOPE
, line
, pos
,
233 "%s scope breaks %s of %s", tt
, t
, n
);
235 /* FIXME: logic should be in driver. */
236 return(MDOC_IGN_SCOPE
& mdoc
->pflags
? rc
: 0);
241 * This is called at the end of parsing. It must traverse up the tree,
242 * closing out open [implicit] scopes. Obviously, open explicit scopes
246 mdoc_macroend(struct mdoc
*m
)
250 /* Scan for open explicit scopes. */
252 n
= MDOC_VALID
& m
->last
->flags
? m
->last
->parent
: m
->last
;
254 for ( ; n
; n
= n
->parent
) {
255 if (MDOC_BLOCK
!= n
->type
)
257 if ( ! (MDOC_EXPLICIT
& mdoc_macros
[n
->tok
].flags
))
259 mdoc_nmsg(m
, n
, MANDOCERR_SYNTSCOPE
);
263 /* Rewind to the first. */
265 return(rew_last(m
, m
->first
));
270 * Look up a macro from within a subsequent context.
273 lookup(enum mdoct from
, const char *p
)
275 /* FIXME: make -diag lists be un-PARSED. */
277 if ( ! (MDOC_PARSED
& mdoc_macros
[from
].flags
))
279 return(lookup_raw(p
));
284 * Lookup a macro following the initial line macro.
287 lookup_raw(const char *p
)
291 if (MDOC_MAX
== (res
= mdoc_hash_find(p
)))
293 if (MDOC_CALLABLE
& mdoc_macros
[res
].flags
)
300 rew_last(struct mdoc
*mdoc
, const struct mdoc_node
*to
)
304 mdoc
->next
= MDOC_NEXT_SIBLING
;
307 while (mdoc
->last
!= to
) {
308 if ( ! mdoc_valid_post(mdoc
))
310 if ( ! mdoc_action_post(mdoc
))
312 mdoc
->last
= mdoc
->last
->parent
;
316 if ( ! mdoc_valid_post(mdoc
))
318 return(mdoc_action_post(mdoc
));
323 * Return the opening macro of a closing one, e.g., `Ec' has `Eo' as its
327 rew_alt(enum mdoct tok
)
371 * Rewind rules. This indicates whether to stop rewinding
372 * (REWIND_HALT) without touching our current scope, stop rewinding and
373 * close our current scope (REWIND_REWIND), or continue (REWIND_NOHALT).
374 * The scope-closing and so on occurs in the various rew_* routines.
377 rew_dohalt(enum mdoct tok
, enum mdoc_type type
,
378 const struct mdoc_node
*p
)
381 if (MDOC_ROOT
== p
->type
)
383 if (MDOC_VALID
& p
->flags
)
384 return(REWIND_NOHALT
);
410 assert(MDOC_TAIL
!= type
);
411 if (type
== p
->type
&& tok
== p
->tok
)
412 return(REWIND_REWIND
);
415 assert(MDOC_TAIL
!= type
);
416 if (type
== p
->type
&& tok
== p
->tok
)
417 return(REWIND_REWIND
);
418 if (MDOC_BODY
== p
->type
&& MDOC_Bl
== p
->tok
)
422 if (type
== p
->type
&& tok
== p
->tok
)
423 return(REWIND_REWIND
);
428 assert(MDOC_TAIL
!= type
);
429 if (type
== p
->type
&& tok
== p
->tok
)
430 return(REWIND_REWIND
);
431 if (MDOC_BODY
== p
->type
&& MDOC_Sh
== p
->tok
)
465 if (type
== p
->type
&& tok
== p
->tok
)
466 return(REWIND_REWIND
);
468 /* Multi-line explicit scope close. */
500 if (type
== p
->type
&& rew_alt(tok
) == p
->tok
)
501 return(REWIND_REWIND
);
508 return(REWIND_NOHALT
);
513 * See if we can break an encountered scope (the rew_dohalt has returned
517 rew_dobreak(enum mdoct tok
, const struct mdoc_node
*p
)
520 assert(MDOC_ROOT
!= p
->type
);
521 if (MDOC_ELEM
== p
->type
)
523 if (MDOC_TEXT
== p
->type
)
525 if (MDOC_VALID
& p
->flags
)
530 return(MDOC_It
== p
->tok
);
532 return(MDOC_Nd
== p
->tok
);
534 return(MDOC_Ss
== p
->tok
);
536 if (MDOC_Nd
== p
->tok
)
538 if (MDOC_Ss
== p
->tok
)
540 return(MDOC_Sh
== p
->tok
);
542 if (MDOC_It
== p
->tok
)
546 if (MDOC_Op
== p
->tok
)
553 if (MDOC_EXPLICIT
& mdoc_macros
[tok
].flags
)
554 return(p
->tok
== rew_alt(tok
));
555 else if (MDOC_BLOCK
== p
->type
)
558 return(tok
== p
->tok
);
563 rew_elem(struct mdoc
*mdoc
, enum mdoct tok
)
568 if (MDOC_ELEM
!= n
->type
)
570 assert(MDOC_ELEM
== n
->type
);
571 assert(tok
== n
->tok
);
573 return(rew_last(mdoc
, n
));
578 rew_sub(enum mdoc_type t
, struct mdoc
*m
,
579 enum mdoct tok
, int line
, int ppos
)
585 for (n
= m
->last
; n
; n
= n
->parent
) {
586 c
= rew_dohalt(tok
, t
, n
);
587 if (REWIND_HALT
== c
) {
590 if ( ! (MDOC_EXPLICIT
& mdoc_macros
[tok
].flags
))
592 /* FIXME: shouldn't raise an error */
593 mdoc_pmsg(m
, line
, ppos
, MANDOCERR_SYNTNOSCOPE
);
596 if (REWIND_REWIND
== c
)
598 else if (rew_dobreak(tok
, n
))
600 if ( ! swarn(m
, t
, line
, ppos
, n
))
605 if ( ! rew_last(m
, n
))
610 * The current block extends an enclosing block beyond a line
611 * break. Now that the current block ends, close the enclosing
614 if (NULL
!= (n
= n
->pending
)) {
615 assert(MDOC_HEAD
== n
->type
);
616 if ( ! rew_last(m
, n
))
618 if ( ! mdoc_body_alloc(m
, n
->line
, n
->pos
, n
->tok
))
628 append_delims(struct mdoc
*m
, int line
, int *pos
, char *buf
)
634 if ('\0' == buf
[*pos
])
639 ac
= mdoc_zargs(m
, line
, pos
, buf
, ARGS_NOWARN
, &p
);
641 if (ARGS_ERROR
== ac
)
643 else if (ARGS_EOLN
== ac
)
646 assert(DELIM_NONE
!= mdoc_isdelim(p
));
647 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
651 * If we encounter end-of-sentence symbols, then trigger
654 * XXX: it's easy to allow this to propagate outward to
655 * the last symbol, such that `. )' will cause the
656 * correct double-spacing. However, (1) groff isn't
657 * smart enough to do this and (2) it would require
658 * knowing which symbols break this behaviour, for
659 * example, `. ;' shouldn't propagate the double-space.
661 if (mandoc_eos(p
, strlen(p
)))
662 m
->last
->flags
|= MDOC_EOS
;
670 * Close out block partial/full explicit.
673 blk_exp_close(MACRO_PROT_ARGS
)
675 int j
, lastarg
, maxargs
, flushed
, nl
;
680 nl
= MDOC_NEWLINE
& m
->flags
;
691 if ( ! (MDOC_CALLABLE
& mdoc_macros
[tok
].flags
)) {
692 /* FIXME: do this in validate */
694 if ( ! mdoc_pmsg(m
, line
, ppos
, MANDOCERR_ARGSLOST
))
697 if ( ! rew_sub(MDOC_BODY
, m
, tok
, line
, ppos
))
699 return(rew_sub(MDOC_BLOCK
, m
, tok
, line
, ppos
));
702 if ( ! rew_sub(MDOC_BODY
, m
, tok
, line
, ppos
))
706 if ( ! mdoc_tail_alloc(m
, line
, ppos
, rew_alt(tok
)))
709 for (flushed
= j
= 0; ; j
++) {
712 if (j
== maxargs
&& ! flushed
) {
713 if ( ! rew_sub(MDOC_BLOCK
, m
, tok
, line
, ppos
))
718 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
720 if (ARGS_ERROR
== ac
)
722 if (ARGS_PUNCT
== ac
)
727 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
729 if (MDOC_MAX
== ntok
) {
730 if ( ! mdoc_word_alloc(m
, line
, lastarg
, p
))
736 if ( ! rew_sub(MDOC_BLOCK
, m
, tok
, line
, ppos
))
740 if ( ! mdoc_macro(m
, ntok
, line
, lastarg
, pos
, buf
))
745 if ( ! flushed
&& ! rew_sub(MDOC_BLOCK
, m
, tok
, line
, ppos
))
750 return(append_delims(m
, line
, pos
, buf
));
755 in_line(MACRO_PROT_ARGS
)
757 int la
, lastpunct
, cnt
, nc
, nl
;
762 struct mdoc_arg
*arg
;
765 nl
= MDOC_NEWLINE
& m
->flags
;
768 * Whether we allow ignored elements (those without content,
769 * usually because of reserved words) to squeak by.
791 for (arg
= NULL
;; ) {
793 av
= mdoc_argv(m
, line
, tok
, &arg
, pos
, buf
);
795 if (ARGV_WORD
== av
) {
808 for (cnt
= 0, lastpunct
= 1;; ) {
810 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
812 if (ARGS_ERROR
== ac
)
816 if (ARGS_PUNCT
== ac
)
819 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
822 * In this case, we've located a submacro and must
823 * execute it. Close out scope, if open. If no
824 * elements have been generated, either create one (nc)
825 * or raise a warning.
828 if (MDOC_MAX
!= ntok
) {
829 if (0 == lastpunct
&& ! rew_elem(m
, tok
))
831 if (nc
&& 0 == cnt
) {
832 if ( ! mdoc_elem_alloc(m
, line
, ppos
, tok
, arg
))
834 if ( ! rew_last(m
, m
->last
))
836 } else if ( ! nc
&& 0 == cnt
) {
838 if ( ! mdoc_pmsg(m
, line
, ppos
, MANDOCERR_MACROEMPTY
))
841 if ( ! mdoc_macro(m
, ntok
, line
, la
, pos
, buf
))
845 return(append_delims(m
, line
, pos
, buf
));
849 * Non-quote-enclosed punctuation. Set up our scope, if
850 * a word; rewind the scope, if a delimiter; then append
854 d
= ARGS_QWORD
== ac
? DELIM_NONE
: mdoc_isdelim(p
);
856 if (ARGS_QWORD
!= ac
&& DELIM_NONE
!= d
) {
857 if (0 == lastpunct
&& ! rew_elem(m
, tok
))
860 } else if (lastpunct
) {
861 if ( ! mdoc_elem_alloc(m
, line
, ppos
, tok
, arg
))
868 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
872 * `Fl' macros have their scope re-opened with each new
873 * word so that the `-' can be added to each one without
874 * having to parse out spaces.
876 if (0 == lastpunct
&& MDOC_Fl
== tok
) {
877 if ( ! rew_elem(m
, tok
))
883 if (0 == lastpunct
&& ! rew_elem(m
, tok
))
887 * If no elements have been collected and we're allowed to have
888 * empties (nc), open a scope and close it out. Otherwise,
892 if (nc
&& 0 == cnt
) {
893 if ( ! mdoc_elem_alloc(m
, line
, ppos
, tok
, arg
))
895 if ( ! rew_last(m
, m
->last
))
897 } else if ( ! nc
&& 0 == cnt
) {
899 if ( ! mdoc_pmsg(m
, line
, ppos
, MANDOCERR_MACROEMPTY
))
905 return(append_delims(m
, line
, pos
, buf
));
910 blk_full(MACRO_PROT_ARGS
)
913 struct mdoc_arg
*arg
;
914 struct mdoc_node
*head
; /* save of head macro */
915 struct mdoc_node
*body
; /* save of body macro */
920 enum margserr ac
, lac
;
924 nl
= MDOC_NEWLINE
& m
->flags
;
926 /* Close out prior implicit scope. */
928 if ( ! (MDOC_EXPLICIT
& mdoc_macros
[tok
].flags
)) {
929 if ( ! rew_sub(MDOC_BODY
, m
, tok
, line
, ppos
))
931 if ( ! rew_sub(MDOC_BLOCK
, m
, tok
, line
, ppos
))
936 * This routine accommodates implicitly- and explicitly-scoped
937 * macro openings. Implicit ones first close out prior scope
938 * (seen above). Delay opening the head until necessary to
939 * allow leading punctuation to print. Special consideration
940 * for `It -column', which has phrase-part syntax instead of
941 * regular child nodes.
944 for (arg
= NULL
;; ) {
946 av
= mdoc_argv(m
, line
, tok
, &arg
, pos
, buf
);
948 if (ARGV_WORD
== av
) {
962 if ( ! mdoc_block_alloc(m
, line
, ppos
, tok
, arg
))
968 * The `Nd' macro has all arguments in its body: it's a hybrid
969 * of block partial-explicit and full-implicit. Stupid.
972 if (MDOC_Nd
== tok
) {
973 if ( ! mdoc_head_alloc(m
, line
, ppos
, tok
))
976 if ( ! rew_sub(MDOC_HEAD
, m
, tok
, line
, ppos
))
978 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
988 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
990 if (ARGS_ERROR
== ac
)
995 if (ARGS_PEND
== ac
) {
996 if (ARGS_PPHRASE
== lac
)
1002 /* Don't emit leading punct. for phrases. */
1005 ARGS_PHRASE
!= ac
&&
1006 ARGS_PPHRASE
!= ac
&&
1008 DELIM_OPEN
== mdoc_isdelim(p
)) {
1009 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1014 /* Always re-open head for phrases. */
1017 ARGS_PHRASE
== ac
||
1018 ARGS_PPHRASE
== ac
) {
1019 if ( ! mdoc_head_alloc(m
, line
, ppos
, tok
))
1024 if (ARGS_PHRASE
== ac
|| ARGS_PPHRASE
== ac
) {
1025 if (ARGS_PPHRASE
== ac
)
1026 m
->flags
|= MDOC_PPHRASE
;
1027 if ( ! phrase(m
, line
, la
, buf
, ac
))
1029 m
->flags
&= ~MDOC_PPHRASE
;
1030 if ( ! rew_sub(MDOC_HEAD
, m
, tok
, line
, ppos
))
1035 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
1037 if (MDOC_MAX
== ntok
) {
1038 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1043 if ( ! mdoc_macro(m
, ntok
, line
, la
, pos
, buf
))
1049 if ( ! mdoc_head_alloc(m
, line
, ppos
, tok
))
1054 if (nl
&& ! append_delims(m
, line
, pos
, buf
))
1057 /* If we've already opened our body, exit now. */
1064 * If there is an open (i.e., unvalidated) sub-block requiring
1065 * explicit close-out, postpone switching the current block from
1066 * head to body until the rew_sub() call closing out that
1069 for (n
= m
->last
; n
&& n
!= head
; n
= n
->parent
) {
1070 if (MDOC_BLOCK
== n
->type
&&
1071 MDOC_EXPLICIT
& mdoc_macros
[n
->tok
].flags
&&
1072 ! (MDOC_VALID
& n
->flags
)) {
1073 assert( ! (MDOC_ACTED
& n
->flags
));
1080 /* Close out scopes to remain in a consistent state. */
1082 if ( ! rew_sub(MDOC_HEAD
, m
, tok
, line
, ppos
))
1084 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1092 blk_part_imp(MACRO_PROT_ARGS
)
1098 struct mdoc_node
*blk
; /* saved block context */
1099 struct mdoc_node
*body
; /* saved body context */
1100 struct mdoc_node
*n
;
1102 nl
= MDOC_NEWLINE
& m
->flags
;
1105 * A macro that spans to the end of the line. This is generally
1106 * (but not necessarily) called as the first macro. The block
1107 * has a head as the immediate child, which is always empty,
1108 * followed by zero or more opening punctuation nodes, then the
1109 * body (which may be empty, depending on the macro), then zero
1110 * or more closing punctuation nodes.
1113 if ( ! mdoc_block_alloc(m
, line
, ppos
, tok
, NULL
))
1118 if ( ! mdoc_head_alloc(m
, line
, ppos
, tok
))
1120 if ( ! rew_sub(MDOC_HEAD
, m
, tok
, line
, ppos
))
1124 * Open the body scope "on-demand", that is, after we've
1125 * processed all of the leading delimiters (open parenthesis,
1129 for (body
= NULL
; ; ) {
1131 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
1133 if (ARGS_ERROR
== ac
)
1135 if (ARGS_EOLN
== ac
)
1137 if (ARGS_PUNCT
== ac
)
1140 if (NULL
== body
&& ARGS_QWORD
!= ac
&&
1141 DELIM_OPEN
== mdoc_isdelim(p
)) {
1142 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1148 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1153 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
1155 if (MDOC_MAX
== ntok
) {
1156 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1161 if ( ! mdoc_macro(m
, ntok
, line
, la
, pos
, buf
))
1166 /* Clean-ups to leave in a consistent state. */
1169 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1174 for (n
= body
->child
; n
&& n
->next
; n
= n
->next
)
1178 * End of sentence spacing: if the last node is a text node and
1179 * has a trailing period, then mark it as being end-of-sentence.
1182 if (n
&& MDOC_TEXT
== n
->type
&& n
->string
)
1183 if (mandoc_eos(n
->string
, strlen(n
->string
)))
1184 n
->flags
|= MDOC_EOS
;
1186 /* Up-propagate the end-of-sentence flag. */
1188 if (n
&& (MDOC_EOS
& n
->flags
)) {
1189 body
->flags
|= MDOC_EOS
;
1190 body
->parent
->flags
|= MDOC_EOS
;
1194 * If we can't rewind to our body, then our scope has already
1195 * been closed by another macro (like `Oc' closing `Op'). This
1196 * is ugly behaviour nodding its head to OpenBSD's overwhelmingly
1197 * crufty use of `Op' breakage.
1199 * FIXME - this should be ifdef'd OpenBSD?
1201 for (n
= m
->last
; n
; n
= n
->parent
)
1205 if (NULL
== n
&& ! mdoc_nmsg(m
, body
, MANDOCERR_SCOPE
))
1208 if (n
&& ! rew_last(m
, body
))
1211 /* Standard appending of delimiters. */
1213 if (nl
&& ! append_delims(m
, line
, pos
, buf
))
1216 /* Rewind scope, if applicable. */
1218 if (n
&& ! rew_last(m
, blk
))
1226 blk_part_exp(MACRO_PROT_ARGS
)
1230 struct mdoc_node
*head
; /* keep track of head */
1231 struct mdoc_node
*body
; /* keep track of body */
1235 nl
= MDOC_NEWLINE
& m
->flags
;
1238 * The opening of an explicit macro having zero or more leading
1239 * punctuation nodes; a head with optional single element (the
1240 * case of `Eo'); and a body that may be empty.
1243 if ( ! mdoc_block_alloc(m
, line
, ppos
, tok
, NULL
))
1246 for (head
= body
= NULL
; ; ) {
1248 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
1250 if (ARGS_ERROR
== ac
)
1252 if (ARGS_PUNCT
== ac
)
1254 if (ARGS_EOLN
== ac
)
1257 /* Flush out leading punctuation. */
1259 if (NULL
== head
&& ARGS_QWORD
!= ac
&&
1260 DELIM_OPEN
== mdoc_isdelim(p
)) {
1261 assert(NULL
== body
);
1262 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1268 assert(NULL
== body
);
1269 if ( ! mdoc_head_alloc(m
, line
, ppos
, tok
))
1275 * `Eo' gobbles any data into the head, but most other
1276 * macros just immediately close out and begin the body.
1281 /* No check whether it's a macro! */
1283 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1286 if ( ! rew_sub(MDOC_HEAD
, m
, tok
, line
, ppos
))
1288 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1296 assert(NULL
!= head
&& NULL
!= body
);
1298 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
1300 if (MDOC_MAX
== ntok
) {
1301 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1306 if ( ! mdoc_macro(m
, ntok
, line
, la
, pos
, buf
))
1311 /* Clean-up to leave in a consistent state. */
1314 if ( ! mdoc_head_alloc(m
, line
, ppos
, tok
))
1320 if ( ! rew_sub(MDOC_HEAD
, m
, tok
, line
, ppos
))
1322 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1327 /* Standard appending of delimiters. */
1331 return(append_delims(m
, line
, pos
, buf
));
1337 in_line_argn(MACRO_PROT_ARGS
)
1339 int la
, flushed
, j
, maxargs
, nl
;
1342 struct mdoc_arg
*arg
;
1346 nl
= MDOC_NEWLINE
& m
->flags
;
1349 * A line macro that has a fixed number of arguments (maxargs).
1350 * Only open the scope once the first non-leading-punctuation is
1351 * found (unless MDOC_IGNDELIM is noted, like in `Pf'), then
1352 * keep it open until the maximum number of arguments are
1374 for (arg
= NULL
; ; ) {
1376 av
= mdoc_argv(m
, line
, tok
, &arg
, pos
, buf
);
1378 if (ARGV_WORD
== av
) {
1383 if (ARGV_EOLN
== av
)
1388 mdoc_argv_free(arg
);
1392 for (flushed
= j
= 0; ; ) {
1394 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
1396 if (ARGS_ERROR
== ac
)
1398 if (ARGS_PUNCT
== ac
)
1400 if (ARGS_EOLN
== ac
)
1403 if ( ! (MDOC_IGNDELIM
& mdoc_macros
[tok
].flags
) &&
1405 0 == j
&& DELIM_OPEN
== mdoc_isdelim(p
)) {
1406 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1410 if ( ! mdoc_elem_alloc(m
, line
, la
, tok
, arg
))
1413 if (j
== maxargs
&& ! flushed
) {
1414 if ( ! rew_elem(m
, tok
))
1419 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
1421 if (MDOC_MAX
!= ntok
) {
1422 if ( ! flushed
&& ! rew_elem(m
, tok
))
1425 if ( ! mdoc_macro(m
, ntok
, line
, la
, pos
, buf
))
1431 if ( ! (MDOC_IGNDELIM
& mdoc_macros
[tok
].flags
) &&
1434 DELIM_NONE
!= mdoc_isdelim(p
)) {
1435 if ( ! rew_elem(m
, tok
))
1441 * XXX: this is a hack to work around groff's ugliness
1442 * as regards `Xr' and extraneous arguments. It should
1443 * ideally be deprecated behaviour, but because this
1444 * code is now here, it's unlikely to be removed.
1448 if (MDOC_Xr
== tok
&& j
== maxargs
) {
1449 if ( ! mdoc_elem_alloc(m
, line
, la
, MDOC_Ns
, NULL
))
1451 if ( ! rew_elem(m
, MDOC_Ns
))
1456 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1461 if (0 == j
&& ! mdoc_elem_alloc(m
, line
, la
, tok
, arg
))
1464 /* Close out in a consistent state. */
1466 if ( ! flushed
&& ! rew_elem(m
, tok
))
1470 return(append_delims(m
, line
, pos
, buf
));
1475 in_line_eoln(MACRO_PROT_ARGS
)
1480 struct mdoc_arg
*arg
;
1484 assert( ! (MDOC_PARSED
& mdoc_macros
[tok
].flags
));
1486 /* Parse macro arguments. */
1488 for (arg
= NULL
; ; ) {
1490 av
= mdoc_argv(m
, line
, tok
, &arg
, pos
, buf
);
1492 if (ARGV_WORD
== av
) {
1496 if (ARGV_EOLN
== av
)
1501 mdoc_argv_free(arg
);
1505 /* Open element scope. */
1507 if ( ! mdoc_elem_alloc(m
, line
, ppos
, tok
, arg
))
1510 /* Parse argument terms. */
1514 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
1516 if (ARGS_ERROR
== ac
)
1518 if (ARGS_EOLN
== ac
)
1521 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
1523 if (MDOC_MAX
== ntok
) {
1524 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1529 if ( ! rew_elem(m
, tok
))
1531 return(mdoc_macro(m
, ntok
, line
, la
, pos
, buf
));
1534 /* Close out (no delimiters). */
1536 return(rew_elem(m
, tok
));
1542 ctx_synopsis(MACRO_PROT_ARGS
)
1546 nl
= MDOC_NEWLINE
& m
->flags
;
1548 /* If we're not in the SYNOPSIS, go straight to in-line. */
1549 if (SEC_SYNOPSIS
!= m
->lastsec
)
1550 return(in_line(m
, tok
, line
, ppos
, pos
, buf
));
1552 /* If we're a nested call, same place. */
1554 return(in_line(m
, tok
, line
, ppos
, pos
, buf
));
1557 * XXX: this will open a block scope; however, if later we end
1558 * up formatting the block scope, then child nodes will inherit
1559 * the formatting. Be careful.
1562 return(blk_part_imp(m
, tok
, line
, ppos
, pos
, buf
));
1568 obsolete(MACRO_PROT_ARGS
)
1571 return(mdoc_pmsg(m
, line
, ppos
, MANDOCERR_MACROOBS
));
1576 * Phrases occur within `Bl -column' entries, separated by `Ta' or tabs.
1577 * They're unusual because they're basically free-form text until a
1578 * macro is encountered.
1581 phrase(struct mdoc
*m
, int line
, int ppos
, char *buf
, enum margserr ac
)
1588 assert(ARGS_PHRASE
== ac
|| ARGS_PPHRASE
== ac
);
1590 for (pos
= ppos
; ; ) {
1593 aac
= mdoc_zargs(m
, line
, &pos
, buf
, 0, &p
);
1595 if (ARGS_ERROR
== aac
)
1597 if (ARGS_EOLN
== aac
)
1600 ntok
= ARGS_QWORD
== aac
? MDOC_MAX
: lookup_raw(p
);
1602 if (MDOC_MAX
== ntok
) {
1603 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1608 if ( ! mdoc_macro(m
, ntok
, line
, la
, &pos
, buf
))
1610 return(append_delims(m
, line
, &pos
, buf
));