]>
git.cameronkatri.com Git - mandoc.git/blob - mdoc_macro.c
1 /* $Id: mdoc_macro.c,v 1.85 2010/06/29 19:45:06 schwarze Exp $ */
3 * Copyright (c) 2008, 2009 Kristaps Dzonsons <kristaps@bsd.lv>
5 * Permission to use, copy, modify, and distribute this software for any
6 * purpose with or without fee is hereby granted, provided that the above
7 * copyright notice and this permission notice appear in all copies.
9 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
10 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
11 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
12 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
13 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
14 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
15 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
30 #include "libmandoc.h"
32 enum rew
{ /* see rew_dohalt() */
40 static int blk_full(MACRO_PROT_ARGS
);
41 static int blk_exp_close(MACRO_PROT_ARGS
);
42 static int blk_part_exp(MACRO_PROT_ARGS
);
43 static int blk_part_imp(MACRO_PROT_ARGS
);
44 static int ctx_synopsis(MACRO_PROT_ARGS
);
45 static int in_line_eoln(MACRO_PROT_ARGS
);
46 static int in_line_argn(MACRO_PROT_ARGS
);
47 static int in_line(MACRO_PROT_ARGS
);
48 static int obsolete(MACRO_PROT_ARGS
);
49 static int phrase_ta(MACRO_PROT_ARGS
);
51 static int append_delims(struct mdoc
*,
53 static enum mdoct
lookup(enum mdoct
, const char *);
54 static enum mdoct
lookup_raw(const char *);
55 static int make_pending(struct mdoc_node
*, enum mdoct
,
56 struct mdoc
*, int, int);
57 static int phrase(struct mdoc
*, int, int, char *);
58 static enum mdoct
rew_alt(enum mdoct
);
59 static enum rew
rew_dohalt(enum mdoct
, enum mdoc_type
,
60 const struct mdoc_node
*);
61 static int rew_elem(struct mdoc
*, enum mdoct
);
62 static int rew_last(struct mdoc
*,
63 const struct mdoc_node
*);
64 static int rew_sub(enum mdoc_type
, struct mdoc
*,
65 enum mdoct
, int, int);
67 const struct mdoc_macro __mdoc_macros
[MDOC_MAX
] = {
68 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ap */
69 { in_line_eoln
, MDOC_PROLOGUE
}, /* Dd */
70 { in_line_eoln
, MDOC_PROLOGUE
}, /* Dt */
71 { in_line_eoln
, MDOC_PROLOGUE
}, /* Os */
72 { blk_full
, 0 }, /* Sh */
73 { blk_full
, 0 }, /* Ss */
74 { in_line_eoln
, 0 }, /* Pp */
75 { blk_part_imp
, MDOC_PARSED
}, /* D1 */
76 { blk_part_imp
, MDOC_PARSED
}, /* Dl */
77 { blk_full
, MDOC_EXPLICIT
}, /* Bd */
78 { blk_exp_close
, MDOC_EXPLICIT
}, /* Ed */
79 { blk_full
, MDOC_EXPLICIT
}, /* Bl */
80 { blk_exp_close
, MDOC_EXPLICIT
}, /* El */
81 { blk_full
, MDOC_PARSED
}, /* It */
82 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ad */
83 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* An */
84 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ar */
85 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Cd */
86 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Cm */
87 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Dv */
88 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Er */
89 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ev */
90 { in_line_eoln
, 0 }, /* Ex */
91 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Fa */
92 { in_line_eoln
, 0 }, /* Fd */
93 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Fl */
94 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Fn */
95 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ft */
96 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ic */
97 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* In */
98 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Li */
99 { blk_full
, 0 }, /* Nd */
100 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Nm */
101 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Op */
102 { obsolete
, 0 }, /* Ot */
103 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Pa */
104 { in_line_eoln
, 0 }, /* Rv */
105 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* St */
106 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Va */
107 { ctx_synopsis
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Vt */
108 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Xr */
109 { in_line_eoln
, 0 }, /* %A */
110 { in_line_eoln
, 0 }, /* %B */
111 { in_line_eoln
, 0 }, /* %D */
112 { in_line_eoln
, 0 }, /* %I */
113 { in_line_eoln
, 0 }, /* %J */
114 { in_line_eoln
, 0 }, /* %N */
115 { in_line_eoln
, 0 }, /* %O */
116 { in_line_eoln
, 0 }, /* %P */
117 { in_line_eoln
, 0 }, /* %R */
118 { in_line_eoln
, 0 }, /* %T */
119 { in_line_eoln
, 0 }, /* %V */
120 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Ac */
121 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Ao */
122 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Aq */
123 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* At */
124 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Bc */
125 { blk_full
, MDOC_EXPLICIT
}, /* Bf */
126 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Bo */
127 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Bq */
128 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Bsx */
129 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Bx */
130 { in_line_eoln
, 0 }, /* Db */
131 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Dc */
132 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Do */
133 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Dq */
134 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Ec */
135 { blk_exp_close
, MDOC_EXPLICIT
}, /* Ef */
136 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Em */
137 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Eo */
138 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Fx */
139 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ms */
140 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* No */
141 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ns */
142 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Nx */
143 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ox */
144 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Pc */
145 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_IGNDELIM
}, /* Pf */
146 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Po */
147 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Pq */
148 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Qc */
149 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ql */
150 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Qo */
151 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Qq */
152 { blk_exp_close
, MDOC_EXPLICIT
}, /* Re */
153 { blk_full
, MDOC_EXPLICIT
}, /* Rs */
154 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Sc */
155 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* So */
156 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Sq */
157 { in_line_eoln
, 0 }, /* Sm */
158 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Sx */
159 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Sy */
160 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Tn */
161 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ux */
162 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Xc */
163 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Xo */
164 { blk_full
, MDOC_EXPLICIT
| MDOC_CALLABLE
}, /* Fo */
165 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Fc */
166 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Oo */
167 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Oc */
168 { blk_full
, MDOC_EXPLICIT
}, /* Bk */
169 { blk_exp_close
, MDOC_EXPLICIT
}, /* Ek */
170 { in_line_eoln
, 0 }, /* Bt */
171 { in_line_eoln
, 0 }, /* Hf */
172 { obsolete
, 0 }, /* Fr */
173 { in_line_eoln
, 0 }, /* Ud */
174 { in_line
, 0 }, /* Lb */
175 { in_line_eoln
, 0 }, /* Lp */
176 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Lk */
177 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Mt */
178 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Brq */
179 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Bro */
180 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Brc */
181 { in_line_eoln
, 0 }, /* %C */
182 { obsolete
, 0 }, /* Es */
183 { obsolete
, 0 }, /* En */
184 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Dx */
185 { in_line_eoln
, 0 }, /* %Q */
186 { in_line_eoln
, 0 }, /* br */
187 { in_line_eoln
, 0 }, /* sp */
188 { in_line_eoln
, 0 }, /* %U */
189 { phrase_ta
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ta */
192 const struct mdoc_macro
* const mdoc_macros
= __mdoc_macros
;
196 * This is called at the end of parsing. It must traverse up the tree,
197 * closing out open [implicit] scopes. Obviously, open explicit scopes
201 mdoc_macroend(struct mdoc
*m
)
205 /* Scan for open explicit scopes. */
207 n
= MDOC_VALID
& m
->last
->flags
? m
->last
->parent
: m
->last
;
209 for ( ; n
; n
= n
->parent
) {
210 if (MDOC_BLOCK
!= n
->type
)
212 if ( ! (MDOC_EXPLICIT
& mdoc_macros
[n
->tok
].flags
))
214 mdoc_nmsg(m
, n
, MANDOCERR_SYNTSCOPE
);
218 /* Rewind to the first. */
220 return(rew_last(m
, m
->first
));
225 * Look up a macro from within a subsequent context.
228 lookup(enum mdoct from
, const char *p
)
230 /* FIXME: make -diag lists be un-PARSED. */
232 if ( ! (MDOC_PARSED
& mdoc_macros
[from
].flags
))
234 return(lookup_raw(p
));
239 * Lookup a macro following the initial line macro.
242 lookup_raw(const char *p
)
246 if (MDOC_MAX
== (res
= mdoc_hash_find(p
)))
248 if (MDOC_CALLABLE
& mdoc_macros
[res
].flags
)
255 rew_last(struct mdoc
*mdoc
, const struct mdoc_node
*to
)
259 mdoc
->next
= MDOC_NEXT_SIBLING
;
262 while (mdoc
->last
!= to
) {
263 if ( ! mdoc_valid_post(mdoc
))
265 if ( ! mdoc_action_post(mdoc
))
267 mdoc
->last
= mdoc
->last
->parent
;
271 if ( ! mdoc_valid_post(mdoc
))
273 return(mdoc_action_post(mdoc
));
278 * For a block closing macro, return the corresponding opening one.
279 * Otherwise, return the macro itself.
282 rew_alt(enum mdoct tok
)
325 * Rewinding to tok, how do we have to handle *p?
326 * REWIND_NONE: *p would delimit tok, but no tok scope is open
327 * inside *p, so there is no need to rewind anything at all.
328 * REWIND_THIS: *p matches tok, so rewind *p and nothing else.
329 * REWIND_MORE: *p is implicit, rewind it and keep searching for tok.
330 * REWIND_LATER: *p is explicit and still open, postpone rewinding.
331 * REWIND_ERROR: No tok block is open at all.
334 rew_dohalt(enum mdoct tok
, enum mdoc_type type
,
335 const struct mdoc_node
*p
)
338 if (MDOC_ROOT
== p
->type
)
339 return(MDOC_BLOCK
== type
&&
340 MDOC_EXPLICIT
& mdoc_macros
[tok
].flags
?
341 REWIND_ERROR
: REWIND_NONE
);
342 if (MDOC_TEXT
== p
->type
|| MDOC_VALID
& p
->flags
)
347 return(p
->end
? REWIND_NONE
:
348 type
== p
->type
? REWIND_THIS
: REWIND_MORE
);
350 if (MDOC_ELEM
== p
->type
)
355 if (MDOC_It
== p
->tok
)
359 if (MDOC_BODY
== p
->type
&& MDOC_Bl
== p
->tok
)
363 * XXX Badly nested block handling still fails badly
364 * when one block is breaking two blocks of the same type.
365 * This is an incomplete and extremely ugly workaround,
366 * required to let the OpenBSD tree build.
369 if (MDOC_Op
== p
->tok
)
375 if (MDOC_BODY
== p
->type
&& MDOC_Sh
== p
->tok
)
379 if (MDOC_Nd
== p
->tok
|| MDOC_Ss
== p
->tok
||
387 return(p
->end
|| (MDOC_BLOCK
== p
->type
&&
388 ! (MDOC_EXPLICIT
& mdoc_macros
[tok
].flags
)) ?
389 REWIND_MORE
: REWIND_LATER
);
394 rew_elem(struct mdoc
*mdoc
, enum mdoct tok
)
399 if (MDOC_ELEM
!= n
->type
)
401 assert(MDOC_ELEM
== n
->type
);
402 assert(tok
== n
->tok
);
404 return(rew_last(mdoc
, n
));
409 * We are trying to close a block identified by tok,
410 * but the child block *broken is still open.
411 * Thus, postpone closing the tok block
412 * until the rew_sub call closing *broken.
415 make_pending(struct mdoc_node
*broken
, enum mdoct tok
,
416 struct mdoc
*m
, int line
, int ppos
)
418 struct mdoc_node
*breaker
;
421 * Iterate backwards, searching for the block matching tok,
422 * that is, the block breaking the *broken block.
424 for (breaker
= broken
->parent
; breaker
; breaker
= breaker
->parent
) {
427 * If the *broken block had already been broken before
428 * and we encounter its breaker, make the tok block
429 * pending on the inner breaker.
430 * Graphically, "[A breaker=[B broken=[C->B B] tok=A] C]"
431 * becomes "[A broken=[B [C->B B] tok=A] C]"
432 * and finally "[A [B->A [C->B B] A] C]".
434 if (breaker
== broken
->pending
) {
439 if (REWIND_THIS
!= rew_dohalt(tok
, MDOC_BLOCK
, breaker
))
441 if (MDOC_BODY
== broken
->type
)
442 broken
= broken
->parent
;
446 * If another, outer breaker is already pending on
447 * the *broken block, we must not clobber the link
448 * to the outer breaker, but make it pending on the
449 * new, now inner breaker.
450 * Graphically, "[A breaker=[B broken=[C->A A] tok=B] C]"
451 * becomes "[A breaker=[B->A broken=[C A] tok=B] C]"
452 * and finally "[A [B->A [C->B A] B] C]".
454 if (broken
->pending
) {
455 struct mdoc_node
*taker
;
458 * If the breaker had also been broken before,
459 * it cannot take on the outer breaker itself,
460 * but must hand it on to its own breakers.
461 * Graphically, this is the following situation:
462 * "[A [B breaker=[C->B B] broken=[D->A A] tok=C] D]"
463 * "[A taker=[B->A breaker=[C->B B] [D->C A] C] D]"
466 while (taker
->pending
)
467 taker
= taker
->pending
;
468 taker
->pending
= broken
->pending
;
470 broken
->pending
= breaker
;
471 mdoc_vmsg(m
, MANDOCERR_SCOPE
, line
, ppos
, "%s breaks %s",
472 mdoc_macronames
[tok
], mdoc_macronames
[broken
->tok
]);
477 * Found no matching block for tok.
478 * Are you trying to close a block that is not open?
479 * XXX Make this non-fatal.
481 mdoc_pmsg(m
, line
, ppos
, MANDOCERR_SYNTNOSCOPE
);
487 rew_sub(enum mdoc_type t
, struct mdoc
*m
,
488 enum mdoct tok
, int line
, int ppos
)
494 switch (rew_dohalt(tok
, t
, n
)) {
503 return(make_pending(n
, tok
, m
, line
, ppos
));
505 /* XXX Make this non-fatal. */
506 mdoc_pmsg(m
, line
, ppos
, MANDOCERR_SYNTNOSCOPE
);
513 if ( ! rew_last(m
, n
))
517 * The current block extends an enclosing block.
518 * Now that the current block ends, close the enclosing block, too.
520 while (NULL
!= (n
= n
->pending
)) {
521 if ( ! rew_last(m
, n
))
523 if (MDOC_HEAD
== n
->type
&&
524 ! mdoc_body_alloc(m
, n
->line
, n
->pos
, n
->tok
))
533 append_delims(struct mdoc
*m
, int line
, int *pos
, char *buf
)
539 if ('\0' == buf
[*pos
])
544 ac
= mdoc_zargs(m
, line
, pos
, buf
, ARGS_NOWARN
, &p
);
546 if (ARGS_ERROR
== ac
)
548 else if (ARGS_EOLN
== ac
)
551 assert(DELIM_NONE
!= mdoc_isdelim(p
));
552 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
556 * If we encounter end-of-sentence symbols, then trigger
559 * XXX: it's easy to allow this to propagate outward to
560 * the last symbol, such that `. )' will cause the
561 * correct double-spacing. However, (1) groff isn't
562 * smart enough to do this and (2) it would require
563 * knowing which symbols break this behaviour, for
564 * example, `. ;' shouldn't propagate the double-space.
566 if (mandoc_eos(p
, strlen(p
)))
567 m
->last
->flags
|= MDOC_EOS
;
575 * Close out block partial/full explicit.
578 blk_exp_close(MACRO_PROT_ARGS
)
580 struct mdoc_node
*body
; /* Our own body. */
581 struct mdoc_node
*later
; /* A sub-block starting later. */
582 struct mdoc_node
*n
; /* For searching backwards. */
584 int j
, lastarg
, maxargs
, flushed
, nl
;
586 enum mdoct atok
, ntok
;
589 nl
= MDOC_NEWLINE
& m
->flags
;
601 * Search backwards for beginnings of blocks,
602 * both of our own and of pending sub-blocks.
606 for (n
= m
->last
; n
; n
= n
->parent
) {
607 if (MDOC_VALID
& n
->flags
)
610 /* Remember the start of our own body. */
611 if (MDOC_BODY
== n
->type
&& atok
== n
->tok
) {
617 if (MDOC_BLOCK
!= n
->type
)
619 if (atok
== n
->tok
) {
623 * Found the start of our own block.
624 * When there is no pending sub block,
625 * just proceed to closing out.
631 * When there is a pending sub block,
632 * postpone closing out the current block
633 * until the rew_sub() closing out the sub-block.
635 if ( ! make_pending(later
, tok
, m
, line
, ppos
))
639 * Mark the place where the formatting - but not
640 * the scope - of the current block ends.
642 if ( ! mdoc_endbody_alloc(m
, line
, ppos
,
643 atok
, body
, ENDBODY_SPACE
))
649 * When finding an open sub block, remember the last
650 * open explicit block, or, in case there are only
651 * implicit ones, the first open implicit block.
654 MDOC_EXPLICIT
& mdoc_macros
[later
->tok
].flags
)
656 if (MDOC_CALLABLE
& mdoc_macros
[n
->tok
].flags
) {
657 assert( ! (MDOC_ACTED
& n
->flags
));
662 if ( ! (MDOC_CALLABLE
& mdoc_macros
[tok
].flags
)) {
663 /* FIXME: do this in validate */
665 if ( ! mdoc_pmsg(m
, line
, ppos
, MANDOCERR_ARGSLOST
))
668 if ( ! rew_sub(MDOC_BODY
, m
, tok
, line
, ppos
))
670 return(rew_sub(MDOC_BLOCK
, m
, tok
, line
, ppos
));
673 if ( ! rew_sub(MDOC_BODY
, m
, tok
, line
, ppos
))
676 if (NULL
== later
&& maxargs
> 0)
677 if ( ! mdoc_tail_alloc(m
, line
, ppos
, rew_alt(tok
)))
680 for (flushed
= j
= 0; ; j
++) {
683 if (j
== maxargs
&& ! flushed
) {
684 if ( ! rew_sub(MDOC_BLOCK
, m
, tok
, line
, ppos
))
689 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
691 if (ARGS_ERROR
== ac
)
693 if (ARGS_PUNCT
== ac
)
698 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
700 if (MDOC_MAX
== ntok
) {
701 if ( ! mdoc_word_alloc(m
, line
, lastarg
, p
))
707 if ( ! rew_sub(MDOC_BLOCK
, m
, tok
, line
, ppos
))
711 if ( ! mdoc_macro(m
, ntok
, line
, lastarg
, pos
, buf
))
716 if ( ! flushed
&& ! rew_sub(MDOC_BLOCK
, m
, tok
, line
, ppos
))
721 return(append_delims(m
, line
, pos
, buf
));
726 in_line(MACRO_PROT_ARGS
)
728 int la
, scope
, cnt
, nc
, nl
;
733 struct mdoc_arg
*arg
;
736 nl
= MDOC_NEWLINE
& m
->flags
;
739 * Whether we allow ignored elements (those without content,
740 * usually because of reserved words) to squeak by.
762 for (arg
= NULL
;; ) {
764 av
= mdoc_argv(m
, line
, tok
, &arg
, pos
, buf
);
766 if (ARGV_WORD
== av
) {
779 for (cnt
= scope
= 0;; ) {
781 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
783 if (ARGS_ERROR
== ac
)
787 if (ARGS_PUNCT
== ac
)
790 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
793 * In this case, we've located a submacro and must
794 * execute it. Close out scope, if open. If no
795 * elements have been generated, either create one (nc)
796 * or raise a warning.
799 if (MDOC_MAX
!= ntok
) {
800 if (scope
&& ! rew_elem(m
, tok
))
802 if (nc
&& 0 == cnt
) {
803 if ( ! mdoc_elem_alloc(m
, line
, ppos
, tok
, arg
))
805 if ( ! rew_last(m
, m
->last
))
807 } else if ( ! nc
&& 0 == cnt
) {
809 if ( ! mdoc_pmsg(m
, line
, ppos
, MANDOCERR_MACROEMPTY
))
812 if ( ! mdoc_macro(m
, ntok
, line
, la
, pos
, buf
))
816 return(append_delims(m
, line
, pos
, buf
));
820 * Non-quote-enclosed punctuation. Set up our scope, if
821 * a word; rewind the scope, if a delimiter; then append
825 d
= ARGS_QWORD
== ac
? DELIM_NONE
: mdoc_isdelim(p
);
827 if (DELIM_NONE
!= d
) {
829 * If we encounter closing punctuation, no word
830 * has been omitted, no scope is open, and we're
831 * allowed to have an empty element, then start
832 * a new scope. `Ar', `Fl', and `Li', only do
833 * this once per invocation. There may be more
834 * of these (all of them?).
836 if (0 == cnt
&& (nc
|| MDOC_Li
== tok
) &&
837 DELIM_CLOSE
== d
&& ! scope
) {
838 if ( ! mdoc_elem_alloc(m
, line
, ppos
, tok
, arg
))
840 if (MDOC_Ar
== tok
|| MDOC_Li
== tok
||
846 * Close out our scope, if one is open, before
849 if (scope
&& ! rew_elem(m
, tok
))
852 } else if ( ! scope
) {
853 if ( ! mdoc_elem_alloc(m
, line
, ppos
, tok
, arg
))
860 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
864 * `Fl' macros have their scope re-opened with each new
865 * word so that the `-' can be added to each one without
866 * having to parse out spaces.
868 if (scope
&& MDOC_Fl
== tok
) {
869 if ( ! rew_elem(m
, tok
))
875 if (scope
&& ! rew_elem(m
, tok
))
879 * If no elements have been collected and we're allowed to have
880 * empties (nc), open a scope and close it out. Otherwise,
884 if (nc
&& 0 == cnt
) {
885 if ( ! mdoc_elem_alloc(m
, line
, ppos
, tok
, arg
))
887 if ( ! rew_last(m
, m
->last
))
889 } else if ( ! nc
&& 0 == cnt
) {
891 if ( ! mdoc_pmsg(m
, line
, ppos
, MANDOCERR_MACROEMPTY
))
897 return(append_delims(m
, line
, pos
, buf
));
902 blk_full(MACRO_PROT_ARGS
)
905 struct mdoc_arg
*arg
;
906 struct mdoc_node
*head
; /* save of head macro */
907 struct mdoc_node
*body
; /* save of body macro */
911 enum margserr ac
, lac
;
915 nl
= MDOC_NEWLINE
& m
->flags
;
917 /* Close out prior implicit scope. */
919 if ( ! (MDOC_EXPLICIT
& mdoc_macros
[tok
].flags
)) {
920 if ( ! rew_sub(MDOC_BODY
, m
, tok
, line
, ppos
))
922 if ( ! rew_sub(MDOC_BLOCK
, m
, tok
, line
, ppos
))
927 * This routine accommodates implicitly- and explicitly-scoped
928 * macro openings. Implicit ones first close out prior scope
929 * (seen above). Delay opening the head until necessary to
930 * allow leading punctuation to print. Special consideration
931 * for `It -column', which has phrase-part syntax instead of
932 * regular child nodes.
935 for (arg
= NULL
;; ) {
937 av
= mdoc_argv(m
, line
, tok
, &arg
, pos
, buf
);
939 if (ARGV_WORD
== av
) {
953 if ( ! mdoc_block_alloc(m
, line
, ppos
, tok
, arg
))
959 * The `Nd' macro has all arguments in its body: it's a hybrid
960 * of block partial-explicit and full-implicit. Stupid.
963 if (MDOC_Nd
== tok
) {
964 if ( ! mdoc_head_alloc(m
, line
, ppos
, tok
))
967 if ( ! rew_sub(MDOC_HEAD
, m
, tok
, line
, ppos
))
969 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
978 /* Initialise last-phrase-type with ARGS_PEND. */
979 lac
= ARGS_ERROR
== ac
? ARGS_PEND
: ac
;
980 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
982 if (ARGS_ERROR
== ac
)
985 if (ARGS_EOLN
== ac
) {
986 if (ARGS_PPHRASE
!= lac
&& ARGS_PHRASE
!= lac
)
989 * This is necessary: if the last token on a
990 * line is a `Ta' or tab, then we'll get
991 * ARGS_EOLN, so we must be smart enough to
992 * reopen our scope if the last parse was a
993 * phrase or partial phrase.
995 if ( ! rew_sub(MDOC_BODY
, m
, tok
, line
, ppos
))
997 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1004 * Emit leading punctuation (i.e., punctuation before
1005 * the MDOC_HEAD) for non-phrase types.
1010 ARGS_PHRASE
!= ac
&&
1011 ARGS_PPHRASE
!= ac
&&
1013 DELIM_OPEN
== mdoc_isdelim(p
)) {
1014 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1019 /* Open a head if one hasn't been opened. */
1022 if ( ! mdoc_head_alloc(m
, line
, ppos
, tok
))
1027 if (ARGS_PHRASE
== ac
||
1029 ARGS_PPHRASE
== ac
) {
1031 * If we haven't opened a body yet, rewind the
1032 * head; if we have, rewind that instead.
1035 mtt
= body
? MDOC_BODY
: MDOC_HEAD
;
1036 if ( ! rew_sub(mtt
, m
, tok
, line
, ppos
))
1039 /* Then allocate our body context. */
1041 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1046 * Process phrases: set whether we're in a
1047 * partial-phrase (this affects line handling)
1048 * then call down into the phrase parser.
1051 if (ARGS_PPHRASE
== ac
)
1052 m
->flags
|= MDOC_PPHRASE
;
1053 if (ARGS_PEND
== ac
&& ARGS_PPHRASE
== lac
)
1054 m
->flags
|= MDOC_PPHRASE
;
1056 if ( ! phrase(m
, line
, la
, buf
))
1059 m
->flags
&= ~MDOC_PPHRASE
;
1063 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
1065 if (MDOC_MAX
== ntok
) {
1066 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1071 if ( ! mdoc_macro(m
, ntok
, line
, la
, pos
, buf
))
1077 if ( ! mdoc_head_alloc(m
, line
, ppos
, tok
))
1082 if (nl
&& ! append_delims(m
, line
, pos
, buf
))
1085 /* If we've already opened our body, exit now. */
1091 * If there is an open (i.e., unvalidated) sub-block requiring
1092 * explicit close-out, postpone switching the current block from
1093 * head to body until the rew_sub() call closing out that
1096 for (n
= m
->last
; n
&& n
!= head
; n
= n
->parent
) {
1097 if (MDOC_BLOCK
== n
->type
&&
1098 MDOC_EXPLICIT
& mdoc_macros
[n
->tok
].flags
&&
1099 ! (MDOC_VALID
& n
->flags
)) {
1100 assert( ! (MDOC_ACTED
& n
->flags
));
1106 /* Close out scopes to remain in a consistent state. */
1108 if ( ! rew_sub(MDOC_HEAD
, m
, tok
, line
, ppos
))
1110 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1114 if ( ! (MDOC_FREECOL
& m
->flags
))
1117 if ( ! rew_sub(MDOC_BODY
, m
, tok
, line
, ppos
))
1119 if ( ! rew_sub(MDOC_BLOCK
, m
, tok
, line
, ppos
))
1122 m
->flags
&= ~MDOC_FREECOL
;
1128 blk_part_imp(MACRO_PROT_ARGS
)
1134 struct mdoc_node
*blk
; /* saved block context */
1135 struct mdoc_node
*body
; /* saved body context */
1136 struct mdoc_node
*n
;
1138 nl
= MDOC_NEWLINE
& m
->flags
;
1141 * A macro that spans to the end of the line. This is generally
1142 * (but not necessarily) called as the first macro. The block
1143 * has a head as the immediate child, which is always empty,
1144 * followed by zero or more opening punctuation nodes, then the
1145 * body (which may be empty, depending on the macro), then zero
1146 * or more closing punctuation nodes.
1149 if ( ! mdoc_block_alloc(m
, line
, ppos
, tok
, NULL
))
1154 if ( ! mdoc_head_alloc(m
, line
, ppos
, tok
))
1156 if ( ! rew_sub(MDOC_HEAD
, m
, tok
, line
, ppos
))
1160 * Open the body scope "on-demand", that is, after we've
1161 * processed all of the leading delimiters (open parenthesis,
1165 for (body
= NULL
; ; ) {
1167 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
1169 if (ARGS_ERROR
== ac
)
1171 if (ARGS_EOLN
== ac
)
1173 if (ARGS_PUNCT
== ac
)
1176 if (NULL
== body
&& ARGS_QWORD
!= ac
&&
1177 DELIM_OPEN
== mdoc_isdelim(p
)) {
1178 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1184 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1189 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
1191 if (MDOC_MAX
== ntok
) {
1192 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1197 if ( ! mdoc_macro(m
, ntok
, line
, la
, pos
, buf
))
1202 /* Clean-ups to leave in a consistent state. */
1205 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1210 for (n
= body
->child
; n
&& n
->next
; n
= n
->next
)
1214 * End of sentence spacing: if the last node is a text node and
1215 * has a trailing period, then mark it as being end-of-sentence.
1218 if (n
&& MDOC_TEXT
== n
->type
&& n
->string
)
1219 if (mandoc_eos(n
->string
, strlen(n
->string
)))
1220 n
->flags
|= MDOC_EOS
;
1222 /* Up-propagate the end-of-sentence flag. */
1224 if (n
&& (MDOC_EOS
& n
->flags
)) {
1225 body
->flags
|= MDOC_EOS
;
1226 body
->parent
->flags
|= MDOC_EOS
;
1230 * If there is an open sub-block requiring explicit close-out,
1231 * postpone closing out the current block
1232 * until the rew_sub() call closing out the sub-block.
1234 for (n
= m
->last
; n
&& n
!= body
&& n
!= blk
->parent
; n
= n
->parent
) {
1235 if (MDOC_BLOCK
== n
->type
&&
1236 MDOC_EXPLICIT
& mdoc_macros
[n
->tok
].flags
&&
1237 ! (MDOC_VALID
& n
->flags
)) {
1238 assert( ! (MDOC_ACTED
& n
->flags
));
1239 if ( ! make_pending(n
, tok
, m
, line
, ppos
))
1241 if ( ! mdoc_endbody_alloc(m
, line
, ppos
,
1242 tok
, body
, ENDBODY_NOSPACE
))
1249 * If we can't rewind to our body, then our scope has already
1250 * been closed by another macro (like `Oc' closing `Op'). This
1251 * is ugly behaviour nodding its head to OpenBSD's overwhelmingly
1252 * crufty use of `Op' breakage.
1254 if (n
!= body
&& ! mdoc_vmsg(m
, MANDOCERR_SCOPE
, line
, ppos
,
1255 "%s broken", mdoc_macronames
[tok
]))
1258 if (n
&& ! rew_sub(MDOC_BODY
, m
, tok
, line
, ppos
))
1261 /* Standard appending of delimiters. */
1263 if (nl
&& ! append_delims(m
, line
, pos
, buf
))
1266 /* Rewind scope, if applicable. */
1268 if (n
&& ! rew_sub(MDOC_BLOCK
, m
, tok
, line
, ppos
))
1276 blk_part_exp(MACRO_PROT_ARGS
)
1280 struct mdoc_node
*head
; /* keep track of head */
1281 struct mdoc_node
*body
; /* keep track of body */
1285 nl
= MDOC_NEWLINE
& m
->flags
;
1288 * The opening of an explicit macro having zero or more leading
1289 * punctuation nodes; a head with optional single element (the
1290 * case of `Eo'); and a body that may be empty.
1293 if ( ! mdoc_block_alloc(m
, line
, ppos
, tok
, NULL
))
1296 for (head
= body
= NULL
; ; ) {
1298 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
1300 if (ARGS_ERROR
== ac
)
1302 if (ARGS_PUNCT
== ac
)
1304 if (ARGS_EOLN
== ac
)
1307 /* Flush out leading punctuation. */
1309 if (NULL
== head
&& ARGS_QWORD
!= ac
&&
1310 DELIM_OPEN
== mdoc_isdelim(p
)) {
1311 assert(NULL
== body
);
1312 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1318 assert(NULL
== body
);
1319 if ( ! mdoc_head_alloc(m
, line
, ppos
, tok
))
1325 * `Eo' gobbles any data into the head, but most other
1326 * macros just immediately close out and begin the body.
1331 /* No check whether it's a macro! */
1333 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1336 if ( ! rew_sub(MDOC_HEAD
, m
, tok
, line
, ppos
))
1338 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1346 assert(NULL
!= head
&& NULL
!= body
);
1348 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
1350 if (MDOC_MAX
== ntok
) {
1351 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1356 if ( ! mdoc_macro(m
, ntok
, line
, la
, pos
, buf
))
1361 /* Clean-up to leave in a consistent state. */
1364 if ( ! mdoc_head_alloc(m
, line
, ppos
, tok
))
1370 if ( ! rew_sub(MDOC_HEAD
, m
, tok
, line
, ppos
))
1372 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1377 /* Standard appending of delimiters. */
1381 return(append_delims(m
, line
, pos
, buf
));
1387 in_line_argn(MACRO_PROT_ARGS
)
1389 int la
, flushed
, j
, maxargs
, nl
;
1392 struct mdoc_arg
*arg
;
1396 nl
= MDOC_NEWLINE
& m
->flags
;
1399 * A line macro that has a fixed number of arguments (maxargs).
1400 * Only open the scope once the first non-leading-punctuation is
1401 * found (unless MDOC_IGNDELIM is noted, like in `Pf'), then
1402 * keep it open until the maximum number of arguments are
1424 for (arg
= NULL
; ; ) {
1426 av
= mdoc_argv(m
, line
, tok
, &arg
, pos
, buf
);
1428 if (ARGV_WORD
== av
) {
1433 if (ARGV_EOLN
== av
)
1438 mdoc_argv_free(arg
);
1442 for (flushed
= j
= 0; ; ) {
1444 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
1446 if (ARGS_ERROR
== ac
)
1448 if (ARGS_PUNCT
== ac
)
1450 if (ARGS_EOLN
== ac
)
1453 if ( ! (MDOC_IGNDELIM
& mdoc_macros
[tok
].flags
) &&
1455 0 == j
&& DELIM_OPEN
== mdoc_isdelim(p
)) {
1456 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1460 if ( ! mdoc_elem_alloc(m
, line
, la
, tok
, arg
))
1463 if (j
== maxargs
&& ! flushed
) {
1464 if ( ! rew_elem(m
, tok
))
1469 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
1471 if (MDOC_MAX
!= ntok
) {
1472 if ( ! flushed
&& ! rew_elem(m
, tok
))
1475 if ( ! mdoc_macro(m
, ntok
, line
, la
, pos
, buf
))
1481 if ( ! (MDOC_IGNDELIM
& mdoc_macros
[tok
].flags
) &&
1484 DELIM_NONE
!= mdoc_isdelim(p
)) {
1485 if ( ! rew_elem(m
, tok
))
1491 * XXX: this is a hack to work around groff's ugliness
1492 * as regards `Xr' and extraneous arguments. It should
1493 * ideally be deprecated behaviour, but because this
1494 * code is now here, it's unlikely to be removed.
1498 if (MDOC_Xr
== tok
&& j
== maxargs
) {
1499 if ( ! mdoc_elem_alloc(m
, line
, la
, MDOC_Ns
, NULL
))
1501 if ( ! rew_elem(m
, MDOC_Ns
))
1506 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1511 if (0 == j
&& ! mdoc_elem_alloc(m
, line
, la
, tok
, arg
))
1514 /* Close out in a consistent state. */
1516 if ( ! flushed
&& ! rew_elem(m
, tok
))
1520 return(append_delims(m
, line
, pos
, buf
));
1525 in_line_eoln(MACRO_PROT_ARGS
)
1530 struct mdoc_arg
*arg
;
1534 assert( ! (MDOC_PARSED
& mdoc_macros
[tok
].flags
));
1536 /* Parse macro arguments. */
1538 for (arg
= NULL
; ; ) {
1540 av
= mdoc_argv(m
, line
, tok
, &arg
, pos
, buf
);
1542 if (ARGV_WORD
== av
) {
1546 if (ARGV_EOLN
== av
)
1551 mdoc_argv_free(arg
);
1555 /* Open element scope. */
1557 if ( ! mdoc_elem_alloc(m
, line
, ppos
, tok
, arg
))
1560 /* Parse argument terms. */
1564 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
1566 if (ARGS_ERROR
== ac
)
1568 if (ARGS_EOLN
== ac
)
1571 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
1573 if (MDOC_MAX
== ntok
) {
1574 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1579 if ( ! rew_elem(m
, tok
))
1581 return(mdoc_macro(m
, ntok
, line
, la
, pos
, buf
));
1584 /* Close out (no delimiters). */
1586 return(rew_elem(m
, tok
));
1592 ctx_synopsis(MACRO_PROT_ARGS
)
1596 nl
= MDOC_NEWLINE
& m
->flags
;
1598 /* If we're not in the SYNOPSIS, go straight to in-line. */
1599 if (SEC_SYNOPSIS
!= m
->lastsec
)
1600 return(in_line(m
, tok
, line
, ppos
, pos
, buf
));
1602 /* If we're a nested call, same place. */
1604 return(in_line(m
, tok
, line
, ppos
, pos
, buf
));
1607 * XXX: this will open a block scope; however, if later we end
1608 * up formatting the block scope, then child nodes will inherit
1609 * the formatting. Be careful.
1612 return(blk_part_imp(m
, tok
, line
, ppos
, pos
, buf
));
1618 obsolete(MACRO_PROT_ARGS
)
1621 return(mdoc_pmsg(m
, line
, ppos
, MANDOCERR_MACROOBS
));
1626 * Phrases occur within `Bl -column' entries, separated by `Ta' or tabs.
1627 * They're unusual because they're basically free-form text until a
1628 * macro is encountered.
1631 phrase(struct mdoc
*m
, int line
, int ppos
, char *buf
)
1638 for (pos
= ppos
; ; ) {
1641 ac
= mdoc_zargs(m
, line
, &pos
, buf
, 0, &p
);
1643 if (ARGS_ERROR
== ac
)
1645 if (ARGS_EOLN
== ac
)
1648 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup_raw(p
);
1650 if (MDOC_MAX
== ntok
) {
1651 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1656 if ( ! mdoc_macro(m
, ntok
, line
, la
, &pos
, buf
))
1658 return(append_delims(m
, line
, &pos
, buf
));
1667 phrase_ta(MACRO_PROT_ARGS
)
1675 * FIXME: this is overly restrictive: if the `Ta' is unexpected,
1676 * it should simply error out with ARGSLOST.
1679 if ( ! rew_sub(MDOC_BODY
, m
, MDOC_It
, line
, ppos
))
1681 if ( ! mdoc_body_alloc(m
, line
, ppos
, MDOC_It
))
1686 ac
= mdoc_zargs(m
, line
, pos
, buf
, 0, &p
);
1688 if (ARGS_ERROR
== ac
)
1690 if (ARGS_EOLN
== ac
)
1693 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup_raw(p
);
1695 if (MDOC_MAX
== ntok
) {
1696 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1701 if ( ! mdoc_macro(m
, ntok
, line
, la
, pos
, buf
))
1703 return(append_delims(m
, line
, pos
, buf
));