]>
git.cameronkatri.com Git - mandoc.git/blob - mdoc_macro.c
51c852a012421a80852e818e7cc6bcd006ea34ab
1 /* $Id: mdoc_macro.c,v 1.82 2010/06/27 15:52:41 kristaps Exp $ */
3 * Copyright (c) 2008, 2009 Kristaps Dzonsons <kristaps@bsd.lv>
5 * Permission to use, copy, modify, and distribute this software for any
6 * purpose with or without fee is hereby granted, provided that the above
7 * copyright notice and this permission notice appear in all copies.
9 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
10 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
11 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
12 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
13 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
14 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
15 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
30 #include "libmandoc.h"
38 static int blk_full(MACRO_PROT_ARGS
);
39 static int blk_exp_close(MACRO_PROT_ARGS
);
40 static int blk_part_exp(MACRO_PROT_ARGS
);
41 static int blk_part_imp(MACRO_PROT_ARGS
);
42 static int ctx_synopsis(MACRO_PROT_ARGS
);
43 static int in_line_eoln(MACRO_PROT_ARGS
);
44 static int in_line_argn(MACRO_PROT_ARGS
);
45 static int in_line(MACRO_PROT_ARGS
);
46 static int obsolete(MACRO_PROT_ARGS
);
47 static int phrase_ta(MACRO_PROT_ARGS
);
49 static int append_delims(struct mdoc
*,
51 static enum mdoct
lookup(enum mdoct
, const char *);
52 static enum mdoct
lookup_raw(const char *);
53 static int phrase(struct mdoc
*, int, int, char *);
54 static enum mdoct
rew_alt(enum mdoct
);
55 static int rew_dobreak(enum mdoct
,
56 const struct mdoc_node
*);
57 static enum rew
rew_dohalt(enum mdoct
, enum mdoc_type
,
58 const struct mdoc_node
*);
59 static int rew_elem(struct mdoc
*, enum mdoct
);
60 static int rew_last(struct mdoc
*,
61 const struct mdoc_node
*);
62 static int rew_sub(enum mdoc_type
, struct mdoc
*,
63 enum mdoct
, int, int);
64 static int swarn(struct mdoc
*, enum mdoc_type
, int,
65 int, const struct mdoc_node
*);
67 const struct mdoc_macro __mdoc_macros
[MDOC_MAX
] = {
68 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ap */
69 { in_line_eoln
, MDOC_PROLOGUE
}, /* Dd */
70 { in_line_eoln
, MDOC_PROLOGUE
}, /* Dt */
71 { in_line_eoln
, MDOC_PROLOGUE
}, /* Os */
72 { blk_full
, 0 }, /* Sh */
73 { blk_full
, 0 }, /* Ss */
74 { in_line_eoln
, 0 }, /* Pp */
75 { blk_part_imp
, MDOC_PARSED
}, /* D1 */
76 { blk_part_imp
, MDOC_PARSED
}, /* Dl */
77 { blk_full
, MDOC_EXPLICIT
}, /* Bd */
78 { blk_exp_close
, MDOC_EXPLICIT
}, /* Ed */
79 { blk_full
, MDOC_EXPLICIT
}, /* Bl */
80 { blk_exp_close
, MDOC_EXPLICIT
}, /* El */
81 { blk_full
, MDOC_PARSED
}, /* It */
82 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ad */
83 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* An */
84 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ar */
85 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Cd */
86 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Cm */
87 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Dv */
88 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Er */
89 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ev */
90 { in_line_eoln
, 0 }, /* Ex */
91 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Fa */
92 { in_line_eoln
, 0 }, /* Fd */
93 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Fl */
94 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Fn */
95 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ft */
96 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ic */
97 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* In */
98 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Li */
99 { blk_full
, 0 }, /* Nd */
100 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Nm */
101 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Op */
102 { obsolete
, 0 }, /* Ot */
103 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Pa */
104 { in_line_eoln
, 0 }, /* Rv */
105 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* St */
106 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Va */
107 { ctx_synopsis
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Vt */
108 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Xr */
109 { in_line_eoln
, 0 }, /* %A */
110 { in_line_eoln
, 0 }, /* %B */
111 { in_line_eoln
, 0 }, /* %D */
112 { in_line_eoln
, 0 }, /* %I */
113 { in_line_eoln
, 0 }, /* %J */
114 { in_line_eoln
, 0 }, /* %N */
115 { in_line_eoln
, 0 }, /* %O */
116 { in_line_eoln
, 0 }, /* %P */
117 { in_line_eoln
, 0 }, /* %R */
118 { in_line_eoln
, 0 }, /* %T */
119 { in_line_eoln
, 0 }, /* %V */
120 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Ac */
121 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Ao */
122 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Aq */
123 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* At */
124 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Bc */
125 { blk_full
, MDOC_EXPLICIT
}, /* Bf */
126 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Bo */
127 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Bq */
128 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Bsx */
129 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Bx */
130 { in_line_eoln
, 0 }, /* Db */
131 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Dc */
132 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Do */
133 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Dq */
134 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Ec */
135 { blk_exp_close
, MDOC_EXPLICIT
}, /* Ef */
136 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Em */
137 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Eo */
138 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Fx */
139 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ms */
140 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* No */
141 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ns */
142 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Nx */
143 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ox */
144 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Pc */
145 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_IGNDELIM
}, /* Pf */
146 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Po */
147 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Pq */
148 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Qc */
149 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ql */
150 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Qo */
151 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Qq */
152 { blk_exp_close
, MDOC_EXPLICIT
}, /* Re */
153 { blk_full
, MDOC_EXPLICIT
}, /* Rs */
154 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Sc */
155 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* So */
156 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Sq */
157 { in_line_eoln
, 0 }, /* Sm */
158 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Sx */
159 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Sy */
160 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Tn */
161 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ux */
162 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Xc */
163 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Xo */
164 { blk_full
, MDOC_EXPLICIT
| MDOC_CALLABLE
}, /* Fo */
165 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Fc */
166 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Oo */
167 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Oc */
168 { blk_full
, MDOC_EXPLICIT
}, /* Bk */
169 { blk_exp_close
, MDOC_EXPLICIT
}, /* Ek */
170 { in_line_eoln
, 0 }, /* Bt */
171 { in_line_eoln
, 0 }, /* Hf */
172 { obsolete
, 0 }, /* Fr */
173 { in_line_eoln
, 0 }, /* Ud */
174 { in_line
, 0 }, /* Lb */
175 { in_line_eoln
, 0 }, /* Lp */
176 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Lk */
177 { in_line
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Mt */
178 { blk_part_imp
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Brq */
179 { blk_part_exp
, MDOC_CALLABLE
| MDOC_PARSED
| MDOC_EXPLICIT
}, /* Bro */
180 { blk_exp_close
, MDOC_EXPLICIT
| MDOC_CALLABLE
| MDOC_PARSED
}, /* Brc */
181 { in_line_eoln
, 0 }, /* %C */
182 { obsolete
, 0 }, /* Es */
183 { obsolete
, 0 }, /* En */
184 { in_line_argn
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Dx */
185 { in_line_eoln
, 0 }, /* %Q */
186 { in_line_eoln
, 0 }, /* br */
187 { in_line_eoln
, 0 }, /* sp */
188 { in_line_eoln
, 0 }, /* %U */
189 { phrase_ta
, MDOC_CALLABLE
| MDOC_PARSED
}, /* Ta */
192 const struct mdoc_macro
* const mdoc_macros
= __mdoc_macros
;
196 swarn(struct mdoc
*mdoc
, enum mdoc_type type
,
197 int line
, int pos
, const struct mdoc_node
*p
)
199 const char *n
, *t
, *tt
;
218 n
= mdoc_macronames
[p
->tok
];
222 n
= mdoc_macronames
[p
->tok
];
226 n
= mdoc_macronames
[p
->tok
];
233 ec
= (MDOC_IGN_SCOPE
& mdoc
->pflags
) ?
234 MANDOCERR_SCOPE
: MANDOCERR_SYNTSCOPE
;
236 return(mdoc_vmsg(mdoc
, ec
, line
, pos
,
237 "%s scope breaks %s of %s",
243 * This is called at the end of parsing. It must traverse up the tree,
244 * closing out open [implicit] scopes. Obviously, open explicit scopes
248 mdoc_macroend(struct mdoc
*m
)
252 /* Scan for open explicit scopes. */
254 n
= MDOC_VALID
& m
->last
->flags
? m
->last
->parent
: m
->last
;
256 for ( ; n
; n
= n
->parent
) {
257 if (MDOC_BLOCK
!= n
->type
)
259 if ( ! (MDOC_EXPLICIT
& mdoc_macros
[n
->tok
].flags
))
261 mdoc_nmsg(m
, n
, MANDOCERR_SYNTSCOPE
);
265 /* Rewind to the first. */
267 return(rew_last(m
, m
->first
));
272 * Look up a macro from within a subsequent context.
275 lookup(enum mdoct from
, const char *p
)
277 /* FIXME: make -diag lists be un-PARSED. */
279 if ( ! (MDOC_PARSED
& mdoc_macros
[from
].flags
))
281 return(lookup_raw(p
));
286 * Lookup a macro following the initial line macro.
289 lookup_raw(const char *p
)
293 if (MDOC_MAX
== (res
= mdoc_hash_find(p
)))
295 if (MDOC_CALLABLE
& mdoc_macros
[res
].flags
)
302 rew_last(struct mdoc
*mdoc
, const struct mdoc_node
*to
)
306 mdoc
->next
= MDOC_NEXT_SIBLING
;
309 while (mdoc
->last
!= to
) {
310 if ( ! mdoc_valid_post(mdoc
))
312 if ( ! mdoc_action_post(mdoc
))
314 mdoc
->last
= mdoc
->last
->parent
;
318 if ( ! mdoc_valid_post(mdoc
))
320 return(mdoc_action_post(mdoc
));
325 * Return the opening macro of a closing one, e.g., `Ec' has `Eo' as its
329 rew_alt(enum mdoct tok
)
373 * Rewind rules. This indicates whether to stop rewinding
374 * (REWIND_HALT) without touching our current scope, stop rewinding and
375 * close our current scope (REWIND_REWIND), or continue (REWIND_NOHALT).
376 * The scope-closing and so on occurs in the various rew_* routines.
379 rew_dohalt(enum mdoct tok
, enum mdoc_type type
,
380 const struct mdoc_node
*p
)
383 if (MDOC_ROOT
== p
->type
)
385 if (MDOC_VALID
& p
->flags
)
386 return(REWIND_NOHALT
);
412 assert(MDOC_TAIL
!= type
);
413 if (type
== p
->type
&& tok
== p
->tok
)
414 return(REWIND_REWIND
);
417 assert(MDOC_TAIL
!= type
);
418 if (type
== p
->type
&& tok
== p
->tok
)
419 return(REWIND_REWIND
);
420 if (MDOC_BODY
== p
->type
&& MDOC_Bl
== p
->tok
)
424 if (type
== p
->type
&& tok
== p
->tok
)
425 return(REWIND_REWIND
);
430 assert(MDOC_TAIL
!= type
);
431 if (type
== p
->type
&& tok
== p
->tok
)
432 return(REWIND_REWIND
);
433 if (MDOC_BODY
== p
->type
&& MDOC_Sh
== p
->tok
)
467 if (type
== p
->type
&& tok
== p
->tok
)
468 return(REWIND_REWIND
);
470 /* Multi-line explicit scope close. */
502 if (type
== p
->type
&& rew_alt(tok
) == p
->tok
)
503 return(REWIND_REWIND
);
510 return(REWIND_NOHALT
);
515 * See if we can break an encountered scope (the rew_dohalt has returned
519 rew_dobreak(enum mdoct tok
, const struct mdoc_node
*p
)
522 assert(MDOC_ROOT
!= p
->type
);
523 if (MDOC_ELEM
== p
->type
)
525 if (MDOC_TEXT
== p
->type
)
527 if (MDOC_VALID
& p
->flags
)
532 return(MDOC_It
== p
->tok
);
534 return(MDOC_Nd
== p
->tok
);
536 return(MDOC_Ss
== p
->tok
);
538 if (MDOC_Nd
== p
->tok
)
540 if (MDOC_Ss
== p
->tok
)
542 return(MDOC_Sh
== p
->tok
);
544 if (MDOC_It
== p
->tok
)
548 if (MDOC_Op
== p
->tok
)
555 if (MDOC_EXPLICIT
& mdoc_macros
[tok
].flags
)
556 return(p
->tok
== rew_alt(tok
));
557 else if (MDOC_BLOCK
== p
->type
)
560 return(tok
== p
->tok
);
565 rew_elem(struct mdoc
*mdoc
, enum mdoct tok
)
570 if (MDOC_ELEM
!= n
->type
)
572 assert(MDOC_ELEM
== n
->type
);
573 assert(tok
== n
->tok
);
575 return(rew_last(mdoc
, n
));
580 rew_sub(enum mdoc_type t
, struct mdoc
*m
,
581 enum mdoct tok
, int line
, int ppos
)
587 for (n
= m
->last
; n
; n
= n
->parent
) {
588 c
= rew_dohalt(tok
, t
, n
);
589 if (REWIND_HALT
== c
) {
592 if ( ! (MDOC_EXPLICIT
& mdoc_macros
[tok
].flags
))
594 /* FIXME: shouldn't raise an error */
595 mdoc_pmsg(m
, line
, ppos
, MANDOCERR_SYNTNOSCOPE
);
598 if (REWIND_REWIND
== c
)
600 else if (rew_dobreak(tok
, n
))
602 if ( ! swarn(m
, t
, line
, ppos
, n
))
607 if ( ! rew_last(m
, n
))
611 * The current block extends an enclosing block beyond a line
612 * break. Now that the current block ends, close the enclosing
615 if (NULL
!= (n
= n
->pending
)) {
616 assert(MDOC_HEAD
== n
->type
);
617 if ( ! rew_last(m
, n
))
619 if ( ! mdoc_body_alloc(m
, n
->line
, n
->pos
, n
->tok
))
628 append_delims(struct mdoc
*m
, int line
, int *pos
, char *buf
)
634 if ('\0' == buf
[*pos
])
639 ac
= mdoc_zargs(m
, line
, pos
, buf
, ARGS_NOWARN
, &p
);
641 if (ARGS_ERROR
== ac
)
643 else if (ARGS_EOLN
== ac
)
646 assert(DELIM_NONE
!= mdoc_isdelim(p
));
647 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
651 * If we encounter end-of-sentence symbols, then trigger
654 * XXX: it's easy to allow this to propagate outward to
655 * the last symbol, such that `. )' will cause the
656 * correct double-spacing. However, (1) groff isn't
657 * smart enough to do this and (2) it would require
658 * knowing which symbols break this behaviour, for
659 * example, `. ;' shouldn't propagate the double-space.
661 if (mandoc_eos(p
, strlen(p
)))
662 m
->last
->flags
|= MDOC_EOS
;
670 * Close out block partial/full explicit.
673 blk_exp_close(MACRO_PROT_ARGS
)
675 int j
, lastarg
, maxargs
, flushed
, nl
;
680 nl
= MDOC_NEWLINE
& m
->flags
;
691 if ( ! (MDOC_CALLABLE
& mdoc_macros
[tok
].flags
)) {
692 /* FIXME: do this in validate */
694 if ( ! mdoc_pmsg(m
, line
, ppos
, MANDOCERR_ARGSLOST
))
697 if ( ! rew_sub(MDOC_BODY
, m
, tok
, line
, ppos
))
699 return(rew_sub(MDOC_BLOCK
, m
, tok
, line
, ppos
));
702 if ( ! rew_sub(MDOC_BODY
, m
, tok
, line
, ppos
))
706 if ( ! mdoc_tail_alloc(m
, line
, ppos
, rew_alt(tok
)))
709 for (flushed
= j
= 0; ; j
++) {
712 if (j
== maxargs
&& ! flushed
) {
713 if ( ! rew_sub(MDOC_BLOCK
, m
, tok
, line
, ppos
))
718 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
720 if (ARGS_ERROR
== ac
)
722 if (ARGS_PUNCT
== ac
)
727 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
729 if (MDOC_MAX
== ntok
) {
730 if ( ! mdoc_word_alloc(m
, line
, lastarg
, p
))
736 if ( ! rew_sub(MDOC_BLOCK
, m
, tok
, line
, ppos
))
740 if ( ! mdoc_macro(m
, ntok
, line
, lastarg
, pos
, buf
))
745 if ( ! flushed
&& ! rew_sub(MDOC_BLOCK
, m
, tok
, line
, ppos
))
750 return(append_delims(m
, line
, pos
, buf
));
755 in_line(MACRO_PROT_ARGS
)
757 int la
, scope
, cnt
, nc
, nl
;
762 struct mdoc_arg
*arg
;
765 nl
= MDOC_NEWLINE
& m
->flags
;
768 * Whether we allow ignored elements (those without content,
769 * usually because of reserved words) to squeak by.
791 for (arg
= NULL
;; ) {
793 av
= mdoc_argv(m
, line
, tok
, &arg
, pos
, buf
);
795 if (ARGV_WORD
== av
) {
808 for (cnt
= scope
= 0;; ) {
810 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
812 if (ARGS_ERROR
== ac
)
816 if (ARGS_PUNCT
== ac
)
819 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
822 * In this case, we've located a submacro and must
823 * execute it. Close out scope, if open. If no
824 * elements have been generated, either create one (nc)
825 * or raise a warning.
828 if (MDOC_MAX
!= ntok
) {
829 if (scope
&& ! rew_elem(m
, tok
))
831 if (nc
&& 0 == cnt
) {
832 if ( ! mdoc_elem_alloc(m
, line
, ppos
, tok
, arg
))
834 if ( ! rew_last(m
, m
->last
))
836 } else if ( ! nc
&& 0 == cnt
) {
838 if ( ! mdoc_pmsg(m
, line
, ppos
, MANDOCERR_MACROEMPTY
))
841 if ( ! mdoc_macro(m
, ntok
, line
, la
, pos
, buf
))
845 return(append_delims(m
, line
, pos
, buf
));
849 * Non-quote-enclosed punctuation. Set up our scope, if
850 * a word; rewind the scope, if a delimiter; then append
854 d
= ARGS_QWORD
== ac
? DELIM_NONE
: mdoc_isdelim(p
);
856 if (DELIM_NONE
!= d
) {
858 * If we encounter closing punctuation, no word
859 * has been omitted, no scope is open, and we're
860 * allowed to have an empty element, then start
861 * a new scope. `Ar', `Fl', and `Li', only do
862 * this once per invocation. There may be more
863 * of these (all of them?).
865 if (0 == cnt
&& (nc
|| MDOC_Li
== tok
) &&
866 DELIM_CLOSE
== d
&& ! scope
) {
867 if ( ! mdoc_elem_alloc(m
, line
, ppos
, tok
, arg
))
869 if (MDOC_Ar
== tok
|| MDOC_Li
== tok
||
875 * Close out our scope, if one is open, before
878 if (scope
&& ! rew_elem(m
, tok
))
881 } else if ( ! scope
) {
882 if ( ! mdoc_elem_alloc(m
, line
, ppos
, tok
, arg
))
889 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
893 * `Fl' macros have their scope re-opened with each new
894 * word so that the `-' can be added to each one without
895 * having to parse out spaces.
897 if (scope
&& MDOC_Fl
== tok
) {
898 if ( ! rew_elem(m
, tok
))
904 if (scope
&& ! rew_elem(m
, tok
))
908 * If no elements have been collected and we're allowed to have
909 * empties (nc), open a scope and close it out. Otherwise,
913 if (nc
&& 0 == cnt
) {
914 if ( ! mdoc_elem_alloc(m
, line
, ppos
, tok
, arg
))
916 if ( ! rew_last(m
, m
->last
))
918 } else if ( ! nc
&& 0 == cnt
) {
920 if ( ! mdoc_pmsg(m
, line
, ppos
, MANDOCERR_MACROEMPTY
))
926 return(append_delims(m
, line
, pos
, buf
));
931 blk_full(MACRO_PROT_ARGS
)
934 struct mdoc_arg
*arg
;
935 struct mdoc_node
*head
; /* save of head macro */
936 struct mdoc_node
*body
; /* save of body macro */
940 enum margserr ac
, lac
;
944 nl
= MDOC_NEWLINE
& m
->flags
;
946 /* Close out prior implicit scope. */
948 if ( ! (MDOC_EXPLICIT
& mdoc_macros
[tok
].flags
)) {
949 if ( ! rew_sub(MDOC_BODY
, m
, tok
, line
, ppos
))
951 if ( ! rew_sub(MDOC_BLOCK
, m
, tok
, line
, ppos
))
956 * This routine accommodates implicitly- and explicitly-scoped
957 * macro openings. Implicit ones first close out prior scope
958 * (seen above). Delay opening the head until necessary to
959 * allow leading punctuation to print. Special consideration
960 * for `It -column', which has phrase-part syntax instead of
961 * regular child nodes.
964 for (arg
= NULL
;; ) {
966 av
= mdoc_argv(m
, line
, tok
, &arg
, pos
, buf
);
968 if (ARGV_WORD
== av
) {
982 if ( ! mdoc_block_alloc(m
, line
, ppos
, tok
, arg
))
988 * The `Nd' macro has all arguments in its body: it's a hybrid
989 * of block partial-explicit and full-implicit. Stupid.
992 if (MDOC_Nd
== tok
) {
993 if ( ! mdoc_head_alloc(m
, line
, ppos
, tok
))
996 if ( ! rew_sub(MDOC_HEAD
, m
, tok
, line
, ppos
))
998 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1007 /* Initialise last-phrase-type with ARGS_PEND. */
1008 lac
= ARGS_ERROR
== ac
? ARGS_PEND
: ac
;
1009 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
1011 if (ARGS_ERROR
== ac
)
1014 if (ARGS_EOLN
== ac
) {
1015 if (ARGS_PPHRASE
!= lac
&& ARGS_PHRASE
!= lac
)
1018 * This is necessary: if the last token on a
1019 * line is a `Ta' or tab, then we'll get
1020 * ARGS_EOLN, so we must be smart enough to
1021 * reopen our scope if the last parse was a
1022 * phrase or partial phrase.
1024 if ( ! rew_sub(MDOC_BODY
, m
, tok
, line
, ppos
))
1026 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1033 * Emit leading punctuation (i.e., punctuation before
1034 * the MDOC_HEAD) for non-phrase types.
1039 ARGS_PHRASE
!= ac
&&
1040 ARGS_PPHRASE
!= ac
&&
1042 DELIM_OPEN
== mdoc_isdelim(p
)) {
1043 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1048 /* Open a head if one hasn't been opened. */
1051 if ( ! mdoc_head_alloc(m
, line
, ppos
, tok
))
1056 if (ARGS_PHRASE
== ac
||
1058 ARGS_PPHRASE
== ac
) {
1060 * If we haven't opened a body yet, rewind the
1061 * head; if we have, rewind that instead.
1064 mtt
= body
? MDOC_BODY
: MDOC_HEAD
;
1065 if ( ! rew_sub(mtt
, m
, tok
, line
, ppos
))
1068 /* Then allocate our body context. */
1070 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1075 * Process phrases: set whether we're in a
1076 * partial-phrase (this affects line handling)
1077 * then call down into the phrase parser.
1080 if (ARGS_PPHRASE
== ac
)
1081 m
->flags
|= MDOC_PPHRASE
;
1082 if (ARGS_PEND
== ac
&& ARGS_PPHRASE
== lac
)
1083 m
->flags
|= MDOC_PPHRASE
;
1085 if ( ! phrase(m
, line
, la
, buf
))
1088 m
->flags
&= ~MDOC_PPHRASE
;
1092 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
1094 if (MDOC_MAX
== ntok
) {
1095 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1100 if ( ! mdoc_macro(m
, ntok
, line
, la
, pos
, buf
))
1106 if ( ! mdoc_head_alloc(m
, line
, ppos
, tok
))
1111 if (nl
&& ! append_delims(m
, line
, pos
, buf
))
1114 /* If we've already opened our body, exit now. */
1120 * If there is an open (i.e., unvalidated) sub-block requiring
1121 * explicit close-out, postpone switching the current block from
1122 * head to body until the rew_sub() call closing out that
1125 for (n
= m
->last
; n
&& n
!= head
; n
= n
->parent
) {
1126 if (MDOC_BLOCK
== n
->type
&&
1127 MDOC_EXPLICIT
& mdoc_macros
[n
->tok
].flags
&&
1128 ! (MDOC_VALID
& n
->flags
)) {
1129 assert( ! (MDOC_ACTED
& n
->flags
));
1135 /* Close out scopes to remain in a consistent state. */
1137 if ( ! rew_sub(MDOC_HEAD
, m
, tok
, line
, ppos
))
1139 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1143 if ( ! (MDOC_FREECOL
& m
->flags
))
1146 if ( ! rew_sub(MDOC_BODY
, m
, tok
, line
, ppos
))
1148 if ( ! rew_sub(MDOC_BLOCK
, m
, tok
, line
, ppos
))
1151 m
->flags
&= ~MDOC_FREECOL
;
1157 blk_part_imp(MACRO_PROT_ARGS
)
1163 struct mdoc_node
*blk
; /* saved block context */
1164 struct mdoc_node
*body
; /* saved body context */
1165 struct mdoc_node
*n
;
1167 nl
= MDOC_NEWLINE
& m
->flags
;
1170 * A macro that spans to the end of the line. This is generally
1171 * (but not necessarily) called as the first macro. The block
1172 * has a head as the immediate child, which is always empty,
1173 * followed by zero or more opening punctuation nodes, then the
1174 * body (which may be empty, depending on the macro), then zero
1175 * or more closing punctuation nodes.
1178 if ( ! mdoc_block_alloc(m
, line
, ppos
, tok
, NULL
))
1183 if ( ! mdoc_head_alloc(m
, line
, ppos
, tok
))
1185 if ( ! rew_sub(MDOC_HEAD
, m
, tok
, line
, ppos
))
1189 * Open the body scope "on-demand", that is, after we've
1190 * processed all of the leading delimiters (open parenthesis,
1194 for (body
= NULL
; ; ) {
1196 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
1198 if (ARGS_ERROR
== ac
)
1200 if (ARGS_EOLN
== ac
)
1202 if (ARGS_PUNCT
== ac
)
1205 if (NULL
== body
&& ARGS_QWORD
!= ac
&&
1206 DELIM_OPEN
== mdoc_isdelim(p
)) {
1207 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1213 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1218 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
1220 if (MDOC_MAX
== ntok
) {
1221 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1226 if ( ! mdoc_macro(m
, ntok
, line
, la
, pos
, buf
))
1231 /* Clean-ups to leave in a consistent state. */
1234 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1239 for (n
= body
->child
; n
&& n
->next
; n
= n
->next
)
1243 * End of sentence spacing: if the last node is a text node and
1244 * has a trailing period, then mark it as being end-of-sentence.
1247 if (n
&& MDOC_TEXT
== n
->type
&& n
->string
)
1248 if (mandoc_eos(n
->string
, strlen(n
->string
)))
1249 n
->flags
|= MDOC_EOS
;
1251 /* Up-propagate the end-of-sentence flag. */
1253 if (n
&& (MDOC_EOS
& n
->flags
)) {
1254 body
->flags
|= MDOC_EOS
;
1255 body
->parent
->flags
|= MDOC_EOS
;
1259 * If we can't rewind to our body, then our scope has already
1260 * been closed by another macro (like `Oc' closing `Op'). This
1261 * is ugly behaviour nodding its head to OpenBSD's overwhelmingly
1262 * crufty use of `Op' breakage.
1264 * FIXME - this should be ifdef'd OpenBSD?
1266 for (n
= m
->last
; n
; n
= n
->parent
)
1270 if (NULL
== n
&& ! mdoc_nmsg(m
, body
, MANDOCERR_SCOPE
))
1273 if (n
&& ! rew_last(m
, body
))
1276 /* Standard appending of delimiters. */
1278 if (nl
&& ! append_delims(m
, line
, pos
, buf
))
1281 /* Rewind scope, if applicable. */
1283 if (n
&& ! rew_last(m
, blk
))
1291 blk_part_exp(MACRO_PROT_ARGS
)
1295 struct mdoc_node
*head
; /* keep track of head */
1296 struct mdoc_node
*body
; /* keep track of body */
1300 nl
= MDOC_NEWLINE
& m
->flags
;
1303 * The opening of an explicit macro having zero or more leading
1304 * punctuation nodes; a head with optional single element (the
1305 * case of `Eo'); and a body that may be empty.
1308 if ( ! mdoc_block_alloc(m
, line
, ppos
, tok
, NULL
))
1311 for (head
= body
= NULL
; ; ) {
1313 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
1315 if (ARGS_ERROR
== ac
)
1317 if (ARGS_PUNCT
== ac
)
1319 if (ARGS_EOLN
== ac
)
1322 /* Flush out leading punctuation. */
1324 if (NULL
== head
&& ARGS_QWORD
!= ac
&&
1325 DELIM_OPEN
== mdoc_isdelim(p
)) {
1326 assert(NULL
== body
);
1327 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1333 assert(NULL
== body
);
1334 if ( ! mdoc_head_alloc(m
, line
, ppos
, tok
))
1340 * `Eo' gobbles any data into the head, but most other
1341 * macros just immediately close out and begin the body.
1346 /* No check whether it's a macro! */
1348 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1351 if ( ! rew_sub(MDOC_HEAD
, m
, tok
, line
, ppos
))
1353 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1361 assert(NULL
!= head
&& NULL
!= body
);
1363 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
1365 if (MDOC_MAX
== ntok
) {
1366 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1371 if ( ! mdoc_macro(m
, ntok
, line
, la
, pos
, buf
))
1376 /* Clean-up to leave in a consistent state. */
1379 if ( ! mdoc_head_alloc(m
, line
, ppos
, tok
))
1385 if ( ! rew_sub(MDOC_HEAD
, m
, tok
, line
, ppos
))
1387 if ( ! mdoc_body_alloc(m
, line
, ppos
, tok
))
1392 /* Standard appending of delimiters. */
1396 return(append_delims(m
, line
, pos
, buf
));
1402 in_line_argn(MACRO_PROT_ARGS
)
1404 int la
, flushed
, j
, maxargs
, nl
;
1407 struct mdoc_arg
*arg
;
1411 nl
= MDOC_NEWLINE
& m
->flags
;
1414 * A line macro that has a fixed number of arguments (maxargs).
1415 * Only open the scope once the first non-leading-punctuation is
1416 * found (unless MDOC_IGNDELIM is noted, like in `Pf'), then
1417 * keep it open until the maximum number of arguments are
1439 for (arg
= NULL
; ; ) {
1441 av
= mdoc_argv(m
, line
, tok
, &arg
, pos
, buf
);
1443 if (ARGV_WORD
== av
) {
1448 if (ARGV_EOLN
== av
)
1453 mdoc_argv_free(arg
);
1457 for (flushed
= j
= 0; ; ) {
1459 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
1461 if (ARGS_ERROR
== ac
)
1463 if (ARGS_PUNCT
== ac
)
1465 if (ARGS_EOLN
== ac
)
1468 if ( ! (MDOC_IGNDELIM
& mdoc_macros
[tok
].flags
) &&
1470 0 == j
&& DELIM_OPEN
== mdoc_isdelim(p
)) {
1471 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1475 if ( ! mdoc_elem_alloc(m
, line
, la
, tok
, arg
))
1478 if (j
== maxargs
&& ! flushed
) {
1479 if ( ! rew_elem(m
, tok
))
1484 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
1486 if (MDOC_MAX
!= ntok
) {
1487 if ( ! flushed
&& ! rew_elem(m
, tok
))
1490 if ( ! mdoc_macro(m
, ntok
, line
, la
, pos
, buf
))
1496 if ( ! (MDOC_IGNDELIM
& mdoc_macros
[tok
].flags
) &&
1499 DELIM_NONE
!= mdoc_isdelim(p
)) {
1500 if ( ! rew_elem(m
, tok
))
1506 * XXX: this is a hack to work around groff's ugliness
1507 * as regards `Xr' and extraneous arguments. It should
1508 * ideally be deprecated behaviour, but because this
1509 * code is now here, it's unlikely to be removed.
1513 if (MDOC_Xr
== tok
&& j
== maxargs
) {
1514 if ( ! mdoc_elem_alloc(m
, line
, la
, MDOC_Ns
, NULL
))
1516 if ( ! rew_elem(m
, MDOC_Ns
))
1521 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1526 if (0 == j
&& ! mdoc_elem_alloc(m
, line
, la
, tok
, arg
))
1529 /* Close out in a consistent state. */
1531 if ( ! flushed
&& ! rew_elem(m
, tok
))
1535 return(append_delims(m
, line
, pos
, buf
));
1540 in_line_eoln(MACRO_PROT_ARGS
)
1545 struct mdoc_arg
*arg
;
1549 assert( ! (MDOC_PARSED
& mdoc_macros
[tok
].flags
));
1551 /* Parse macro arguments. */
1553 for (arg
= NULL
; ; ) {
1555 av
= mdoc_argv(m
, line
, tok
, &arg
, pos
, buf
);
1557 if (ARGV_WORD
== av
) {
1561 if (ARGV_EOLN
== av
)
1566 mdoc_argv_free(arg
);
1570 /* Open element scope. */
1572 if ( ! mdoc_elem_alloc(m
, line
, ppos
, tok
, arg
))
1575 /* Parse argument terms. */
1579 ac
= mdoc_args(m
, line
, pos
, buf
, tok
, &p
);
1581 if (ARGS_ERROR
== ac
)
1583 if (ARGS_EOLN
== ac
)
1586 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup(tok
, p
);
1588 if (MDOC_MAX
== ntok
) {
1589 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1594 if ( ! rew_elem(m
, tok
))
1596 return(mdoc_macro(m
, ntok
, line
, la
, pos
, buf
));
1599 /* Close out (no delimiters). */
1601 return(rew_elem(m
, tok
));
1607 ctx_synopsis(MACRO_PROT_ARGS
)
1611 nl
= MDOC_NEWLINE
& m
->flags
;
1613 /* If we're not in the SYNOPSIS, go straight to in-line. */
1614 if (SEC_SYNOPSIS
!= m
->lastsec
)
1615 return(in_line(m
, tok
, line
, ppos
, pos
, buf
));
1617 /* If we're a nested call, same place. */
1619 return(in_line(m
, tok
, line
, ppos
, pos
, buf
));
1622 * XXX: this will open a block scope; however, if later we end
1623 * up formatting the block scope, then child nodes will inherit
1624 * the formatting. Be careful.
1627 return(blk_part_imp(m
, tok
, line
, ppos
, pos
, buf
));
1633 obsolete(MACRO_PROT_ARGS
)
1636 return(mdoc_pmsg(m
, line
, ppos
, MANDOCERR_MACROOBS
));
1641 * Phrases occur within `Bl -column' entries, separated by `Ta' or tabs.
1642 * They're unusual because they're basically free-form text until a
1643 * macro is encountered.
1646 phrase(struct mdoc
*m
, int line
, int ppos
, char *buf
)
1653 for (pos
= ppos
; ; ) {
1656 ac
= mdoc_zargs(m
, line
, &pos
, buf
, 0, &p
);
1658 if (ARGS_ERROR
== ac
)
1660 if (ARGS_EOLN
== ac
)
1663 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup_raw(p
);
1665 if (MDOC_MAX
== ntok
) {
1666 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1671 if ( ! mdoc_macro(m
, ntok
, line
, la
, &pos
, buf
))
1673 return(append_delims(m
, line
, &pos
, buf
));
1682 phrase_ta(MACRO_PROT_ARGS
)
1690 * FIXME: this is overly restrictive: if the `Ta' is unexpected,
1691 * it should simply error out with ARGSLOST.
1694 if ( ! rew_sub(MDOC_BODY
, m
, MDOC_It
, line
, ppos
))
1696 if ( ! mdoc_body_alloc(m
, line
, ppos
, MDOC_It
))
1701 ac
= mdoc_zargs(m
, line
, pos
, buf
, 0, &p
);
1703 if (ARGS_ERROR
== ac
)
1705 if (ARGS_EOLN
== ac
)
1708 ntok
= ARGS_QWORD
== ac
? MDOC_MAX
: lookup_raw(p
);
1710 if (MDOC_MAX
== ntok
) {
1711 if ( ! mdoc_word_alloc(m
, line
, la
, p
))
1716 if ( ! mdoc_macro(m
, ntok
, line
, la
, pos
, buf
))
1718 return(append_delims(m
, line
, pos
, buf
));