]>
git.cameronkatri.com Git - mandoc.git/blob - mdoc_validate.c
1 /* $Id: mdoc_validate.c,v 1.223 2014/07/02 20:19:11 schwarze Exp $ */
3 * Copyright (c) 2008-2012 Kristaps Dzonsons <kristaps@bsd.lv>
4 * Copyright (c) 2010-2014 Ingo Schwarze <schwarze@openbsd.org>
5 * Copyright (c) 2010 Joerg Sonnenberger <joerg@netbsd.org>
7 * Permission to use, copy, modify, and distribute this software for any
8 * purpose with or without fee is hereby granted, provided that the above
9 * copyright notice and this permission notice appear in all copies.
11 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
12 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
13 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
14 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
15 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
16 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
17 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
24 #include <sys/utsname.h>
27 #include <sys/types.h>
39 #include "mandoc_aux.h"
41 #include "libmandoc.h"
43 /* FIXME: .Bl -diag can't have non-text children in HEAD. */
45 #define PRE_ARGS struct mdoc *mdoc, struct mdoc_node *n
46 #define POST_ARGS struct mdoc *mdoc
59 typedef int (*v_pre
)(PRE_ARGS
);
60 typedef int (*v_post
)(POST_ARGS
);
67 static int check_count(struct mdoc
*, enum mdoc_type
,
68 enum check_lvl
, enum check_ineq
, int);
69 static int check_parent(PRE_ARGS
, enum mdoct
, enum mdoc_type
);
70 static void check_text(struct mdoc
*, int, int, char *);
71 static void check_argv(struct mdoc
*,
72 struct mdoc_node
*, struct mdoc_argv
*);
73 static void check_args(struct mdoc
*, struct mdoc_node
*);
74 static enum mdoc_sec
a2sec(const char *);
75 static size_t macro2len(enum mdoct
);
77 static int ebool(POST_ARGS
);
78 static int berr_ge1(POST_ARGS
);
79 static int bwarn_ge1(POST_ARGS
);
80 static int ewarn_eq0(POST_ARGS
);
81 static int ewarn_eq1(POST_ARGS
);
82 static int ewarn_ge1(POST_ARGS
);
83 static int ewarn_le1(POST_ARGS
);
84 static int hwarn_eq0(POST_ARGS
);
85 static int hwarn_eq1(POST_ARGS
);
86 static int hwarn_ge1(POST_ARGS
);
87 static int hwarn_le1(POST_ARGS
);
89 static int post_an(POST_ARGS
);
90 static int post_at(POST_ARGS
);
91 static int post_bf(POST_ARGS
);
92 static int post_bl(POST_ARGS
);
93 static int post_bl_block(POST_ARGS
);
94 static int post_bl_block_width(POST_ARGS
);
95 static int post_bl_block_tag(POST_ARGS
);
96 static int post_bl_head(POST_ARGS
);
97 static int post_bx(POST_ARGS
);
98 static int post_defaults(POST_ARGS
);
99 static int post_dd(POST_ARGS
);
100 static int post_dt(POST_ARGS
);
101 static int post_en(POST_ARGS
);
102 static int post_es(POST_ARGS
);
103 static int post_eoln(POST_ARGS
);
104 static int post_hyph(POST_ARGS
);
105 static int post_ignpar(POST_ARGS
);
106 static int post_it(POST_ARGS
);
107 static int post_lb(POST_ARGS
);
108 static int post_literal(POST_ARGS
);
109 static int post_nm(POST_ARGS
);
110 static int post_ns(POST_ARGS
);
111 static int post_os(POST_ARGS
);
112 static int post_par(POST_ARGS
);
113 static int post_prol(POST_ARGS
);
114 static int post_root(POST_ARGS
);
115 static int post_rs(POST_ARGS
);
116 static int post_sh(POST_ARGS
);
117 static int post_sh_body(POST_ARGS
);
118 static int post_sh_head(POST_ARGS
);
119 static int post_st(POST_ARGS
);
120 static int post_std(POST_ARGS
);
121 static int post_vt(POST_ARGS
);
122 static int pre_an(PRE_ARGS
);
123 static int pre_bd(PRE_ARGS
);
124 static int pre_bl(PRE_ARGS
);
125 static int pre_dd(PRE_ARGS
);
126 static int pre_display(PRE_ARGS
);
127 static int pre_dt(PRE_ARGS
);
128 static int pre_it(PRE_ARGS
);
129 static int pre_literal(PRE_ARGS
);
130 static int pre_obsolete(PRE_ARGS
);
131 static int pre_os(PRE_ARGS
);
132 static int pre_par(PRE_ARGS
);
133 static int pre_sh(PRE_ARGS
);
134 static int pre_ss(PRE_ARGS
);
135 static int pre_std(PRE_ARGS
);
137 static v_post posts_an
[] = { post_an
, NULL
};
138 static v_post posts_at
[] = { post_at
, post_defaults
, NULL
};
139 static v_post posts_bd
[] = { post_literal
, hwarn_eq0
, bwarn_ge1
, NULL
};
140 static v_post posts_bf
[] = { hwarn_le1
, post_bf
, NULL
};
141 static v_post posts_bk
[] = { hwarn_eq0
, bwarn_ge1
, NULL
};
142 static v_post posts_bl
[] = { bwarn_ge1
, post_bl
, NULL
};
143 static v_post posts_bx
[] = { post_bx
, NULL
};
144 static v_post posts_bool
[] = { ebool
, NULL
};
145 static v_post posts_eoln
[] = { post_eoln
, NULL
};
146 static v_post posts_defaults
[] = { post_defaults
, NULL
};
147 static v_post posts_d1
[] = { bwarn_ge1
, post_hyph
, NULL
};
148 static v_post posts_dd
[] = { post_dd
, post_prol
, NULL
};
149 static v_post posts_dl
[] = { post_literal
, bwarn_ge1
, NULL
};
150 static v_post posts_dt
[] = { post_dt
, post_prol
, NULL
};
151 static v_post posts_en
[] = { post_en
, NULL
};
152 static v_post posts_es
[] = { post_es
, NULL
};
153 static v_post posts_fo
[] = { hwarn_eq1
, bwarn_ge1
, NULL
};
154 static v_post posts_hyph
[] = { post_hyph
, NULL
};
155 static v_post posts_hyphtext
[] = { ewarn_ge1
, post_hyph
, NULL
};
156 static v_post posts_it
[] = { post_it
, NULL
};
157 static v_post posts_lb
[] = { post_lb
, NULL
};
158 static v_post posts_nd
[] = { berr_ge1
, post_hyph
, NULL
};
159 static v_post posts_nm
[] = { post_nm
, NULL
};
160 static v_post posts_notext
[] = { ewarn_eq0
, NULL
};
161 static v_post posts_ns
[] = { post_ns
, NULL
};
162 static v_post posts_os
[] = { post_os
, post_prol
, NULL
};
163 static v_post posts_pp
[] = { post_par
, ewarn_eq0
, NULL
};
164 static v_post posts_rs
[] = { post_rs
, NULL
};
165 static v_post posts_sh
[] = { post_ignpar
,hwarn_ge1
,post_sh
,post_hyph
,NULL
};
166 static v_post posts_sp
[] = { post_par
, ewarn_le1
, NULL
};
167 static v_post posts_ss
[] = { post_ignpar
, hwarn_ge1
, post_hyph
, NULL
};
168 static v_post posts_st
[] = { post_st
, NULL
};
169 static v_post posts_std
[] = { post_std
, NULL
};
170 static v_post posts_text
[] = { ewarn_ge1
, NULL
};
171 static v_post posts_text1
[] = { ewarn_eq1
, NULL
};
172 static v_post posts_vt
[] = { post_vt
, NULL
};
173 static v_pre pres_an
[] = { pre_an
, NULL
};
174 static v_pre pres_bd
[] = { pre_display
, pre_bd
, pre_literal
, pre_par
, NULL
};
175 static v_pre pres_bl
[] = { pre_bl
, pre_par
, NULL
};
176 static v_pre pres_d1
[] = { pre_display
, NULL
};
177 static v_pre pres_dl
[] = { pre_literal
, pre_display
, NULL
};
178 static v_pre pres_dd
[] = { pre_dd
, NULL
};
179 static v_pre pres_dt
[] = { pre_dt
, NULL
};
180 static v_pre pres_it
[] = { pre_it
, pre_par
, NULL
};
181 static v_pre pres_obsolete
[] = { pre_obsolete
, NULL
};
182 static v_pre pres_os
[] = { pre_os
, NULL
};
183 static v_pre pres_pp
[] = { pre_par
, NULL
};
184 static v_pre pres_sh
[] = { pre_sh
, NULL
};
185 static v_pre pres_ss
[] = { pre_ss
, NULL
};
186 static v_pre pres_std
[] = { pre_std
, NULL
};
188 static const struct valids mdoc_valids
[MDOC_MAX
] = {
189 { NULL
, NULL
}, /* Ap */
190 { pres_dd
, posts_dd
}, /* Dd */
191 { pres_dt
, posts_dt
}, /* Dt */
192 { pres_os
, posts_os
}, /* Os */
193 { pres_sh
, posts_sh
}, /* Sh */
194 { pres_ss
, posts_ss
}, /* Ss */
195 { pres_pp
, posts_pp
}, /* Pp */
196 { pres_d1
, posts_d1
}, /* D1 */
197 { pres_dl
, posts_dl
}, /* Dl */
198 { pres_bd
, posts_bd
}, /* Bd */
199 { NULL
, NULL
}, /* Ed */
200 { pres_bl
, posts_bl
}, /* Bl */
201 { NULL
, NULL
}, /* El */
202 { pres_it
, posts_it
}, /* It */
203 { NULL
, NULL
}, /* Ad */
204 { pres_an
, posts_an
}, /* An */
205 { NULL
, posts_defaults
}, /* Ar */
206 { NULL
, NULL
}, /* Cd */
207 { NULL
, NULL
}, /* Cm */
208 { NULL
, NULL
}, /* Dv */
209 { NULL
, NULL
}, /* Er */
210 { NULL
, NULL
}, /* Ev */
211 { pres_std
, posts_std
}, /* Ex */
212 { NULL
, NULL
}, /* Fa */
213 { NULL
, posts_text
}, /* Fd */
214 { NULL
, NULL
}, /* Fl */
215 { NULL
, NULL
}, /* Fn */
216 { NULL
, NULL
}, /* Ft */
217 { NULL
, NULL
}, /* Ic */
218 { NULL
, posts_text1
}, /* In */
219 { NULL
, posts_defaults
}, /* Li */
220 { NULL
, posts_nd
}, /* Nd */
221 { NULL
, posts_nm
}, /* Nm */
222 { NULL
, NULL
}, /* Op */
223 { pres_obsolete
, NULL
}, /* Ot */
224 { NULL
, posts_defaults
}, /* Pa */
225 { pres_std
, posts_std
}, /* Rv */
226 { NULL
, posts_st
}, /* St */
227 { NULL
, NULL
}, /* Va */
228 { NULL
, posts_vt
}, /* Vt */
229 { NULL
, posts_text
}, /* Xr */
230 { NULL
, posts_text
}, /* %A */
231 { NULL
, posts_hyphtext
}, /* %B */ /* FIXME: can be used outside Rs/Re. */
232 { NULL
, posts_text
}, /* %D */
233 { NULL
, posts_text
}, /* %I */
234 { NULL
, posts_text
}, /* %J */
235 { NULL
, posts_hyphtext
}, /* %N */
236 { NULL
, posts_hyphtext
}, /* %O */
237 { NULL
, posts_text
}, /* %P */
238 { NULL
, posts_hyphtext
}, /* %R */
239 { NULL
, posts_hyphtext
}, /* %T */ /* FIXME: can be used outside Rs/Re. */
240 { NULL
, posts_text
}, /* %V */
241 { NULL
, NULL
}, /* Ac */
242 { NULL
, NULL
}, /* Ao */
243 { NULL
, NULL
}, /* Aq */
244 { NULL
, posts_at
}, /* At */
245 { NULL
, NULL
}, /* Bc */
246 { NULL
, posts_bf
}, /* Bf */
247 { NULL
, NULL
}, /* Bo */
248 { NULL
, NULL
}, /* Bq */
249 { NULL
, NULL
}, /* Bsx */
250 { NULL
, posts_bx
}, /* Bx */
251 { NULL
, posts_bool
}, /* Db */
252 { NULL
, NULL
}, /* Dc */
253 { NULL
, NULL
}, /* Do */
254 { NULL
, NULL
}, /* Dq */
255 { NULL
, NULL
}, /* Ec */
256 { NULL
, NULL
}, /* Ef */
257 { NULL
, NULL
}, /* Em */
258 { NULL
, NULL
}, /* Eo */
259 { NULL
, NULL
}, /* Fx */
260 { NULL
, NULL
}, /* Ms */
261 { NULL
, posts_notext
}, /* No */
262 { NULL
, posts_ns
}, /* Ns */
263 { NULL
, NULL
}, /* Nx */
264 { NULL
, NULL
}, /* Ox */
265 { NULL
, NULL
}, /* Pc */
266 { NULL
, posts_text1
}, /* Pf */
267 { NULL
, NULL
}, /* Po */
268 { NULL
, NULL
}, /* Pq */
269 { NULL
, NULL
}, /* Qc */
270 { NULL
, NULL
}, /* Ql */
271 { NULL
, NULL
}, /* Qo */
272 { NULL
, NULL
}, /* Qq */
273 { NULL
, NULL
}, /* Re */
274 { NULL
, posts_rs
}, /* Rs */
275 { NULL
, NULL
}, /* Sc */
276 { NULL
, NULL
}, /* So */
277 { NULL
, NULL
}, /* Sq */
278 { NULL
, posts_bool
}, /* Sm */
279 { NULL
, posts_hyph
}, /* Sx */
280 { NULL
, NULL
}, /* Sy */
281 { NULL
, NULL
}, /* Tn */
282 { NULL
, NULL
}, /* Ux */
283 { NULL
, NULL
}, /* Xc */
284 { NULL
, NULL
}, /* Xo */
285 { NULL
, posts_fo
}, /* Fo */
286 { NULL
, NULL
}, /* Fc */
287 { NULL
, NULL
}, /* Oo */
288 { NULL
, NULL
}, /* Oc */
289 { NULL
, posts_bk
}, /* Bk */
290 { NULL
, NULL
}, /* Ek */
291 { NULL
, posts_eoln
}, /* Bt */
292 { NULL
, NULL
}, /* Hf */
293 { pres_obsolete
, NULL
}, /* Fr */
294 { NULL
, posts_eoln
}, /* Ud */
295 { NULL
, posts_lb
}, /* Lb */
296 { pres_pp
, posts_pp
}, /* Lp */
297 { NULL
, NULL
}, /* Lk */
298 { NULL
, posts_defaults
}, /* Mt */
299 { NULL
, NULL
}, /* Brq */
300 { NULL
, NULL
}, /* Bro */
301 { NULL
, NULL
}, /* Brc */
302 { NULL
, posts_text
}, /* %C */
303 { pres_obsolete
, posts_es
}, /* Es */
304 { pres_obsolete
, posts_en
}, /* En */
305 { NULL
, NULL
}, /* Dx */
306 { NULL
, posts_text
}, /* %Q */
307 { NULL
, posts_pp
}, /* br */
308 { NULL
, posts_sp
}, /* sp */
309 { NULL
, posts_text1
}, /* %U */
310 { NULL
, NULL
}, /* Ta */
311 { NULL
, NULL
}, /* ll */
314 #define RSORD_MAX 14 /* Number of `Rs' blocks. */
316 static const enum mdoct rsord
[RSORD_MAX
] = {
333 static const char * const secnames
[SEC__MAX
] = {
340 "IMPLEMENTATION NOTES",
355 "SECURITY CONSIDERATIONS",
361 mdoc_valid_pre(struct mdoc
*mdoc
, struct mdoc_node
*n
)
372 check_text(mdoc
, line
, pos
, tp
);
386 if (NULL
== mdoc_valids
[n
->tok
].pre
)
388 for (p
= mdoc_valids
[n
->tok
].pre
; *p
; p
++)
389 if ( ! (*p
)(mdoc
, n
))
395 mdoc_valid_post(struct mdoc
*mdoc
)
399 if (MDOC_VALID
& mdoc
->last
->flags
)
401 mdoc
->last
->flags
|= MDOC_VALID
;
403 switch (mdoc
->last
->type
) {
411 return(post_root(mdoc
));
416 if (NULL
== mdoc_valids
[mdoc
->last
->tok
].post
)
418 for (p
= mdoc_valids
[mdoc
->last
->tok
].post
; *p
; p
++)
426 check_count(struct mdoc
*mdoc
, enum mdoc_type type
,
427 enum check_lvl lvl
, enum check_ineq ineq
, int val
)
432 if (mdoc
->last
->type
!= type
)
438 if (mdoc
->last
->nchild
< val
)
443 if (mdoc
->last
->nchild
> val
)
448 if (val
== mdoc
->last
->nchild
)
456 t
= lvl
== CHECK_WARN
? MANDOCERR_ARGCWARN
: MANDOCERR_ARGCOUNT
;
457 mandoc_vmsg(t
, mdoc
->parse
, mdoc
->last
->line
,
458 mdoc
->last
->pos
, "want %s%d children (have %d)",
459 p
, val
, mdoc
->last
->nchild
);
467 return(check_count(mdoc
, MDOC_BODY
, CHECK_ERROR
, CHECK_GT
, 0));
473 return(check_count(mdoc
, MDOC_BODY
, CHECK_WARN
, CHECK_GT
, 0));
479 return(check_count(mdoc
, MDOC_ELEM
, CHECK_WARN
, CHECK_EQ
, 0));
485 return(check_count(mdoc
, MDOC_ELEM
, CHECK_WARN
, CHECK_EQ
, 1));
491 return(check_count(mdoc
, MDOC_ELEM
, CHECK_WARN
, CHECK_GT
, 0));
497 return(check_count(mdoc
, MDOC_ELEM
, CHECK_WARN
, CHECK_LT
, 2));
503 return(check_count(mdoc
, MDOC_HEAD
, CHECK_WARN
, CHECK_EQ
, 0));
509 return(check_count(mdoc
, MDOC_HEAD
, CHECK_WARN
, CHECK_EQ
, 1));
515 return(check_count(mdoc
, MDOC_HEAD
, CHECK_WARN
, CHECK_GT
, 0));
521 return(check_count(mdoc
, MDOC_HEAD
, CHECK_WARN
, CHECK_LT
, 2));
525 check_args(struct mdoc
*mdoc
, struct mdoc_node
*n
)
532 assert(n
->args
->argc
);
533 for (i
= 0; i
< (int)n
->args
->argc
; i
++)
534 check_argv(mdoc
, n
, &n
->args
->argv
[i
]);
538 check_argv(struct mdoc
*mdoc
, struct mdoc_node
*n
, struct mdoc_argv
*v
)
542 for (i
= 0; i
< (int)v
->sz
; i
++)
543 check_text(mdoc
, v
->line
, v
->pos
, v
->value
[i
]);
545 /* FIXME: move to post_std(). */
547 if (MDOC_Std
== v
->arg
)
548 if ( ! (v
->sz
|| mdoc
->meta
.name
))
549 mdoc_nmsg(mdoc
, n
, MANDOCERR_NONAME
);
553 check_text(struct mdoc
*mdoc
, int ln
, int pos
, char *p
)
557 if (MDOC_LITERAL
& mdoc
->flags
)
560 for (cp
= p
; NULL
!= (p
= strchr(p
, '\t')); p
++)
561 mdoc_pmsg(mdoc
, ln
, pos
+ (int)(p
- cp
), MANDOCERR_BADTAB
);
565 check_parent(PRE_ARGS
, enum mdoct tok
, enum mdoc_type t
)
569 if ((MDOC_ROOT
== t
|| tok
== n
->parent
->tok
) &&
570 (t
== n
->parent
->type
))
573 mandoc_vmsg(MANDOCERR_SYNTCHILD
, mdoc
->parse
,
574 n
->line
, n
->pos
, "want parent %s",
575 MDOC_ROOT
== t
? "<root>" : mdoc_macronames
[tok
]);
581 pre_display(PRE_ARGS
)
583 struct mdoc_node
*node
;
585 if (MDOC_BLOCK
!= n
->type
)
588 for (node
= mdoc
->last
->parent
; node
; node
= node
->parent
)
589 if (MDOC_BLOCK
== node
->type
)
590 if (MDOC_Bd
== node
->tok
)
594 mandoc_vmsg(MANDOCERR_BD_NEST
,
595 mdoc
->parse
, n
->line
, n
->pos
,
596 "%s in Bd", mdoc_macronames
[n
->tok
]);
605 const char *offs
, *width
;
607 struct mdoc_node
*np
;
609 if (MDOC_BLOCK
!= n
->type
) {
610 if (ENDBODY_NOT
!= n
->end
) {
612 np
= n
->pending
->parent
;
617 assert(MDOC_BLOCK
== np
->type
);
618 assert(MDOC_Bl
== np
->tok
);
623 * First figure out which kind of list to use: bind ourselves to
624 * the first mentioned list type and warn about any remaining
625 * ones. If we find no list type, we default to LIST_item.
628 for (i
= 0; n
->args
&& i
< (int)n
->args
->argc
; i
++) {
632 switch (n
->args
->argv
[i
].arg
) {
633 /* Set list types. */
667 /* Set list arguments. */
669 dup
= n
->norm
->Bl
.comp
;
673 /* NB: this can be empty! */
674 if (n
->args
->argv
[i
].sz
) {
675 width
= n
->args
->argv
[i
].value
[0];
676 dup
= (NULL
!= n
->norm
->Bl
.width
);
679 mdoc_nmsg(mdoc
, n
, MANDOCERR_IGNARGV
);
682 /* NB: this can be empty! */
683 if (n
->args
->argv
[i
].sz
) {
684 offs
= n
->args
->argv
[i
].value
[0];
685 dup
= (NULL
!= n
->norm
->Bl
.offs
);
688 mdoc_nmsg(mdoc
, n
, MANDOCERR_IGNARGV
);
694 /* Check: duplicate auxiliary arguments. */
697 mdoc_nmsg(mdoc
, n
, MANDOCERR_ARGVREP
);
700 n
->norm
->Bl
.comp
= comp
;
702 n
->norm
->Bl
.offs
= offs
;
704 n
->norm
->Bl
.width
= width
;
706 /* Check: multiple list types. */
708 if (LIST__NONE
!= lt
&& n
->norm
->Bl
.type
!= LIST__NONE
)
709 mdoc_nmsg(mdoc
, n
, MANDOCERR_LISTREP
);
711 /* Assign list type. */
713 if (LIST__NONE
!= lt
&& n
->norm
->Bl
.type
== LIST__NONE
) {
714 n
->norm
->Bl
.type
= lt
;
715 /* Set column information, too. */
716 if (LIST_column
== lt
) {
719 n
->norm
->Bl
.cols
= (void *)
720 n
->args
->argv
[i
].value
;
724 /* The list type should come first. */
726 if (n
->norm
->Bl
.type
== LIST__NONE
)
727 if (n
->norm
->Bl
.width
||
730 mdoc_nmsg(mdoc
, n
, MANDOCERR_LISTFIRST
);
735 /* Allow lists to default to LIST_item. */
737 if (LIST__NONE
== n
->norm
->Bl
.type
) {
738 mdoc_nmsg(mdoc
, n
, MANDOCERR_LISTTYPE
);
739 n
->norm
->Bl
.type
= LIST_item
;
743 * Validate the width field. Some list types don't need width
744 * types and should be warned about them. Others should have it
745 * and must also be warned. Yet others have a default and need
749 switch (n
->norm
->Bl
.type
) {
751 if (NULL
== n
->norm
->Bl
.width
)
752 mdoc_nmsg(mdoc
, n
, MANDOCERR_NOWIDTHARG
);
763 if (n
->norm
->Bl
.width
)
764 mdoc_nmsg(mdoc
, n
, MANDOCERR_IGNARGV
);
771 if (NULL
== n
->norm
->Bl
.width
)
772 n
->norm
->Bl
.width
= "2n";
775 if (NULL
== n
->norm
->Bl
.width
)
776 n
->norm
->Bl
.width
= "3n";
791 struct mdoc_node
*np
;
793 if (MDOC_BLOCK
!= n
->type
) {
794 if (ENDBODY_NOT
!= n
->end
) {
796 np
= n
->pending
->parent
;
801 assert(MDOC_BLOCK
== np
->type
);
802 assert(MDOC_Bd
== np
->tok
);
806 for (i
= 0; n
->args
&& i
< (int)n
->args
->argc
; i
++) {
811 switch (n
->args
->argv
[i
].arg
) {
828 mdoc_nmsg(mdoc
, n
, MANDOCERR_BADDISP
);
831 /* NB: this can be empty! */
832 if (n
->args
->argv
[i
].sz
) {
833 offs
= n
->args
->argv
[i
].value
[0];
834 dup
= (NULL
!= n
->norm
->Bd
.offs
);
837 mdoc_nmsg(mdoc
, n
, MANDOCERR_IGNARGV
);
841 dup
= n
->norm
->Bd
.comp
;
848 /* Check whether we have duplicates. */
851 mdoc_nmsg(mdoc
, n
, MANDOCERR_ARGVREP
);
853 /* Make our auxiliary assignments. */
856 n
->norm
->Bd
.offs
= offs
;
858 n
->norm
->Bd
.comp
= comp
;
860 /* Check whether a type has already been assigned. */
862 if (DISP__NONE
!= dt
&& n
->norm
->Bd
.type
!= DISP__NONE
)
863 mdoc_nmsg(mdoc
, n
, MANDOCERR_DISPREP
);
865 /* Make our type assignment. */
867 if (DISP__NONE
!= dt
&& n
->norm
->Bd
.type
== DISP__NONE
)
868 n
->norm
->Bd
.type
= dt
;
871 if (DISP__NONE
== n
->norm
->Bd
.type
) {
872 mdoc_nmsg(mdoc
, n
, MANDOCERR_DISPTYPE
);
873 n
->norm
->Bd
.type
= DISP_ragged
;
883 if (MDOC_BLOCK
!= n
->type
)
885 return(check_parent(mdoc
, n
, MDOC_Sh
, MDOC_BODY
));
892 if (MDOC_BLOCK
!= n
->type
)
894 return(check_parent(mdoc
, n
, MDOC_MAX
, MDOC_ROOT
));
901 if (MDOC_BLOCK
!= n
->type
)
904 return(check_parent(mdoc
, n
, MDOC_Bl
, MDOC_BODY
));
915 for (i
= 1; i
< (int)n
->args
->argc
; i
++)
916 mdoc_pmsg(mdoc
, n
->args
->argv
[i
].line
,
917 n
->args
->argv
[i
].pos
, MANDOCERR_IGNARGV
);
919 if (MDOC_Split
== n
->args
->argv
[0].arg
)
920 n
->norm
->An
.auth
= AUTH_split
;
921 else if (MDOC_Nosplit
== n
->args
->argv
[0].arg
)
922 n
->norm
->An
.auth
= AUTH_nosplit
;
933 if (n
->args
&& 1 == n
->args
->argc
)
934 if (MDOC_Std
== n
->args
->argv
[0].arg
)
937 mdoc_nmsg(mdoc
, n
, MANDOCERR_NOARGV
);
942 pre_obsolete(PRE_ARGS
)
945 if (MDOC_ELEM
== n
->type
|| MDOC_BLOCK
== n
->type
)
946 mandoc_msg(MANDOCERR_MACRO_OBS
, mdoc
->parse
,
947 n
->line
, n
->pos
, mdoc_macronames
[n
->tok
]);
955 if (NULL
== mdoc
->meta
.date
|| mdoc
->meta
.os
)
956 mandoc_msg(MANDOCERR_PROLOG_ORDER
, mdoc
->parse
,
957 n
->line
, n
->pos
, "Dt");
959 if (mdoc
->meta
.title
)
960 mandoc_msg(MANDOCERR_PROLOG_REP
, mdoc
->parse
,
961 n
->line
, n
->pos
, "Dt");
970 if (NULL
== mdoc
->meta
.title
|| NULL
== mdoc
->meta
.date
)
971 mandoc_msg(MANDOCERR_PROLOG_ORDER
, mdoc
->parse
,
972 n
->line
, n
->pos
, "Os");
975 mandoc_msg(MANDOCERR_PROLOG_REP
, mdoc
->parse
,
976 n
->line
, n
->pos
, "Os");
985 if (mdoc
->meta
.title
|| mdoc
->meta
.os
)
986 mandoc_msg(MANDOCERR_PROLOG_ORDER
, mdoc
->parse
,
987 n
->line
, n
->pos
, "Dd");
990 mandoc_msg(MANDOCERR_PROLOG_REP
, mdoc
->parse
,
991 n
->line
, n
->pos
, "Dd");
999 struct mdoc_node
*np
;
1003 * Unlike other data pointers, these are "housed" by the HEAD
1004 * element, which contains the goods.
1007 if (MDOC_HEAD
!= mdoc
->last
->type
) {
1008 if (ENDBODY_NOT
!= mdoc
->last
->end
) {
1009 assert(mdoc
->last
->pending
);
1010 np
= mdoc
->last
->pending
->parent
->head
;
1011 } else if (MDOC_BLOCK
!= mdoc
->last
->type
) {
1012 np
= mdoc
->last
->parent
->head
;
1014 np
= mdoc
->last
->head
;
1017 assert(MDOC_HEAD
== np
->type
);
1018 assert(MDOC_Bf
== np
->tok
);
1023 assert(MDOC_BLOCK
== np
->parent
->type
);
1024 assert(MDOC_Bf
== np
->parent
->tok
);
1027 * Cannot have both argument and parameter.
1028 * If neither is specified, let it through with a warning.
1031 if (np
->parent
->args
&& np
->child
) {
1032 mdoc_nmsg(mdoc
, np
, MANDOCERR_SYNTARGVCOUNT
);
1034 } else if (NULL
== np
->parent
->args
&& NULL
== np
->child
) {
1035 mdoc_nmsg(mdoc
, np
, MANDOCERR_FONTTYPE
);
1039 /* Extract argument into data. */
1041 if (np
->parent
->args
) {
1042 arg
= np
->parent
->args
->argv
[0].arg
;
1043 if (MDOC_Emphasis
== arg
)
1044 np
->norm
->Bf
.font
= FONT_Em
;
1045 else if (MDOC_Literal
== arg
)
1046 np
->norm
->Bf
.font
= FONT_Li
;
1047 else if (MDOC_Symbolic
== arg
)
1048 np
->norm
->Bf
.font
= FONT_Sy
;
1054 /* Extract parameter into data. */
1056 if (0 == strcmp(np
->child
->string
, "Em"))
1057 np
->norm
->Bf
.font
= FONT_Em
;
1058 else if (0 == strcmp(np
->child
->string
, "Li"))
1059 np
->norm
->Bf
.font
= FONT_Li
;
1060 else if (0 == strcmp(np
->child
->string
, "Sy"))
1061 np
->norm
->Bf
.font
= FONT_Sy
;
1063 mdoc_nmsg(mdoc
, np
, MANDOCERR_FONTTYPE
);
1071 struct mdoc_node
*n
;
1072 const char *stdlibname
;
1075 check_count(mdoc
, MDOC_ELEM
, CHECK_WARN
, CHECK_EQ
, 1);
1077 n
= mdoc
->last
->child
;
1080 assert(MDOC_TEXT
== n
->type
);
1082 if (NULL
== (stdlibname
= mdoc_a2lib(n
->string
)))
1083 mandoc_asprintf(&libname
,
1084 "library \\(lq%s\\(rq", n
->string
);
1086 libname
= mandoc_strdup(stdlibname
);
1089 n
->string
= libname
;
1094 post_eoln(POST_ARGS
)
1097 if (mdoc
->last
->child
)
1098 mdoc_nmsg(mdoc
, mdoc
->last
, MANDOCERR_ARGSLOST
);
1105 const struct mdoc_node
*n
;
1108 * The Vt macro comes in both ELEM and BLOCK form, both of which
1109 * have different syntaxes (yet more context-sensitive
1110 * behaviour). ELEM types must have a child, which is already
1111 * guaranteed by the in_line parsing routine; BLOCK types,
1112 * specifically the BODY, should only have TEXT children.
1115 if (MDOC_BODY
!= mdoc
->last
->type
)
1118 for (n
= mdoc
->last
->child
; n
; n
= n
->next
)
1119 if (MDOC_TEXT
!= n
->type
)
1120 mandoc_msg(MANDOCERR_VT_CHILD
, mdoc
->parse
,
1121 n
->line
, n
->pos
, mdoc_macronames
[n
->tok
]);
1130 if (NULL
!= mdoc
->meta
.name
)
1133 mdoc_deroff(&mdoc
->meta
.name
, mdoc
->last
);
1135 if (NULL
== mdoc
->meta
.name
) {
1136 mdoc_nmsg(mdoc
, mdoc
->last
, MANDOCERR_NONAME
);
1137 mdoc
->meta
.name
= mandoc_strdup("UNKNOWN");
1143 post_literal(POST_ARGS
)
1147 * The `Dl' (note "el" not "one") and `Bd' macros unset the
1148 * MDOC_LITERAL flag as they leave. Note that `Bd' only sets
1149 * this in literal mode, but it doesn't hurt to just switch it
1150 * off in general since displays can't be nested.
1153 if (MDOC_BODY
== mdoc
->last
->type
)
1154 mdoc
->flags
&= ~MDOC_LITERAL
;
1160 post_defaults(POST_ARGS
)
1162 struct mdoc_node
*nn
;
1165 * The `Ar' defaults to "file ..." if no value is provided as an
1166 * argument; the `Mt' and `Pa' macros use "~"; the `Li' just
1167 * gets an empty string.
1170 if (mdoc
->last
->child
)
1174 mdoc
->next
= MDOC_NEXT_CHILD
;
1178 if ( ! mdoc_word_alloc(mdoc
, nn
->line
, nn
->pos
, "file"))
1180 if ( ! mdoc_word_alloc(mdoc
, nn
->line
, nn
->pos
, "..."))
1184 if ( ! mdoc_word_alloc(mdoc
, nn
->line
, nn
->pos
, "AT&T"))
1186 if ( ! mdoc_word_alloc(mdoc
, nn
->line
, nn
->pos
, "UNIX"))
1190 if ( ! mdoc_word_alloc(mdoc
, nn
->line
, nn
->pos
, ""))
1196 if ( ! mdoc_word_alloc(mdoc
, nn
->line
, nn
->pos
, "~"))
1211 struct mdoc_node
*n
;
1212 const char *std_att
;
1216 * If we have a child, look it up in the standard keys. If a
1217 * key exist, use that instead of the child; if it doesn't,
1218 * prefix "AT&T UNIX " to the existing data.
1221 if (NULL
== (n
= mdoc
->last
->child
))
1224 assert(MDOC_TEXT
== n
->type
);
1225 if (NULL
== (std_att
= mdoc_a2att(n
->string
))) {
1226 mdoc_nmsg(mdoc
, mdoc
->last
, MANDOCERR_BADATT
);
1227 mandoc_asprintf(&att
, "AT&T UNIX %s", n
->string
);
1229 att
= mandoc_strdup(std_att
);
1239 struct mdoc_node
*np
;
1242 if (AUTH__NONE
== np
->norm
->An
.auth
) {
1244 check_count(mdoc
, MDOC_ELEM
, CHECK_WARN
, CHECK_GT
, 0);
1245 } else if (np
->child
)
1246 check_count(mdoc
, MDOC_ELEM
, CHECK_WARN
, CHECK_EQ
, 0);
1255 if (MDOC_BLOCK
== mdoc
->last
->type
)
1256 mdoc
->last
->norm
->Es
= mdoc
->last_es
;
1264 mdoc
->last_es
= mdoc
->last
;
1273 struct mdoc_node
*n
, *c
;
1276 if (MDOC_BLOCK
!= mdoc
->last
->type
)
1279 n
= mdoc
->last
->parent
->parent
;
1280 lt
= n
->norm
->Bl
.type
;
1282 if (LIST__NONE
== lt
) {
1283 mdoc_nmsg(mdoc
, mdoc
->last
, MANDOCERR_LISTTYPE
);
1289 if (mdoc
->last
->head
->child
)
1291 /* FIXME: give this a dummy value. */
1292 mdoc_nmsg(mdoc
, mdoc
->last
, MANDOCERR_NOARGS
);
1301 if (NULL
== mdoc
->last
->head
->child
)
1302 mdoc_nmsg(mdoc
, mdoc
->last
, MANDOCERR_NOARGS
);
1311 if (NULL
== mdoc
->last
->body
->child
)
1312 mdoc_nmsg(mdoc
, mdoc
->last
, MANDOCERR_NOBODY
);
1315 if (mdoc
->last
->head
->child
)
1316 mdoc_nmsg(mdoc
, mdoc
->last
, MANDOCERR_ARGSLOST
);
1319 cols
= (int)n
->norm
->Bl
.ncols
;
1321 assert(NULL
== mdoc
->last
->head
->child
);
1323 if (NULL
== mdoc
->last
->body
->child
)
1324 mdoc_nmsg(mdoc
, mdoc
->last
, MANDOCERR_NOBODY
);
1326 for (i
= 0, c
= mdoc
->last
->child
; c
; c
= c
->next
)
1327 if (MDOC_BODY
== c
->type
)
1331 er
= MANDOCERR_ARGCOUNT
;
1332 else if (i
== cols
|| i
== cols
+ 1)
1335 er
= MANDOCERR_SYNTARGCOUNT
;
1337 mandoc_vmsg(er
, mdoc
->parse
,
1338 mdoc
->last
->line
, mdoc
->last
->pos
,
1339 "columns == %d (have %d)", cols
, i
);
1340 return(MANDOCERR_ARGCOUNT
== er
);
1349 post_bl_block(POST_ARGS
)
1351 struct mdoc_node
*n
, *ni
, *nc
;
1354 * These are fairly complicated, so we've broken them into two
1355 * functions. post_bl_block_tag() is called when a -tag is
1356 * specified, but no -width (it must be guessed). The second
1357 * when a -width is specified (macro indicators must be
1358 * rewritten into real lengths).
1363 if (LIST_tag
== n
->norm
->Bl
.type
&&
1364 NULL
== n
->norm
->Bl
.width
) {
1365 if ( ! post_bl_block_tag(mdoc
))
1367 assert(n
->norm
->Bl
.width
);
1368 } else if (NULL
!= n
->norm
->Bl
.width
) {
1369 if ( ! post_bl_block_width(mdoc
))
1371 assert(n
->norm
->Bl
.width
);
1374 for (ni
= n
->body
->child
; ni
; ni
= ni
->next
) {
1375 if (NULL
== ni
->body
)
1377 nc
= ni
->body
->last
;
1378 while (NULL
!= nc
) {
1390 if (NULL
== ni
->next
) {
1391 mandoc_msg(MANDOCERR_PAR_MOVE
,
1392 mdoc
->parse
, nc
->line
, nc
->pos
,
1393 mdoc_macronames
[nc
->tok
]);
1394 if ( ! mdoc_node_relink(mdoc
, nc
))
1396 } else if (0 == n
->norm
->Bl
.comp
&&
1397 LIST_column
!= n
->norm
->Bl
.type
) {
1398 mandoc_vmsg(MANDOCERR_PAR_SKIP
,
1399 mdoc
->parse
, nc
->line
, nc
->pos
,
1401 mdoc_macronames
[nc
->tok
]);
1402 mdoc_node_delete(mdoc
, nc
);
1405 nc
= ni
->body
->last
;
1412 post_bl_block_width(POST_ARGS
)
1417 struct mdoc_node
*n
;
1423 * Calculate the real width of a list from the -width string,
1424 * which may contain a macro (with a known default width), a
1425 * literal string, or a scaling width.
1427 * If the value to -width is a macro, then we re-write it to be
1428 * the macro's width as set in share/tmac/mdoc/doc-common.
1431 if (0 == strcmp(n
->norm
->Bl
.width
, "Ds"))
1433 else if (MDOC_MAX
== (tok
= mdoc_hash_find(n
->norm
->Bl
.width
)))
1435 else if (0 == (width
= macro2len(tok
))) {
1436 mdoc_nmsg(mdoc
, n
, MANDOCERR_BADWIDTH
);
1440 /* The value already exists: free and reallocate it. */
1444 for (i
= 0; i
< (int)n
->args
->argc
; i
++)
1445 if (MDOC_Width
== n
->args
->argv
[i
].arg
)
1448 assert(i
< (int)n
->args
->argc
);
1450 (void)snprintf(buf
, sizeof(buf
), "%un", (unsigned int)width
);
1451 free(n
->args
->argv
[i
].value
[0]);
1452 n
->args
->argv
[i
].value
[0] = mandoc_strdup(buf
);
1454 /* Set our width! */
1455 n
->norm
->Bl
.width
= n
->args
->argv
[i
].value
[0];
1460 post_bl_block_tag(POST_ARGS
)
1462 struct mdoc_node
*n
, *nn
;
1468 * Calculate the -width for a `Bl -tag' list if it hasn't been
1469 * provided. Uses the first head macro. NOTE AGAIN: this is
1470 * ONLY if the -width argument has NOT been provided. See
1471 * post_bl_block_width() for converting the -width string.
1477 for (nn
= n
->body
->child
; nn
; nn
= nn
->next
) {
1478 if (MDOC_It
!= nn
->tok
)
1481 assert(MDOC_BLOCK
== nn
->type
);
1482 nn
= nn
->head
->child
;
1487 if (MDOC_TEXT
== nn
->type
) {
1488 sz
= strlen(nn
->string
) + 1;
1492 if (0 != (ssz
= macro2len(nn
->tok
)))
1498 /* Defaults to ten ens. */
1500 (void)snprintf(buf
, sizeof(buf
), "%un", (unsigned int)sz
);
1503 * We have to dynamically add this to the macro's argument list.
1504 * We're guaranteed that a MDOC_Width doesn't already exist.
1508 i
= (int)(n
->args
->argc
)++;
1510 n
->args
->argv
= mandoc_reallocarray(n
->args
->argv
,
1511 n
->args
->argc
, sizeof(struct mdoc_argv
));
1513 n
->args
->argv
[i
].arg
= MDOC_Width
;
1514 n
->args
->argv
[i
].line
= n
->line
;
1515 n
->args
->argv
[i
].pos
= n
->pos
;
1516 n
->args
->argv
[i
].sz
= 1;
1517 n
->args
->argv
[i
].value
= mandoc_malloc(sizeof(char *));
1518 n
->args
->argv
[i
].value
[0] = mandoc_strdup(buf
);
1520 /* Set our width! */
1521 n
->norm
->Bl
.width
= n
->args
->argv
[i
].value
[0];
1526 post_bl_head(POST_ARGS
)
1528 struct mdoc_node
*np
, *nn
, *nnp
;
1531 if (LIST_column
!= mdoc
->last
->norm
->Bl
.type
)
1532 /* FIXME: this should be ERROR class... */
1533 return(hwarn_eq0(mdoc
));
1536 * Convert old-style lists, where the column width specifiers
1537 * trail as macro parameters, to the new-style ("normal-form")
1538 * lists where they're argument values following -column.
1541 /* First, disallow both types and allow normal-form. */
1544 * TODO: technically, we can accept both and just merge the two
1545 * lists, but I'll leave that for another day.
1548 if (mdoc
->last
->norm
->Bl
.ncols
&& mdoc
->last
->nchild
) {
1549 mdoc_nmsg(mdoc
, mdoc
->last
, MANDOCERR_COLUMNS
);
1551 } else if (NULL
== mdoc
->last
->child
)
1554 np
= mdoc
->last
->parent
;
1557 for (j
= 0; j
< (int)np
->args
->argc
; j
++)
1558 if (MDOC_Column
== np
->args
->argv
[j
].arg
)
1561 assert(j
< (int)np
->args
->argc
);
1562 assert(0 == np
->args
->argv
[j
].sz
);
1565 * Accommodate for new-style groff column syntax. Shuffle the
1566 * child nodes, all of which must be TEXT, as arguments for the
1567 * column field. Then, delete the head children.
1570 np
->args
->argv
[j
].sz
= (size_t)mdoc
->last
->nchild
;
1571 np
->args
->argv
[j
].value
= mandoc_reallocarray(NULL
,
1572 (size_t)mdoc
->last
->nchild
, sizeof(char *));
1574 mdoc
->last
->norm
->Bl
.ncols
= np
->args
->argv
[j
].sz
;
1575 mdoc
->last
->norm
->Bl
.cols
= (void *)np
->args
->argv
[j
].value
;
1577 for (i
= 0, nn
= mdoc
->last
->child
; nn
; i
++) {
1578 np
->args
->argv
[j
].value
[i
] = nn
->string
;
1582 mdoc_node_delete(NULL
, nnp
);
1585 mdoc
->last
->nchild
= 0;
1586 mdoc
->last
->child
= NULL
;
1594 struct mdoc_node
*nparent
, *nprev
; /* of the Bl block */
1595 struct mdoc_node
*nblock
, *nbody
; /* of the Bl */
1596 struct mdoc_node
*nchild
, *nnext
; /* of the Bl body */
1599 switch (nbody
->type
) {
1601 return(post_bl_block(mdoc
));
1603 return(post_bl_head(mdoc
));
1610 nchild
= nbody
->child
;
1611 while (NULL
!= nchild
) {
1612 if (MDOC_It
== nchild
->tok
|| MDOC_Sm
== nchild
->tok
) {
1613 nchild
= nchild
->next
;
1617 mandoc_msg(MANDOCERR_BL_MOVE
, mdoc
->parse
,
1618 nchild
->line
, nchild
->pos
,
1619 mdoc_macronames
[nchild
->tok
]);
1622 * Move the node out of the Bl block.
1623 * First, collect all required node pointers.
1626 nblock
= nbody
->parent
;
1627 nprev
= nblock
->prev
;
1628 nparent
= nblock
->parent
;
1629 nnext
= nchild
->next
;
1632 * Unlink this child.
1635 assert(NULL
== nchild
->prev
);
1636 if (0 == --nbody
->nchild
) {
1637 nbody
->child
= NULL
;
1639 assert(NULL
== nnext
);
1641 nbody
->child
= nnext
;
1646 * Relink this child.
1649 nchild
->parent
= nparent
;
1650 nchild
->prev
= nprev
;
1651 nchild
->next
= nblock
;
1653 nblock
->prev
= nchild
;
1656 nparent
->child
= nchild
;
1658 nprev
->next
= nchild
;
1667 ebool(struct mdoc
*mdoc
)
1670 if (NULL
== mdoc
->last
->child
) {
1671 if (MDOC_Sm
== mdoc
->last
->tok
)
1672 mdoc
->flags
^= MDOC_SMOFF
;
1676 check_count(mdoc
, MDOC_ELEM
, CHECK_WARN
, CHECK_LT
, 2);
1678 assert(MDOC_TEXT
== mdoc
->last
->child
->type
);
1680 if (0 == strcmp(mdoc
->last
->child
->string
, "on")) {
1681 if (MDOC_Sm
== mdoc
->last
->tok
)
1682 mdoc
->flags
&= ~MDOC_SMOFF
;
1685 if (0 == strcmp(mdoc
->last
->child
->string
, "off")) {
1686 if (MDOC_Sm
== mdoc
->last
->tok
)
1687 mdoc
->flags
|= MDOC_SMOFF
;
1691 mdoc_nmsg(mdoc
, mdoc
->last
, MANDOCERR_BADBOOL
);
1696 post_root(POST_ARGS
)
1699 struct mdoc_node
*n
;
1703 /* Check that we have a finished prologue. */
1705 if ( ! (MDOC_PBODY
& mdoc
->flags
)) {
1707 mdoc_nmsg(mdoc
, mdoc
->first
, MANDOCERR_NODOCPROLOG
);
1713 /* Check that we begin with a proper `Sh'. */
1715 if (NULL
== n
->child
)
1716 mdoc_nmsg(mdoc
, n
, MANDOCERR_DOC_EMPTY
);
1717 else if (MDOC_Sh
!= n
->child
->tok
)
1718 mandoc_msg(MANDOCERR_SEC_BEFORE
, mdoc
->parse
,
1719 n
->child
->line
, n
->child
->pos
,
1720 mdoc_macronames
[n
->child
->tok
]);
1728 struct mdoc_node
*ch
;
1731 if (NULL
== (ch
= mdoc
->last
->child
)) {
1732 mandoc_msg(MANDOCERR_MACRO_EMPTY
, mdoc
->parse
,
1733 mdoc
->last
->line
, mdoc
->last
->pos
,
1734 mdoc_macronames
[mdoc
->last
->tok
]);
1735 mdoc_node_delete(mdoc
, mdoc
->last
);
1739 assert(MDOC_TEXT
== ch
->type
);
1741 if (NULL
== (p
= mdoc_a2st(ch
->string
))) {
1742 mdoc_nmsg(mdoc
, mdoc
->last
, MANDOCERR_BADSTANDARD
);
1743 mdoc_node_delete(mdoc
, mdoc
->last
);
1746 ch
->string
= mandoc_strdup(p
);
1755 struct mdoc_node
*nn
, *next
, *prev
;
1758 switch (mdoc
->last
->type
) {
1760 check_count(mdoc
, MDOC_HEAD
, CHECK_WARN
, CHECK_EQ
, 0);
1763 if (mdoc
->last
->child
)
1765 check_count(mdoc
, MDOC_BODY
, CHECK_WARN
, CHECK_GT
, 0);
1772 * Make sure only certain types of nodes are allowed within the
1773 * `Rs' body. Delete offending nodes and raise a warning.
1774 * Do this before re-ordering for the sake of clarity.
1778 for (nn
= mdoc
->last
->child
; nn
; nn
= next
) {
1779 for (i
= 0; i
< RSORD_MAX
; i
++)
1780 if (nn
->tok
== rsord
[i
])
1783 if (i
< RSORD_MAX
) {
1784 if (MDOC__J
== rsord
[i
] || MDOC__B
== rsord
[i
])
1785 mdoc
->last
->norm
->Rs
.quote_T
++;
1791 mandoc_msg(MANDOCERR_RS_SKIP
, mdoc
->parse
,
1792 nn
->line
, nn
->pos
, mdoc_macronames
[nn
->tok
]);
1793 mdoc_node_delete(mdoc
, nn
);
1797 * Nothing to sort if only invalid nodes were found
1798 * inside the `Rs' body.
1801 if (NULL
== mdoc
->last
->child
)
1805 * The full `Rs' block needs special handling to order the
1806 * sub-elements according to `rsord'. Pick through each element
1807 * and correctly order it. This is an insertion sort.
1811 for (nn
= mdoc
->last
->child
->next
; nn
; nn
= next
) {
1812 /* Determine order of `nn'. */
1813 for (i
= 0; i
< RSORD_MAX
; i
++)
1814 if (rsord
[i
] == nn
->tok
)
1818 * Remove `nn' from the chain. This somewhat
1819 * repeats mdoc_node_unlink(), but since we're
1820 * just re-ordering, there's no need for the
1821 * full unlink process.
1824 if (NULL
!= (next
= nn
->next
))
1825 next
->prev
= nn
->prev
;
1827 if (NULL
!= (prev
= nn
->prev
))
1828 prev
->next
= nn
->next
;
1830 nn
->prev
= nn
->next
= NULL
;
1833 * Scan back until we reach a node that's
1834 * ordered before `nn'.
1837 for ( ; prev
; prev
= prev
->prev
) {
1838 /* Determine order of `prev'. */
1839 for (j
= 0; j
< RSORD_MAX
; j
++)
1840 if (rsord
[j
] == prev
->tok
)
1848 * Set `nn' back into its correct place in front
1849 * of the `prev' node.
1856 prev
->next
->prev
= nn
;
1857 nn
->next
= prev
->next
;
1860 mdoc
->last
->child
->prev
= nn
;
1861 nn
->next
= mdoc
->last
->child
;
1862 mdoc
->last
->child
= nn
;
1870 * For some arguments of some macros,
1871 * convert all breakable hyphens into ASCII_HYPH.
1874 post_hyph(POST_ARGS
)
1876 struct mdoc_node
*n
, *nch
;
1882 if (MDOC_Sh
== n
->tok
|| MDOC_Ss
== n
->tok
)
1886 if (MDOC_D1
== n
->tok
|| MDOC_Nd
== n
->tok
)
1895 for (nch
= n
->child
; nch
; nch
= nch
->next
) {
1896 if (MDOC_TEXT
!= nch
->type
)
1901 while ('\0' != *(++cp
))
1903 isalpha((unsigned char)cp
[-1]) &&
1904 isalpha((unsigned char)cp
[1]))
1914 if (MDOC_LINE
& mdoc
->last
->flags
)
1915 mdoc_nmsg(mdoc
, mdoc
->last
, MANDOCERR_NS_SKIP
);
1923 if (MDOC_HEAD
== mdoc
->last
->type
)
1924 return(post_sh_head(mdoc
));
1925 if (MDOC_BODY
== mdoc
->last
->type
)
1926 return(post_sh_body(mdoc
));
1932 post_sh_body(POST_ARGS
)
1934 struct mdoc_node
*n
;
1936 if (SEC_NAME
!= mdoc
->lastsec
)
1940 * Warn if the NAME section doesn't contain the `Nm' and `Nd'
1941 * macros (can have multiple `Nm' and one `Nd'). Note that the
1942 * children of the BODY declaration can also be "text".
1945 if (NULL
== (n
= mdoc
->last
->child
)) {
1946 mandoc_msg(MANDOCERR_NAMESEC_BAD
, mdoc
->parse
,
1947 mdoc
->last
->line
, mdoc
->last
->pos
, "empty");
1951 for ( ; n
&& n
->next
; n
= n
->next
) {
1952 if (MDOC_ELEM
== n
->type
&& MDOC_Nm
== n
->tok
)
1954 if (MDOC_TEXT
== n
->type
)
1956 mandoc_msg(MANDOCERR_NAMESEC_BAD
, mdoc
->parse
,
1957 n
->line
, n
->pos
, mdoc_macronames
[n
->tok
]);
1961 if (MDOC_BLOCK
== n
->type
&& MDOC_Nd
== n
->tok
)
1964 mandoc_msg(MANDOCERR_NAMESEC_BAD
, mdoc
->parse
,
1965 n
->line
, n
->pos
, mdoc_macronames
[n
->tok
]);
1970 post_sh_head(POST_ARGS
)
1972 struct mdoc_node
*n
;
1973 const char *goodsec
;
1978 * Process a new section. Sections are either "named" or
1979 * "custom". Custom sections are user-defined, while named ones
1980 * follow a conventional order and may only appear in certain
1986 mdoc_deroff(&secname
, mdoc
->last
);
1987 sec
= NULL
== secname
? SEC_CUSTOM
: a2sec(secname
);
1989 /* The NAME should be first. */
1991 if (SEC_NAME
!= sec
&& SEC_NONE
== mdoc
->lastnamed
)
1992 mandoc_msg(MANDOCERR_NAMESEC_FIRST
, mdoc
->parse
,
1993 mdoc
->last
->line
, mdoc
->last
->pos
, secname
);
1995 /* The SYNOPSIS gets special attention in other areas. */
1997 if (SEC_SYNOPSIS
== sec
) {
1998 roff_setreg(mdoc
->roff
, "nS", 1, '=');
1999 mdoc
->flags
|= MDOC_SYNOPSIS
;
2001 roff_setreg(mdoc
->roff
, "nS", 0, '=');
2002 mdoc
->flags
&= ~MDOC_SYNOPSIS
;
2005 /* Mark our last section. */
2007 mdoc
->lastsec
= sec
;
2010 * Set the section attribute for the current HEAD, for its
2011 * parent BLOCK, and for the HEAD children; the latter can
2012 * only be TEXT nodes, so no recursion is needed.
2013 * For other blocks and elements, including .Sh BODY, this is
2014 * done when allocating the node data structures, but for .Sh
2015 * BLOCK and HEAD, the section is still unknown at that time.
2018 mdoc
->last
->parent
->sec
= sec
;
2019 mdoc
->last
->sec
= sec
;
2020 for (n
= mdoc
->last
->child
; n
; n
= n
->next
)
2023 /* We don't care about custom sections after this. */
2025 if (SEC_CUSTOM
== sec
) {
2031 * Check whether our non-custom section is being repeated or is
2035 if (sec
== mdoc
->lastnamed
)
2036 mandoc_msg(MANDOCERR_SEC_REP
, mdoc
->parse
,
2037 mdoc
->last
->line
, mdoc
->last
->pos
, secname
);
2039 if (sec
< mdoc
->lastnamed
)
2040 mandoc_msg(MANDOCERR_SEC_ORDER
, mdoc
->parse
,
2041 mdoc
->last
->line
, mdoc
->last
->pos
, secname
);
2043 /* Mark the last named section. */
2045 mdoc
->lastnamed
= sec
;
2047 /* Check particular section/manual conventions. */
2049 assert(mdoc
->meta
.msec
);
2054 if (*mdoc
->meta
.msec
== '4')
2056 goodsec
= "2, 3, 4, 9";
2058 case SEC_RETURN_VALUES
:
2061 if (*mdoc
->meta
.msec
== '2')
2063 if (*mdoc
->meta
.msec
== '3')
2065 if (NULL
== goodsec
)
2066 goodsec
= "2, 3, 9";
2069 if (*mdoc
->meta
.msec
== '9')
2071 if (NULL
== goodsec
)
2073 mandoc_vmsg(MANDOCERR_SEC_MSEC
, mdoc
->parse
,
2074 mdoc
->last
->line
, mdoc
->last
->pos
,
2075 "%s for %s only", secname
, goodsec
);
2086 post_ignpar(POST_ARGS
)
2088 struct mdoc_node
*np
;
2090 if (MDOC_BODY
!= mdoc
->last
->type
)
2093 if (NULL
!= (np
= mdoc
->last
->child
))
2094 if (MDOC_Pp
== np
->tok
|| MDOC_Lp
== np
->tok
) {
2095 mandoc_vmsg(MANDOCERR_PAR_SKIP
,
2096 mdoc
->parse
, np
->line
, np
->pos
,
2097 "%s after %s", mdoc_macronames
[np
->tok
],
2098 mdoc_macronames
[mdoc
->last
->tok
]);
2099 mdoc_node_delete(mdoc
, np
);
2102 if (NULL
!= (np
= mdoc
->last
->last
))
2103 if (MDOC_Pp
== np
->tok
|| MDOC_Lp
== np
->tok
) {
2104 mandoc_vmsg(MANDOCERR_PAR_SKIP
, mdoc
->parse
,
2105 np
->line
, np
->pos
, "%s at the end of %s",
2106 mdoc_macronames
[np
->tok
],
2107 mdoc_macronames
[mdoc
->last
->tok
]);
2108 mdoc_node_delete(mdoc
, np
);
2118 if (NULL
== mdoc
->last
)
2120 if (MDOC_ELEM
!= n
->type
&& MDOC_BLOCK
!= n
->type
)
2124 * Don't allow `Lp' or `Pp' prior to a paragraph-type
2125 * block: `Lp', `Pp', or non-compact `Bd' or `Bl'.
2128 if (MDOC_Pp
!= mdoc
->last
->tok
&&
2129 MDOC_Lp
!= mdoc
->last
->tok
&&
2130 MDOC_br
!= mdoc
->last
->tok
)
2132 if (MDOC_Bl
== n
->tok
&& n
->norm
->Bl
.comp
)
2134 if (MDOC_Bd
== n
->tok
&& n
->norm
->Bd
.comp
)
2136 if (MDOC_It
== n
->tok
&& n
->parent
->norm
->Bl
.comp
)
2139 mandoc_vmsg(MANDOCERR_PAR_SKIP
, mdoc
->parse
,
2140 mdoc
->last
->line
, mdoc
->last
->pos
,
2141 "%s before %s", mdoc_macronames
[mdoc
->last
->tok
],
2142 mdoc_macronames
[n
->tok
]);
2143 mdoc_node_delete(mdoc
, mdoc
->last
);
2150 struct mdoc_node
*np
;
2152 if (MDOC_ELEM
!= mdoc
->last
->type
&&
2153 MDOC_BLOCK
!= mdoc
->last
->type
)
2156 if (NULL
== (np
= mdoc
->last
->prev
)) {
2157 np
= mdoc
->last
->parent
;
2158 if (MDOC_Sh
!= np
->tok
&& MDOC_Ss
!= np
->tok
)
2161 if (MDOC_Pp
!= np
->tok
&& MDOC_Lp
!= np
->tok
&&
2162 (MDOC_br
!= mdoc
->last
->tok
||
2163 (MDOC_sp
!= np
->tok
&& MDOC_br
!= np
->tok
)))
2167 mandoc_vmsg(MANDOCERR_PAR_SKIP
, mdoc
->parse
,
2168 mdoc
->last
->line
, mdoc
->last
->pos
,
2169 "%s after %s", mdoc_macronames
[mdoc
->last
->tok
],
2170 mdoc_macronames
[np
->tok
]);
2171 mdoc_node_delete(mdoc
, mdoc
->last
);
2176 pre_literal(PRE_ARGS
)
2179 if (MDOC_BODY
!= n
->type
)
2183 * The `Dl' (note "el" not "one") and `Bd -literal' and `Bd
2184 * -unfilled' macros set MDOC_LITERAL on entrance to the body.
2189 mdoc
->flags
|= MDOC_LITERAL
;
2192 if (DISP_literal
== n
->norm
->Bd
.type
)
2193 mdoc
->flags
|= MDOC_LITERAL
;
2194 if (DISP_unfilled
== n
->norm
->Bd
.type
)
2195 mdoc
->flags
|= MDOC_LITERAL
;
2208 struct mdoc_node
*n
;
2211 if (mdoc
->meta
.date
)
2212 free(mdoc
->meta
.date
);
2215 if (NULL
== n
->child
|| '\0' == n
->child
->string
[0]) {
2216 mdoc
->meta
.date
= mdoc
->quick
? mandoc_strdup("") :
2217 mandoc_normdate(mdoc
->parse
, NULL
, n
->line
, n
->pos
);
2222 mdoc_deroff(&datestr
, n
);
2224 mdoc
->meta
.date
= datestr
;
2226 mdoc
->meta
.date
= mandoc_normdate(mdoc
->parse
,
2227 datestr
, n
->line
, n
->pos
);
2236 struct mdoc_node
*nn
, *n
;
2242 if (mdoc
->meta
.title
)
2243 free(mdoc
->meta
.title
);
2245 free(mdoc
->meta
.vol
);
2246 if (mdoc
->meta
.arch
)
2247 free(mdoc
->meta
.arch
);
2249 mdoc
->meta
.title
= mdoc
->meta
.vol
= mdoc
->meta
.arch
= NULL
;
2251 /* First check that all characters are uppercase. */
2253 if (NULL
!= (nn
= n
->child
))
2254 for (p
= nn
->string
; *p
; p
++) {
2255 if (toupper((unsigned char)*p
) == *p
)
2257 mandoc_msg(MANDOCERR_TITLE_CASE
,
2258 mdoc
->parse
, nn
->line
,
2259 nn
->pos
+ (p
- nn
->string
),
2265 * title = UNKNOWN, volume = LOCAL, msec = 1, arch = NULL
2268 if (NULL
== (nn
= n
->child
)) {
2269 /* XXX: make these macro values. */
2270 /* FIXME: warn about missing values. */
2271 mdoc
->meta
.title
= mandoc_strdup("UNKNOWN");
2272 mdoc
->meta
.vol
= mandoc_strdup("LOCAL");
2273 mdoc
->meta
.msec
= mandoc_strdup("1");
2277 /* Handles: `.Dt TITLE'
2278 * title = TITLE, volume = LOCAL, msec = 1, arch = NULL
2281 mdoc
->meta
.title
= mandoc_strdup(
2282 '\0' == nn
->string
[0] ? "UNKNOWN" : nn
->string
);
2284 if (NULL
== (nn
= nn
->next
)) {
2285 /* FIXME: warn about missing msec. */
2286 /* XXX: make this a macro value. */
2287 mdoc
->meta
.vol
= mandoc_strdup("LOCAL");
2288 mdoc
->meta
.msec
= mandoc_strdup("1");
2292 /* Handles: `.Dt TITLE SEC'
2294 * volume = SEC is msec ? format(msec) : SEC,
2295 * msec = SEC (copied verbatim either way),
2299 cp
= mandoc_a2msec(nn
->string
);
2301 mdoc
->meta
.vol
= mandoc_strdup(cp
);
2302 mdoc
->meta
.msec
= mandoc_strdup(nn
->string
);
2304 mandoc_msg(MANDOCERR_MSEC_BAD
, mdoc
->parse
,
2305 nn
->line
, nn
->pos
, nn
->string
);
2306 mdoc
->meta
.vol
= mandoc_strdup(nn
->string
);
2307 mdoc
->meta
.msec
= mandoc_strdup(nn
->string
);
2310 if (NULL
== (nn
= nn
->next
))
2313 /* Handles: `.Dt TITLE SEC VOL'
2315 * volume = VOL is vol ? format(VOL) :
2316 * VOL is arch ? format(arch) :
2320 cp
= mdoc_a2vol(nn
->string
);
2322 free(mdoc
->meta
.vol
);
2323 mdoc
->meta
.vol
= mandoc_strdup(cp
);
2325 cp
= mdoc_a2arch(nn
->string
);
2327 mandoc_msg(MANDOCERR_ARCH_BAD
, mdoc
->parse
,
2328 nn
->line
, nn
->pos
, nn
->string
);
2329 free(mdoc
->meta
.vol
);
2330 mdoc
->meta
.vol
= mandoc_strdup(nn
->string
);
2332 mdoc
->meta
.arch
= mandoc_strdup(cp
);
2335 /* Ignore any subsequent parameters... */
2336 /* FIXME: warn about subsequent parameters. */
2342 post_prol(POST_ARGS
)
2345 * Remove prologue macros from the document after they're
2346 * processed. The final document uses mdoc_meta for these
2347 * values and discards the originals.
2350 mdoc_node_delete(mdoc
, mdoc
->last
);
2351 if (mdoc
->meta
.title
&& mdoc
->meta
.date
&& mdoc
->meta
.os
)
2352 mdoc
->flags
|= MDOC_PBODY
;
2360 struct mdoc_node
*n
;
2363 * Make `Bx's second argument always start with an uppercase
2364 * letter. Groff checks if it's an "accepted" term, but we just
2365 * uppercase blindly.
2368 n
= mdoc
->last
->child
;
2369 if (n
&& NULL
!= (n
= n
->next
))
2370 *n
->string
= (char)toupper((unsigned char)*n
->string
);
2379 struct utsname utsname
;
2380 static char *defbuf
;
2382 struct mdoc_node
*n
;
2387 * Set the operating system by way of the `Os' macro.
2388 * The order of precedence is:
2389 * 1. the argument of the `Os' macro, unless empty
2390 * 2. the -Ios=foo command line argument, if provided
2391 * 3. -DOSNAME="\"foo\"", if provided during compilation
2392 * 4. "sysname release" from uname(3)
2395 free(mdoc
->meta
.os
);
2396 mdoc
->meta
.os
= NULL
;
2397 mdoc_deroff(&mdoc
->meta
.os
, n
);
2402 mdoc
->meta
.os
= mandoc_strdup(mdoc
->defos
);
2407 mdoc
->meta
.os
= mandoc_strdup(OSNAME
);
2409 if (NULL
== defbuf
) {
2410 if (-1 == uname(&utsname
)) {
2411 mdoc_nmsg(mdoc
, n
, MANDOCERR_UNAME
);
2412 defbuf
= mandoc_strdup("UNKNOWN");
2414 mandoc_asprintf(&defbuf
, "%s %s",
2415 utsname
.sysname
, utsname
.release
);
2417 mdoc
->meta
.os
= mandoc_strdup(defbuf
);
2425 struct mdoc_node
*nn
, *n
;
2430 * Macros accepting `-std' as an argument have the name of the
2431 * current document (`Nm') filled in as the argument if it's not
2438 if (NULL
== mdoc
->meta
.name
)
2442 mdoc
->next
= MDOC_NEXT_CHILD
;
2444 if ( ! mdoc_word_alloc(mdoc
, n
->line
, n
->pos
, mdoc
->meta
.name
))
2451 static enum mdoc_sec
2452 a2sec(const char *p
)
2456 for (i
= 0; i
< (int)SEC__MAX
; i
++)
2457 if (secnames
[i
] && 0 == strcmp(p
, secnames
[i
]))
2458 return((enum mdoc_sec
)i
);
2464 macro2len(enum mdoct macro
)