aboutsummaryrefslogtreecommitdiffstatshomepage
path: root/html.c
diff options
context:
space:
mode:
authorIngo Schwarze <schwarze@openbsd.org>2014-10-29 00:17:43 +0000
committerIngo Schwarze <schwarze@openbsd.org>2014-10-29 00:17:43 +0000
commitada69bce757bdb8fff8d778e0660446c440c7613 (patch)
treec855535ac67e0f62353307e69e90b8952d8ecad3 /html.c
parent3e8d538cdcbed1408b260186b980e5fa4eeb81af (diff)
downloadmandoc-ada69bce757bdb8fff8d778e0660446c440c7613.tar.gz
mandoc-ada69bce757bdb8fff8d778e0660446c440c7613.tar.zst
mandoc-ada69bce757bdb8fff8d778e0660446c440c7613.zip
In terminal output, unify handling of Unicode and numbered character
escape sequences just like it was earlier implemented for -Thtml. Do not let control characters other than ASCII 9 (horizontal tab) propagate to the output, even though groff allows them; but that really doesn't look like a great idea. Let mchars_num2char() return int such that we can distinguish invalid \N syntax from \N'0'. This also reduces the danger of signed char issues popping up.
Diffstat (limited to 'html.c')
-rw-r--r--html.c11
1 files changed, 7 insertions, 4 deletions
diff --git a/html.c b/html.c
index 912c006d..050fefe6 100644
--- a/html.c
+++ b/html.c
@@ -1,4 +1,4 @@
-/* $Id: html.c,v 1.180 2014/10/28 17:36:19 schwarze Exp $ */
+/* $Id: html.c,v 1.181 2014/10/29 00:17:43 schwarze Exp $ */
/*
* Copyright (c) 2008-2011, 2014 Kristaps Dzonsons <kristaps@bsd.lv>
* Copyright (c) 2011, 2012, 2013, 2014 Ingo Schwarze <schwarze@openbsd.org>
@@ -422,9 +422,13 @@ print_encode(struct html *h, const char *p, int norecurse)
break;
case ESCAPE_NUMBERED:
c = mchars_num2char(seq, len);
+ if (c < 0)
+ continue;
break;
case ESCAPE_SPECIAL:
c = mchars_spec2cp(h->symtab, seq, len);
+ if (c <= 0)
+ continue;
break;
case ESCAPE_NOSPACE:
if ('\0' == *p)
@@ -433,9 +437,8 @@ print_encode(struct html *h, const char *p, int norecurse)
default:
continue;
}
- if (c <= 0)
- continue;
- if (c < 0x20 || (c > 0x7E && c < 0xA0))
+ if ((c < 0x20 && c != 0x09) ||
+ (c > 0x7E && c < 0xA0))
c = 0xFFFD;
if (c > 0x7E)
printf("&#%d;", c);