done: .de; todo: """"; loops in macro and string expansion
[mandoc.git] / out.c
diff --git a/out.c b/out.c
index 713e5fa21716e06dc016131d731217bfa04969ad..2a683fae8ed4e7640ee4a5e898800677aebf1f7e 100644 (file)
--- a/out.c
+++ b/out.c
@@ -1,6 +1,6 @@
-/*     $Id: out.c,v 1.10 2009/11/08 09:23:35 kristaps Exp $ */
+/*     $Id: out.c,v 1.29 2010/08/29 11:28:09 kristaps Exp $ */
 /*
- * Copyright (c) 2009 Kristaps Dzonsons <kristaps@kth.se>
+ * Copyright (c) 2009, 2010 Kristaps Dzonsons <kristaps@bsd.lv>
  *
  * Permission to use, copy, modify, and distribute this software for any
  * purpose with or without fee is hereby granted, provided that the above
  * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
  * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
  */
+#ifdef HAVE_CONFIG_H
+#include "config.h"
+#endif
+
 #include <sys/types.h>
 
 #include <assert.h>
 
 #include "out.h"
 
-/* See a2roffdeco(). */
-#define        C2LIM(c, l) do { \
-       (l) = 1; \
-       if ('[' == (c) || '\'' == (c)) \
-               (l) = 0; \
-       else if ('(' == (c)) \
-               (l) = 2; } \
-       while (/* CONSTCOND */ 0)
-
-/* See a2roffdeco(). */
-#define        C2TERM(c, t) do { \
-       (t) = 0; \
-       if ('\'' == (c)) \
-               (t) = 1; \
-       else if ('[' == (c)) \
-               (t) = 2; \
-       else if ('(' == (c)) \
-               (t) = 3; } \
-       while (/* CONSTCOND */ 0)
-
-#ifdef __linux__
-extern size_t    strlcat(char *, const char *, size_t);
-#endif
-
 /* 
  * Convert a `scaling unit' to a consistent form, or fail.  Scaling
  * units are documented in groff.7, mdoc.7, man.7.
@@ -136,11 +116,10 @@ a2roffsu(const char *src, struct roffsu *dst, enum roffscale def)
                return(0);
        }
 
+       /* FIXME: do this in the caller. */
        if ((dst->scale = atof(buf)) < 0)
                dst->scale = 0;
        dst->unit = unit;
-       dst->pt = hasd;
-
        return(1);
 }
 
@@ -187,165 +166,195 @@ time2a(time_t t, char *dst, size_t sz)
 }
 
 
-/* 
- * Returns length of parsed string (the leading "\" should NOT be
- * included).  This can be zero if the current character is the nil
- * terminator.  "d" is set to the type of parsed decorator, which may
- * have an adjoining "word" of size "sz" (e.g., "(ab" -> "ab", 2).
- */
 int
-a2roffdeco(enum roffdeco *d,
-               const char **word, size_t *sz)
+a2roffdeco(enum roffdeco *d, const char **word, size_t *sz)
 {
-       int              j, type, term, lim;
-       const char      *wp, *sp;
+       int              i, j, lim;
+       char             term, c;
+       const char      *wp;
+       enum roffdeco    dd;
 
        *d = DECO_NONE;
+       lim = i = 0;
+       term = '\0';
        wp = *word;
-       type = 1;
-
-       switch (*wp) {
-       case ('\0'):
-               return(0);
 
+       switch ((c = wp[i++])) {
        case ('('):
-               if ('\0' == *(++wp))
-                       return(1);
-               if ('\0' == *(wp + 1))
-                       return(2);
-
                *d = DECO_SPECIAL;
-               *sz = 2;
-               *word = wp;
-               return(3);
-
-       case ('*'):
-               switch (*(++wp)) {
-               case ('\0'):
-                       return(1);
-
-               case ('('):
-                       if ('\0' == *(++wp))
-                               return(2);
-                       if ('\0' == *(wp + 1))
-                               return(3);
-
-                       *d = DECO_RESERVED;
-                       *sz = 2;
-                       *word = wp;
-                       return(4);
-
-               case ('['):
-                       type = 0;
-                       break;
-
-               default:
-                       *d = DECO_RESERVED;
-                       *sz = 1;
-                       *word = wp;
-                       return(2);
-               }
+               lim = 2;
                break;
+       case ('F'):
+               /* FALLTHROUGH */
+       case ('f'):
+               *d = 'F' == c ? DECO_FFONT : DECO_FONT;
 
-       case ('s'):
-               sp = wp;
-               if ('\0' == *(++wp))
-                       return(1);
-
-               C2LIM(*wp, lim);
-               C2TERM(*wp, term);
-
-               if (term) 
-                       wp++;
-
-               *word = wp;
-
-               if (*wp == '+' || *wp == '-')
-                       ++wp;
-
-               switch (*wp) {
-               case ('\''):
-                       /* FALLTHROUGH */
-               case ('['):
-                       /* FALLTHROUGH */
+               switch (wp[i++]) {
                case ('('):
-                       if (term) 
-                               return((int)(wp - sp));
-
-                       C2LIM(*wp, lim);
-                       C2TERM(*wp, term);
-                       wp++;
+                       lim = 2;
                        break;
-               default:
+               case ('['):
+                       term = ']';
                        break;
-               }
-
-               if ( ! isdigit((u_char)*wp))
-                       return((int)(wp - sp));
-
-               for (j = 0; isdigit((u_char)*wp); j++) {
-                       if (lim && j >= lim)
-                               break;
-                       ++wp;
-               }
-
-               if (term && term < 3) {
-                       if (1 == term && *wp != '\'')
-                               return((int)(wp - sp));
-                       if (2 == term && *wp != ']')
-                               return((int)(wp - sp));
-                       ++wp;
-               }
-
-               *d = DECO_SIZE;
-               return((int)(wp - sp));
-
-       case ('f'):
-               switch (*(++wp)) {
-               case ('\0'):
-                       return(1);
                case ('3'):
                        /* FALLTHROUGH */
                case ('B'):
                        *d = DECO_BOLD;
-                       break;
+                       return(i);
                case ('2'):
                        /* FALLTHROUGH */
                case ('I'):
                        *d = DECO_ITALIC;
-                       break;
+                       return(i);
                case ('P'):
                        *d = DECO_PREVIOUS;
-                       break;
+                       return(i);
                case ('1'):
                        /* FALLTHROUGH */
                case ('R'):
                        *d = DECO_ROMAN;
+                       return(i);
+               default:
+                       i--;
+                       lim = 1;
+                       break;
+               }
+               break;
+       case ('k'):
+               /* FALLTHROUGH */
+       case ('M'):
+               /* FALLTHROUGH */
+       case ('m'):
+               /* FALLTHROUGH */
+       case ('*'):
+               if ('*' == c)
+                       *d = DECO_RESERVED;
+
+               switch (wp[i++]) {
+               case ('('):
+                       lim = 2;
+                       break;
+               case ('['):
+                       term = ']';
                        break;
                default:
+                       i--;
+                       lim = 1;
                        break;
                }
+               break;
+       case ('h'):
+               /* FALLTHROUGH */
+       case ('v'):
+               /* FALLTHROUGH */
+       case ('s'):
+               j = 0;
+               if ('+' == wp[i] || '-' == wp[i]) {
+                       i++;
+                       j = 1;
+               }
 
-               return(2);
+               switch (wp[i++]) {
+               case ('('):
+                       lim = 2;
+                       break;
+               case ('['):
+                       term = ']';
+                       break;
+               case ('\''):
+                       term = '\'';
+                       break;
+               case ('0'):
+                       j = 1;
+                       /* FALLTHROUGH */
+               default:
+                       i--;
+                       lim = 1;
+                       break;
+               }
+
+               if ('+' == wp[i] || '-' == wp[i]) {
+                       if (j)
+                               return(i);
+                       i++;
+               } 
+
+               /* Handle embedded numerical subexpression or escape. */
+
+               if ('(' == wp[i]) {
+                       while (wp[i] && ')' != wp[i])
+                               if ('\\' == wp[i++]) {
+                                       /* Handle embedded escape. */
+                                       *word = &wp[i];
+                                       i += a2roffdeco(&dd, word, sz);
+                               }
 
+                       if (')' == wp[i++])
+                               break;
+
+                       *d = DECO_NONE;
+                       return(i - 1);
+               } else if ('\\' == wp[i]) {
+                       *word = &wp[++i];
+                       i += a2roffdeco(&dd, word, sz);
+               }
+
+               break;
        case ('['):
+               *d = DECO_SPECIAL;
+               term = ']';
                break;
-
+       case ('c'):
+               *d = DECO_NOSPACE;
+               return(i);
+       case ('z'):
+               *d = DECO_NONE;
+               if ('\\' == wp[i]) {
+                       *word = &wp[++i];
+                       return(i + a2roffdeco(&dd, word, sz));
+               } else
+                       lim = 1;
+               break;
+       case ('o'):
+               /* FALLTHROUGH */
+       case ('w'):
+               if ('\'' == wp[i++]) {
+                       term = '\'';
+                       break;
+               } 
+               /* FALLTHROUGH */
        default:
-               *d = DECO_SPECIAL;
-               *word = wp;
-               *sz = 1;
-               return(1);
+               *d = DECO_SSPECIAL;
+               i--;
+               lim = 1;
+               break;
+       }
+
+       assert(term || lim);
+       *word = &wp[i];
+
+       if (term) {
+               j = i;
+               while (wp[i] && wp[i] != term)
+                       i++;
+               if ('\0' == wp[i]) {
+                       *d = DECO_NONE;
+                       return(i);
+               }
+
+               assert(i >= j);
+               *sz = (size_t)(i - j);
+
+               return(i + 1);
        }
 
-       *word = ++wp;
-       for (j = 0; *wp && ']' != *wp; wp++, j++)
-               /* Loop... */ ;
+       assert(lim > 0);
+       *sz = (size_t)lim;
 
-       if ('\0' == *wp)
-               return(j + 1);
+       for (j = 0; wp[i] && j < lim; j++)
+               i++;
+       if (j < lim)
+               *d = DECO_NONE;
 
-       *d = type ? DECO_SPECIAL : DECO_RESERVED;
-       *sz = (size_t)j;
-       return (j + 2);
+       return(i);
 }