]> git.cameronkatri.com Git - mandoc.git/blobdiff - tbl_data.c
The files mandoc.c and mandoc.h contained both specialised low-level
[mandoc.git] / tbl_data.c
index 3e89ca6a9a0d557e36a4651accbf7ed89dbbffb7..dfb85bd27cdac7c5147be61bebd5d48ab3c6af7c 100644 (file)
@@ -1,6 +1,7 @@
-/*     $Id: tbl_data.c,v 1.2 2010/12/30 09:34:07 kristaps Exp $ */
+/*     $Id: tbl_data.c,v 1.29 2014/03/23 11:25:26 schwarze Exp $ */
 /*
- * Copyright (c) 2009, 2010 Kristaps Dzonsons <kristaps@bsd.lv>
+ * Copyright (c) 2009, 2010, 2011 Kristaps Dzonsons <kristaps@bsd.lv>
+ * Copyright (c) 2011 Ingo Schwarze <schwarze@openbsd.org>
  *
  * Permission to use, copy, modify, and distribute this software for any
  * purpose with or without fee is hereby granted, provided that the above
  * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
  * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
  */
+#ifdef HAVE_CONFIG_H
+#include "config.h"
+#endif
+
 #include <assert.h>
 #include <ctype.h>
 #include <stdlib.h>
 #include <string.h>
+#include <time.h>
 
 #include "mandoc.h"
+#include "mandoc_aux.h"
 #include "libmandoc.h"
 #include "libroff.h"
 
-static void    data(struct tbl *, struct tbl_span *, 
-                       int, const char *, int *);
+static int              getdata(struct tbl_node *, struct tbl_span *, 
+                               int, const char *, int *);
+static struct tbl_span *newspan(struct tbl_node *, int, 
+                               struct tbl_row *);
 
-void
-data(struct tbl *tbl, struct tbl_span *dp, 
+static int
+getdata(struct tbl_node *tbl, struct tbl_span *dp, 
                int ln, const char *p, int *pos)
 {
        struct tbl_dat  *dat;
-       int              sv;
+       struct tbl_cell *cp;
+       int              sv, spans;
+
+       cp = NULL;
+       if (dp->last && dp->last->layout)
+               cp = dp->last->layout->next;
+       else if (NULL == dp->last)
+               cp = dp->layout->first;
+
+       /* 
+        * Skip over spanners, since
+        * we want to match data with data layout cells in the header.
+        */
+
+       while (cp && TBL_CELL_SPAN == cp->pos)
+               cp = cp->next;
 
-       /* FIXME: warn about losing data contents if cell is HORIZ. */
+       /*
+        * Stop processing when we reach the end of the available layout
+        * cells.  This means that we have extra input.
+        */
+
+       if (NULL == cp) {
+               mandoc_msg(MANDOCERR_TBLEXTRADAT, 
+                               tbl->parse, ln, *pos, NULL);
+               /* Skip to the end... */
+               while (p[*pos])
+                       (*pos)++;
+               return(1);
+       }
 
        dat = mandoc_calloc(1, sizeof(struct tbl_dat));
+       dat->layout = cp;
+       dat->pos = TBL_DATA_NONE;
+
+       assert(TBL_CELL_SPAN != cp->pos);
+
+       for (spans = 0, cp = cp->next; cp; cp = cp->next)
+               if (TBL_CELL_SPAN == cp->pos)
+                       spans++;
+               else
+                       break;
+       
+       dat->spans = spans;
 
        if (dp->last) {
                dp->last->next = dat;
@@ -44,59 +92,184 @@ data(struct tbl *tbl, struct tbl_span *dp,
                dp->last = dp->first = dat;
 
        sv = *pos;
-       while (p[*pos] && p[*pos] != tbl->tab)
+       while (p[*pos] && p[*pos] != tbl->opts.tab)
                (*pos)++;
 
-       dat->string = mandoc_malloc(*pos - sv + 1);
-       memcpy(dat->string, &p[sv], *pos - sv);
+       /*
+        * Check for a continued-data scope opening.  This consists of a
+        * trailing `T{' at the end of the line.  Subsequent lines,
+        * until a standalone `T}', are included in our cell.
+        */
+
+       if (*pos - sv == 2 && 'T' == p[sv] && '{' == p[sv + 1]) {
+               tbl->part = TBL_PART_CDATA;
+               return(1);
+       }
+
+       assert(*pos - sv >= 0);
+
+       dat->string = mandoc_malloc((size_t)(*pos - sv + 1));
+       memcpy(dat->string, &p[sv], (size_t)(*pos - sv));
        dat->string[*pos - sv] = '\0';
 
        if (p[*pos])
                (*pos)++;
 
-       /* XXX: do the strcmps, then malloc(). */
-
        if ( ! strcmp(dat->string, "_"))
-               dat->flags |= TBL_DATA_HORIZ;
+               dat->pos = TBL_DATA_HORIZ;
        else if ( ! strcmp(dat->string, "="))
-               dat->flags |= TBL_DATA_DHORIZ;
+               dat->pos = TBL_DATA_DHORIZ;
        else if ( ! strcmp(dat->string, "\\_"))
-               dat->flags |= TBL_DATA_NHORIZ;
+               dat->pos = TBL_DATA_NHORIZ;
        else if ( ! strcmp(dat->string, "\\="))
-               dat->flags |= TBL_DATA_NDHORIZ;
+               dat->pos = TBL_DATA_NDHORIZ;
+       else
+               dat->pos = TBL_DATA_DATA;
+
+       if (TBL_CELL_HORIZ == dat->layout->pos ||
+                       TBL_CELL_DHORIZ == dat->layout->pos ||
+                       TBL_CELL_DOWN == dat->layout->pos)
+               if (TBL_DATA_DATA == dat->pos && '\0' != *dat->string)
+                       mandoc_msg(MANDOCERR_TBLIGNDATA, 
+                                       tbl->parse, ln, sv, NULL);
+
+       return(1);
 }
 
+/* ARGSUSED */
 int
-tbl_data(struct tbl *tbl, int ln, const char *p)
+tbl_cdata(struct tbl_node *tbl, int ln, const char *p)
 {
-       struct tbl_span *dp;
+       struct tbl_dat  *dat;
+       size_t           sz;
        int              pos;
 
        pos = 0;
 
-       if ('\0' == p[pos]) {
-               TBL_MSG(tbl, MANDOCERR_TBL, ln, pos);
-               return(1);
+       dat = tbl->last_span->last;
+
+       if (p[pos] == 'T' && p[pos + 1] == '}') {
+               pos += 2;
+               if (p[pos] == tbl->opts.tab) {
+                       tbl->part = TBL_PART_DATA;
+                       pos++;
+                       return(getdata(tbl, tbl->last_span, ln, p, &pos));
+               } else if ('\0' == p[pos]) {
+                       tbl->part = TBL_PART_DATA;
+                       return(1);
+               }
+
+               /* Fallthrough: T} is part of a word. */
        }
 
+       dat->pos = TBL_DATA_DATA;
+
+       if (dat->string) {
+               sz = strlen(p) + strlen(dat->string) + 2;
+               dat->string = mandoc_realloc(dat->string, sz);
+               strlcat(dat->string, " ", sz);
+               strlcat(dat->string, p, sz);
+       } else
+               dat->string = mandoc_strdup(p);
+
+       if (TBL_CELL_DOWN == dat->layout->pos) 
+               mandoc_msg(MANDOCERR_TBLIGNDATA, 
+                               tbl->parse, ln, pos, NULL);
+
+       return(0);
+}
+
+static struct tbl_span *
+newspan(struct tbl_node *tbl, int line, struct tbl_row *rp)
+{
+       struct tbl_span *dp;
+
        dp = mandoc_calloc(1, sizeof(struct tbl_span));
+       dp->line = line;
+       dp->opts = &tbl->opts;
+       dp->layout = rp;
+       dp->head = tbl->first_head;
 
        if (tbl->last_span) {
                tbl->last_span->next = dp;
                tbl->last_span = dp;
-       } else
+       } else {
                tbl->last_span = tbl->first_span = dp;
+               tbl->current_span = NULL;
+               dp->flags |= TBL_SPAN_FIRST;
+       }
+
+       return(dp);
+}
+
+int
+tbl_data(struct tbl_node *tbl, int ln, const char *p)
+{
+       struct tbl_span *dp;
+       struct tbl_row  *rp;
+       int              pos;
+
+       pos = 0;
+
+       if ('\0' == p[pos]) {
+               mandoc_msg(MANDOCERR_TBL, tbl->parse, ln, pos, NULL);
+               return(0);
+       }
+
+       /* 
+        * Choose a layout row: take the one following the last parsed
+        * span's.  If that doesn't exist, use the last parsed span's.
+        * If there's no last parsed span, use the first row.  Lastly,
+        * if the last span was a horizontal line, use the same layout
+        * (it doesn't "consume" the layout).
+        */
+
+       if (tbl->last_span) {
+               assert(tbl->last_span->layout);
+               if (tbl->last_span->pos == TBL_SPAN_DATA) {
+                       for (rp = tbl->last_span->layout->next;
+                                       rp && rp->first; rp = rp->next) {
+                               switch (rp->first->pos) {
+                               case (TBL_CELL_HORIZ):
+                                       dp = newspan(tbl, ln, rp);
+                                       dp->pos = TBL_SPAN_HORIZ;
+                                       continue;
+                               case (TBL_CELL_DHORIZ):
+                                       dp = newspan(tbl, ln, rp);
+                                       dp->pos = TBL_SPAN_DHORIZ;
+                                       continue;
+                               default:
+                                       break;
+                               }
+                               break;
+                       }
+               } else
+                       rp = tbl->last_span->layout;
+
+               if (NULL == rp)
+                       rp = tbl->last_span->layout;
+       } else
+               rp = tbl->first_row;
+
+       assert(rp);
+
+       dp = newspan(tbl, ln, rp);
 
        if ( ! strcmp(p, "_")) {
-               dp->flags |= TBL_SPAN_HORIZ;
+               dp->pos = TBL_SPAN_HORIZ;
                return(1);
        } else if ( ! strcmp(p, "=")) {
-               dp->flags |= TBL_SPAN_DHORIZ;
+               dp->pos = TBL_SPAN_DHORIZ;
                return(1);
        }
 
+       dp->pos = TBL_SPAN_DATA;
+
+       /* This returns 0 when TBL_PART_CDATA is entered. */
+
        while ('\0' != p[pos])
-               data(tbl, dp, ln, p, &pos);
+               if ( ! getdata(tbl, dp, ln, p, &pos))
+                       return(0);
 
        return(1);
 }