2021-11-15 15:35:39 +00:00
|
|
|
/* $Id: tbl_data.c,v 1.59 2021/09/10 13:24:38 schwarze Exp $ */
|
2012-10-18 09:55:16 +00:00
|
|
|
/*
|
|
|
|
* Copyright (c) 2009, 2010, 2011 Kristaps Dzonsons <kristaps@bsd.lv>
|
2021-11-15 15:35:39 +00:00
|
|
|
* Copyright (c) 2011,2015,2017-2019,2021 Ingo Schwarze <schwarze@openbsd.org>
|
2012-10-18 09:55:16 +00:00
|
|
|
*
|
|
|
|
* Permission to use, copy, modify, and distribute this software for any
|
|
|
|
* purpose with or without fee is hereby granted, provided that the above
|
|
|
|
* copyright notice and this permission notice appear in all copies.
|
|
|
|
*
|
|
|
|
* THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
|
|
|
|
* WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
|
|
|
|
* MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
|
|
|
|
* ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
|
|
|
|
* WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
|
|
|
|
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
|
|
|
|
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
|
|
|
|
*/
|
|
|
|
#include "config.h"
|
2014-12-02 07:34:06 +00:00
|
|
|
|
|
|
|
#include <sys/types.h>
|
2012-10-18 09:55:16 +00:00
|
|
|
|
|
|
|
#include <assert.h>
|
|
|
|
#include <ctype.h>
|
2021-11-15 15:35:39 +00:00
|
|
|
#include <stdint.h>
|
2019-03-29 13:13:30 +00:00
|
|
|
#include <stdio.h>
|
2012-10-18 09:55:16 +00:00
|
|
|
#include <stdlib.h>
|
|
|
|
#include <string.h>
|
|
|
|
#include <time.h>
|
|
|
|
|
2014-11-22 18:08:25 +00:00
|
|
|
#include "mandoc_aux.h"
|
2019-03-29 13:13:30 +00:00
|
|
|
#include "mandoc.h"
|
|
|
|
#include "tbl.h"
|
2012-10-18 09:55:16 +00:00
|
|
|
#include "libmandoc.h"
|
2019-03-29 13:13:30 +00:00
|
|
|
#include "tbl_int.h"
|
2012-10-18 09:55:16 +00:00
|
|
|
|
2015-03-02 16:45:41 +00:00
|
|
|
/* Forward declarations of the file-local helpers defined below. */
static	void		 getdata(struct tbl_node *tbl, struct tbl_span *dp,
				int ln, const char *p, int *pos);
static	struct tbl_span	*newspan(struct tbl_node *tbl, int line,
				struct tbl_row *rp);
|
|
|
|
|
2014-11-22 18:08:25 +00:00
|
|
|
|
2015-03-02 16:45:41 +00:00
|
|
|
static void
|
2014-11-22 18:08:25 +00:00
|
|
|
getdata(struct tbl_node *tbl, struct tbl_span *dp,
|
2012-10-18 09:55:16 +00:00
|
|
|
int ln, const char *p, int *pos)
|
|
|
|
{
|
2019-03-29 13:13:30 +00:00
|
|
|
struct tbl_dat *dat, *pdat;
|
2012-10-18 09:55:16 +00:00
|
|
|
struct tbl_cell *cp;
|
2019-03-29 13:13:30 +00:00
|
|
|
struct tbl_span *pdp;
|
2021-11-15 15:35:39 +00:00
|
|
|
const char *ccp;
|
|
|
|
int startpos, endpos;
|
2012-10-18 09:55:16 +00:00
|
|
|
|
2019-03-29 13:13:30 +00:00
|
|
|
/*
|
|
|
|
* Determine the length of the string in the cell
|
|
|
|
* and advance the parse point to the end of the cell.
|
|
|
|
*/
|
|
|
|
|
2021-11-15 15:35:39 +00:00
|
|
|
startpos = *pos;
|
|
|
|
ccp = p + startpos;
|
|
|
|
while (*ccp != '\0' && *ccp != tbl->opts.tab)
|
|
|
|
if (*ccp++ == '\\')
|
|
|
|
mandoc_escape(&ccp, NULL, NULL);
|
|
|
|
*pos = ccp - p;
|
2019-03-29 13:13:30 +00:00
|
|
|
|
2015-03-02 16:45:41 +00:00
|
|
|
/* Advance to the next layout cell, skipping spanners. */
|
2012-10-18 09:55:16 +00:00
|
|
|
|
2015-03-02 16:45:41 +00:00
|
|
|
cp = dp->last == NULL ? dp->layout->first : dp->last->layout->next;
|
|
|
|
while (cp != NULL && cp->pos == TBL_CELL_SPAN)
|
2012-10-18 09:55:16 +00:00
|
|
|
cp = cp->next;
|
|
|
|
|
|
|
|
/*
|
2017-07-31 19:17:54 +00:00
|
|
|
* If the current layout row is out of cells, allocate
|
|
|
|
* a new cell if another row of the table has at least
|
|
|
|
* this number of columns, or discard the input if we
|
|
|
|
* are beyond the last column of the table as a whole.
|
2012-10-18 09:55:16 +00:00
|
|
|
*/
|
|
|
|
|
2015-03-02 16:45:41 +00:00
|
|
|
if (cp == NULL) {
|
2017-07-31 19:17:54 +00:00
|
|
|
if (dp->layout->last->col + 1 < dp->opts->cols) {
|
|
|
|
cp = mandoc_calloc(1, sizeof(*cp));
|
|
|
|
cp->pos = TBL_CELL_LEFT;
|
2021-11-15 15:35:39 +00:00
|
|
|
cp->font = ESCAPE_FONTROMAN;
|
|
|
|
cp->spacing = SIZE_MAX;
|
2017-07-31 19:17:54 +00:00
|
|
|
dp->layout->last->next = cp;
|
|
|
|
cp->col = dp->layout->last->col + 1;
|
|
|
|
dp->layout->last = cp;
|
|
|
|
} else {
|
2019-03-29 13:13:30 +00:00
|
|
|
mandoc_msg(MANDOCERR_TBLDATA_EXTRA,
|
2021-11-15 15:35:39 +00:00
|
|
|
ln, startpos, "%s", p + startpos);
|
2019-03-29 13:13:30 +00:00
|
|
|
while (p[*pos] != '\0')
|
2017-07-31 19:17:54 +00:00
|
|
|
(*pos)++;
|
|
|
|
return;
|
|
|
|
}
|
2012-10-18 09:55:16 +00:00
|
|
|
}
|
|
|
|
|
2019-03-29 13:13:30 +00:00
|
|
|
dat = mandoc_malloc(sizeof(*dat));
|
2012-10-18 09:55:16 +00:00
|
|
|
dat->layout = cp;
|
2019-03-29 13:13:30 +00:00
|
|
|
dat->next = NULL;
|
|
|
|
dat->string = NULL;
|
|
|
|
dat->hspans = 0;
|
|
|
|
dat->vspans = 0;
|
|
|
|
dat->block = 0;
|
2012-10-18 09:55:16 +00:00
|
|
|
dat->pos = TBL_DATA_NONE;
|
2019-03-29 13:13:30 +00:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Increment the number of vertical spans in a data cell above,
|
|
|
|
* if this cell vertically extends one or more cells above.
|
|
|
|
* The iteration must be done over data rows,
|
|
|
|
* not over layout rows, because one layout row
|
|
|
|
* can be reused for more than one data row.
|
|
|
|
*/
|
|
|
|
|
|
|
|
if (cp->pos == TBL_CELL_DOWN ||
|
2021-11-15 15:35:39 +00:00
|
|
|
(*pos - startpos == 2 &&
|
|
|
|
p[startpos] == '\\' && p[startpos + 1] == '^')) {
|
2019-03-29 13:13:30 +00:00
|
|
|
pdp = dp;
|
|
|
|
while ((pdp = pdp->prev) != NULL) {
|
|
|
|
pdat = pdp->first;
|
|
|
|
while (pdat != NULL &&
|
|
|
|
pdat->layout->col < dat->layout->col)
|
|
|
|
pdat = pdat->next;
|
|
|
|
if (pdat == NULL)
|
|
|
|
break;
|
|
|
|
if (pdat->layout->pos != TBL_CELL_DOWN &&
|
|
|
|
strcmp(pdat->string, "\\^") != 0) {
|
|
|
|
pdat->vspans++;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Count the number of horizontal spans to the right of this cell.
|
|
|
|
* This is purely a matter of the layout, independent of the data.
|
|
|
|
*/
|
|
|
|
|
2015-03-02 16:45:41 +00:00
|
|
|
for (cp = cp->next; cp != NULL; cp = cp->next)
|
|
|
|
if (cp->pos == TBL_CELL_SPAN)
|
2019-03-29 13:13:30 +00:00
|
|
|
dat->hspans++;
|
2012-10-18 09:55:16 +00:00
|
|
|
else
|
|
|
|
break;
|
2014-11-22 18:08:25 +00:00
|
|
|
|
2019-03-29 13:13:30 +00:00
|
|
|
/* Append the new data cell to the data row. */
|
|
|
|
|
2015-03-02 16:45:41 +00:00
|
|
|
if (dp->last == NULL)
|
|
|
|
dp->first = dat;
|
|
|
|
else
|
2012-10-18 09:55:16 +00:00
|
|
|
dp->last->next = dat;
|
2015-03-02 16:45:41 +00:00
|
|
|
dp->last = dat;
|
2012-10-18 09:55:16 +00:00
|
|
|
|
2021-11-15 15:35:39 +00:00
|
|
|
/* Strip leading and trailing spaces, if requested. */
|
|
|
|
|
|
|
|
endpos = *pos;
|
|
|
|
if (dp->opts->opts & TBL_OPT_NOSPACE) {
|
|
|
|
while (p[startpos] == ' ')
|
|
|
|
startpos++;
|
|
|
|
while (endpos > startpos && p[endpos - 1] == ' ')
|
|
|
|
endpos--;
|
|
|
|
}
|
|
|
|
|
2012-10-18 09:55:16 +00:00
|
|
|
/*
|
|
|
|
* Check for a continued-data scope opening. This consists of a
|
|
|
|
* trailing `T{' at the end of the line. Subsequent lines,
|
|
|
|
* until a standalone `T}', are included in our cell.
|
|
|
|
*/
|
|
|
|
|
2021-11-15 15:35:39 +00:00
|
|
|
if (endpos - startpos == 2 &&
|
|
|
|
p[startpos] == 'T' && p[startpos + 1] == '{') {
|
2012-10-18 09:55:16 +00:00
|
|
|
tbl->part = TBL_PART_CDATA;
|
2015-03-02 16:45:41 +00:00
|
|
|
return;
|
2012-10-18 09:55:16 +00:00
|
|
|
}
|
|
|
|
|
2021-11-15 15:35:39 +00:00
|
|
|
dat->string = mandoc_strndup(p + startpos, endpos - startpos);
|
2012-10-18 09:55:16 +00:00
|
|
|
|
2019-03-29 13:13:30 +00:00
|
|
|
if (p[*pos] != '\0')
|
2012-10-18 09:55:16 +00:00
|
|
|
(*pos)++;
|
|
|
|
|
|
|
|
if ( ! strcmp(dat->string, "_"))
|
|
|
|
dat->pos = TBL_DATA_HORIZ;
|
|
|
|
else if ( ! strcmp(dat->string, "="))
|
|
|
|
dat->pos = TBL_DATA_DHORIZ;
|
|
|
|
else if ( ! strcmp(dat->string, "\\_"))
|
|
|
|
dat->pos = TBL_DATA_NHORIZ;
|
|
|
|
else if ( ! strcmp(dat->string, "\\="))
|
|
|
|
dat->pos = TBL_DATA_NDHORIZ;
|
|
|
|
else
|
|
|
|
dat->pos = TBL_DATA_DATA;
|
|
|
|
|
2015-03-02 16:45:41 +00:00
|
|
|
if ((dat->layout->pos == TBL_CELL_HORIZ ||
|
|
|
|
dat->layout->pos == TBL_CELL_DHORIZ ||
|
|
|
|
dat->layout->pos == TBL_CELL_DOWN) &&
|
|
|
|
dat->pos == TBL_DATA_DATA && *dat->string != '\0')
|
|
|
|
mandoc_msg(MANDOCERR_TBLDATA_SPAN,
|
2021-11-15 15:35:39 +00:00
|
|
|
ln, startpos, "%s", dat->string);
|
2012-10-18 09:55:16 +00:00
|
|
|
}
|
|
|
|
|
2017-07-31 19:17:54 +00:00
|
|
|
void
|
2015-03-02 16:45:41 +00:00
|
|
|
tbl_cdata(struct tbl_node *tbl, int ln, const char *p, int pos)
|
2012-10-18 09:55:16 +00:00
|
|
|
{
|
|
|
|
struct tbl_dat *dat;
|
2014-11-22 18:08:25 +00:00
|
|
|
size_t sz;
|
2012-10-18 09:55:16 +00:00
|
|
|
|
|
|
|
dat = tbl->last_span->last;
|
|
|
|
|
|
|
|
if (p[pos] == 'T' && p[pos + 1] == '}') {
|
|
|
|
pos += 2;
|
2021-11-15 15:35:39 +00:00
|
|
|
if (tbl->opts.opts & TBL_OPT_NOSPACE)
|
|
|
|
while (p[pos] == ' ')
|
|
|
|
pos++;
|
2012-10-18 09:55:16 +00:00
|
|
|
if (p[pos] == tbl->opts.tab) {
|
|
|
|
tbl->part = TBL_PART_DATA;
|
|
|
|
pos++;
|
2016-01-15 23:08:59 +00:00
|
|
|
while (p[pos] != '\0')
|
|
|
|
getdata(tbl, tbl->last_span, ln, p, &pos);
|
2017-07-31 19:17:54 +00:00
|
|
|
return;
|
2015-03-02 16:45:41 +00:00
|
|
|
} else if (p[pos] == '\0') {
|
2012-10-18 09:55:16 +00:00
|
|
|
tbl->part = TBL_PART_DATA;
|
2017-07-31 19:17:54 +00:00
|
|
|
return;
|
2012-10-18 09:55:16 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/* Fallthrough: T} is part of a word. */
|
|
|
|
}
|
|
|
|
|
|
|
|
dat->pos = TBL_DATA_DATA;
|
2017-06-08 19:29:07 +00:00
|
|
|
dat->block = 1;
|
2012-10-18 09:55:16 +00:00
|
|
|
|
2015-03-02 16:45:41 +00:00
|
|
|
if (dat->string != NULL) {
|
|
|
|
sz = strlen(p + pos) + strlen(dat->string) + 2;
|
2012-10-18 09:55:16 +00:00
|
|
|
dat->string = mandoc_realloc(dat->string, sz);
|
2014-11-22 18:08:25 +00:00
|
|
|
(void)strlcat(dat->string, " ", sz);
|
2015-03-02 16:45:41 +00:00
|
|
|
(void)strlcat(dat->string, p + pos, sz);
|
2012-10-18 09:55:16 +00:00
|
|
|
} else
|
2015-03-02 16:45:41 +00:00
|
|
|
dat->string = mandoc_strdup(p + pos);
|
2012-10-18 09:55:16 +00:00
|
|
|
|
2015-03-02 16:45:41 +00:00
|
|
|
if (dat->layout->pos == TBL_CELL_DOWN)
|
2019-03-29 13:13:30 +00:00
|
|
|
mandoc_msg(MANDOCERR_TBLDATA_SPAN,
|
|
|
|
ln, pos, "%s", dat->string);
|
2012-10-18 09:55:16 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static struct tbl_span *
|
|
|
|
newspan(struct tbl_node *tbl, int line, struct tbl_row *rp)
|
|
|
|
{
|
|
|
|
struct tbl_span *dp;
|
|
|
|
|
2015-03-02 16:45:41 +00:00
|
|
|
dp = mandoc_calloc(1, sizeof(*dp));
|
2012-10-18 09:55:16 +00:00
|
|
|
dp->line = line;
|
2014-01-31 19:59:03 +00:00
|
|
|
dp->opts = &tbl->opts;
|
2012-10-18 09:55:16 +00:00
|
|
|
dp->layout = rp;
|
2015-03-02 16:45:41 +00:00
|
|
|
dp->prev = tbl->last_span;
|
2012-10-18 09:55:16 +00:00
|
|
|
|
2015-03-02 16:45:41 +00:00
|
|
|
if (dp->prev == NULL) {
|
|
|
|
tbl->first_span = dp;
|
2012-10-18 09:55:16 +00:00
|
|
|
tbl->current_span = NULL;
|
2015-03-02 16:45:41 +00:00
|
|
|
} else
|
|
|
|
dp->prev->next = dp;
|
|
|
|
tbl->last_span = dp;
|
2012-10-18 09:55:16 +00:00
|
|
|
|
2016-01-15 23:08:59 +00:00
|
|
|
return dp;
|
2012-10-18 09:55:16 +00:00
|
|
|
}
|
|
|
|
|
2015-03-02 16:45:41 +00:00
|
|
|
void
|
|
|
|
tbl_data(struct tbl_node *tbl, int ln, const char *p, int pos)
|
2012-10-18 09:55:16 +00:00
|
|
|
{
|
|
|
|
struct tbl_row *rp;
|
2017-07-31 19:17:54 +00:00
|
|
|
struct tbl_cell *cp;
|
|
|
|
struct tbl_span *sp;
|
2012-10-18 09:55:16 +00:00
|
|
|
|
2021-11-15 15:35:39 +00:00
|
|
|
for (sp = tbl->last_span; sp != NULL; sp = sp->prev)
|
|
|
|
if (sp->pos == TBL_SPAN_DATA)
|
|
|
|
break;
|
|
|
|
rp = sp == NULL ? tbl->first_row :
|
|
|
|
sp->layout->next == NULL ? sp->layout : sp->layout->next;
|
2017-07-31 19:17:54 +00:00
|
|
|
assert(rp != NULL);
|
2012-10-18 09:55:16 +00:00
|
|
|
|
2019-03-29 13:13:30 +00:00
|
|
|
if (p[1] == '\0') {
|
|
|
|
switch (p[0]) {
|
|
|
|
case '.':
|
|
|
|
/*
|
|
|
|
* Empty request lines must be handled here
|
|
|
|
* and cannot be discarded in roff_parseln()
|
|
|
|
* because in the layout section, they
|
|
|
|
* are significant and end the layout.
|
|
|
|
*/
|
|
|
|
return;
|
|
|
|
case '_':
|
|
|
|
sp = newspan(tbl, ln, rp);
|
|
|
|
sp->pos = TBL_SPAN_HORIZ;
|
|
|
|
return;
|
|
|
|
case '=':
|
|
|
|
sp = newspan(tbl, ln, rp);
|
|
|
|
sp->pos = TBL_SPAN_DHORIZ;
|
|
|
|
return;
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
}
|
2012-10-18 09:55:16 +00:00
|
|
|
}
|
|
|
|
|
2017-07-31 19:17:54 +00:00
|
|
|
/*
|
|
|
|
* If the layout row contains nothing but horizontal lines,
|
|
|
|
* allocate an empty span for it and assign the current span
|
|
|
|
* to the next layout row accepting data.
|
|
|
|
*/
|
|
|
|
|
|
|
|
while (rp->next != NULL) {
|
|
|
|
if (rp->last->col + 1 < tbl->opts.cols)
|
|
|
|
break;
|
|
|
|
for (cp = rp->first; cp != NULL; cp = cp->next)
|
|
|
|
if (cp->pos != TBL_CELL_HORIZ &&
|
|
|
|
cp->pos != TBL_CELL_DHORIZ)
|
|
|
|
break;
|
|
|
|
if (cp != NULL)
|
|
|
|
break;
|
|
|
|
sp = newspan(tbl, ln, rp);
|
|
|
|
sp->pos = TBL_SPAN_DATA;
|
|
|
|
rp = rp->next;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Process a real data row. */
|
2012-10-18 09:55:16 +00:00
|
|
|
|
2017-07-31 19:17:54 +00:00
|
|
|
sp = newspan(tbl, ln, rp);
|
|
|
|
sp->pos = TBL_SPAN_DATA;
|
2015-03-02 16:45:41 +00:00
|
|
|
while (p[pos] != '\0')
|
2017-07-31 19:17:54 +00:00
|
|
|
getdata(tbl, sp, ln, p, &pos);
|
2012-10-18 09:55:16 +00:00
|
|
|
}
|