version 1.4, 2011/01/01 21:23:01 |
version 1.47, 2018/12/14 01:18:26 |
|
|
/* $Id$ */ |
/* $Id$ */ |
/* |
/* |
* Copyright (c) 2009, 2010 Kristaps Dzonsons <kristaps@bsd.lv> |
* Copyright (c) 2009, 2010, 2011 Kristaps Dzonsons <kristaps@bsd.lv> |
|
* Copyright (c) 2012, 2014, 2015, 2017 Ingo Schwarze <schwarze@openbsd.org> |
* |
* |
* Permission to use, copy, modify, and distribute this software for any |
* Permission to use, copy, modify, and distribute this software for any |
* purpose with or without fee is hereby granted, provided that the above |
* purpose with or without fee is hereby granted, provided that the above |
|
|
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF |
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF |
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
*/ |
*/ |
#include <assert.h> |
#include "config.h" |
|
|
|
#include <sys/types.h> |
|
|
#include <ctype.h> |
#include <ctype.h> |
|
#include <stdint.h> |
|
#include <stdio.h> |
#include <stdlib.h> |
#include <stdlib.h> |
#include <string.h> |
#include <string.h> |
#include <time.h> |
#include <time.h> |
|
|
|
#include "mandoc_aux.h" |
#include "mandoc.h" |
#include "mandoc.h" |
|
#include "tbl.h" |
#include "libmandoc.h" |
#include "libmandoc.h" |
#include "libroff.h" |
#include "tbl_int.h" |
|
|
struct tbl_phrase { |
struct tbl_phrase { |
char name; |
char name; |
enum tbl_cellt key; |
enum tbl_cellt key; |
}; |
}; |
|
|
#define KEYS_MAX 11 |
static const struct tbl_phrase keys[] = { |
|
|
static const struct tbl_phrase keys[KEYS_MAX] = { |
|
{ 'c', TBL_CELL_CENTRE }, |
{ 'c', TBL_CELL_CENTRE }, |
{ 'r', TBL_CELL_RIGHT }, |
{ 'r', TBL_CELL_RIGHT }, |
{ 'l', TBL_CELL_LEFT }, |
{ 'l', TBL_CELL_LEFT }, |
Line 41 static const struct tbl_phrase keys[KEYS_MAX] = { |
|
Line 47 static const struct tbl_phrase keys[KEYS_MAX] = { |
|
{ '^', TBL_CELL_DOWN }, |
{ '^', TBL_CELL_DOWN }, |
{ '-', TBL_CELL_HORIZ }, |
{ '-', TBL_CELL_HORIZ }, |
{ '_', TBL_CELL_HORIZ }, |
{ '_', TBL_CELL_HORIZ }, |
{ '=', TBL_CELL_DHORIZ }, |
{ '=', TBL_CELL_DHORIZ } |
{ '|', TBL_CELL_VERT } |
|
}; |
}; |
|
|
static int mods(struct tbl *, struct tbl_cell *, |
#define KEYS_MAX ((int)(sizeof(keys)/sizeof(keys[0]))) |
int, const char *, int *); |
|
static int cell(struct tbl *, struct tbl_row *, |
|
int, const char *, int *); |
|
static void row(struct tbl *, int, const char *, int *); |
|
|
|
static int |
static void mods(struct tbl_node *, struct tbl_cell *, |
mods(struct tbl *tbl, struct tbl_cell *cp, |
int, const char *, int *); |
|
static void cell(struct tbl_node *, struct tbl_row *, |
|
int, const char *, int *); |
|
static struct tbl_cell *cell_alloc(struct tbl_node *, struct tbl_row *, |
|
enum tbl_cellt); |
|
|
|
|
|
static void |
|
mods(struct tbl_node *tbl, struct tbl_cell *cp, |
int ln, const char *p, int *pos) |
int ln, const char *p, int *pos) |
{ |
{ |
char buf[5]; |
char *endptr; |
int i; |
size_t sz; |
|
|
mod: |
mod: |
/* |
while (p[*pos] == ' ' || p[*pos] == '\t') |
* XXX: since, at least for now, modifiers are non-conflicting |
(*pos)++; |
* (are separable by value, regardless of position), we let |
|
* modifiers come in any order. The existing tbl doesn't let |
|
* this happen. |
|
*/ |
|
switch (p[*pos]) { |
|
case ('\0'): |
|
/* FALLTHROUGH */ |
|
case (' '): |
|
/* FALLTHROUGH */ |
|
case ('\t'): |
|
/* FALLTHROUGH */ |
|
case (','): |
|
/* FALLTHROUGH */ |
|
case ('.'): |
|
return(1); |
|
default: |
|
break; |
|
} |
|
|
|
/* Parse numerical spacing from modifier string. */ |
/* Row delimiters and cell specifiers end modifier lists. */ |
|
|
if (isdigit((unsigned char)p[*pos])) { |
if (strchr(".,-=^_ACLNRSaclnrs", p[*pos]) != NULL) |
for (i = 0; i < 4; i++) { |
return; |
if ( ! isdigit((unsigned char)p[*pos + i])) |
|
break; |
|
buf[i] = p[*pos + i]; |
|
} |
|
buf[i] = '\0'; |
|
|
|
/* No greater than 4 digits. */ |
/* Throw away parenthesised expression. */ |
|
|
if (4 == i) { |
if ('(' == p[*pos]) { |
TBL_MSG(tbl, MANDOCERR_TBLLAYOUT, ln, *pos); |
(*pos)++; |
return(0); |
while (p[*pos] && ')' != p[*pos]) |
|
(*pos)++; |
|
if (')' == p[*pos]) { |
|
(*pos)++; |
|
goto mod; |
} |
} |
|
mandoc_msg(MANDOCERR_TBLLAYOUT_PAR, tbl->parse, |
|
ln, *pos, NULL); |
|
return; |
|
} |
|
|
*pos += i; |
/* Parse numerical spacing from modifier string. */ |
cp->spacing = atoi(buf); |
|
|
|
|
if (isdigit((unsigned char)p[*pos])) { |
|
cp->spacing = strtoull(p + *pos, &endptr, 10); |
|
*pos = endptr - p; |
goto mod; |
goto mod; |
/* NOTREACHED */ |
} |
} |
|
|
|
/* TODO: GNU has many more extensions. */ |
switch (tolower((unsigned char)p[(*pos)++])) { |
|
case 'b': |
switch (tolower(p[(*pos)++])) { |
cp->flags |= TBL_CELL_BOLD; |
case ('z'): |
|
cp->flags |= TBL_CELL_WIGN; |
|
goto mod; |
goto mod; |
case ('u'): |
case 'd': |
cp->flags |= TBL_CELL_UP; |
cp->flags |= TBL_CELL_BALIGN; |
goto mod; |
goto mod; |
case ('e'): |
case 'e': |
cp->flags |= TBL_CELL_EQUAL; |
cp->flags |= TBL_CELL_EQUAL; |
goto mod; |
goto mod; |
case ('t'): |
case 'f': |
|
break; |
|
case 'i': |
|
cp->flags |= TBL_CELL_ITALIC; |
|
goto mod; |
|
case 'm': |
|
mandoc_msg(MANDOCERR_TBLLAYOUT_MOD, tbl->parse, |
|
ln, *pos, "m"); |
|
goto mod; |
|
case 'p': |
|
case 'v': |
|
if (p[*pos] == '-' || p[*pos] == '+') |
|
(*pos)++; |
|
while (isdigit((unsigned char)p[*pos])) |
|
(*pos)++; |
|
goto mod; |
|
case 't': |
cp->flags |= TBL_CELL_TALIGN; |
cp->flags |= TBL_CELL_TALIGN; |
goto mod; |
goto mod; |
case ('d'): |
case 'u': |
cp->flags |= TBL_CELL_BALIGN; |
cp->flags |= TBL_CELL_UP; |
goto mod; |
goto mod; |
case ('f'): |
case 'w': |
break; |
sz = 0; |
case ('b'): |
if (p[*pos] == '(') { |
/* FALLTHROUGH */ |
(*pos)++; |
case ('i'): |
while (p[*pos + sz] != '\0' && p[*pos + sz] != ')') |
(*pos)--; |
sz++; |
break; |
} else |
|
while (isdigit((unsigned char)p[*pos + sz])) |
|
sz++; |
|
if (sz) { |
|
free(cp->wstr); |
|
cp->wstr = mandoc_strndup(p + *pos, sz); |
|
*pos += sz; |
|
if (p[*pos] == ')') |
|
(*pos)++; |
|
} |
|
goto mod; |
|
case 'x': |
|
cp->flags |= TBL_CELL_WMAX; |
|
goto mod; |
|
case 'z': |
|
cp->flags |= TBL_CELL_WIGN; |
|
goto mod; |
|
case '|': |
|
if (cp->vert < 2) |
|
cp->vert++; |
|
else |
|
mandoc_msg(MANDOCERR_TBLLAYOUT_VERT, |
|
tbl->parse, ln, *pos - 1, NULL); |
|
goto mod; |
default: |
default: |
TBL_MSG(tbl, MANDOCERR_TBLLAYOUT, ln, *pos - 1); |
mandoc_vmsg(MANDOCERR_TBLLAYOUT_CHAR, tbl->parse, |
return(0); |
ln, *pos - 1, "%c", p[*pos - 1]); |
|
goto mod; |
} |
} |
|
|
switch (tolower(p[(*pos)++])) { |
/* Ignore parenthesised font names for now. */ |
case ('b'): |
|
|
if (p[*pos] == '(') |
|
goto mod; |
|
|
|
/* Support only one-character font-names for now. */ |
|
|
|
if (p[*pos] == '\0' || (p[*pos + 1] != ' ' && p[*pos + 1] != '.')) { |
|
mandoc_vmsg(MANDOCERR_FT_BAD, tbl->parse, |
|
ln, *pos, "TS %s", p + *pos - 1); |
|
if (p[*pos] != '\0') |
|
(*pos)++; |
|
if (p[*pos] != '\0') |
|
(*pos)++; |
|
goto mod; |
|
} |
|
|
|
switch (p[(*pos)++]) { |
|
case '3': |
|
case 'B': |
cp->flags |= TBL_CELL_BOLD; |
cp->flags |= TBL_CELL_BOLD; |
goto mod; |
goto mod; |
case ('i'): |
case '2': |
|
case 'I': |
cp->flags |= TBL_CELL_ITALIC; |
cp->flags |= TBL_CELL_ITALIC; |
goto mod; |
goto mod; |
|
case '1': |
|
case 'R': |
|
goto mod; |
default: |
default: |
break; |
mandoc_vmsg(MANDOCERR_FT_BAD, tbl->parse, |
|
ln, *pos - 1, "TS f%c", p[*pos - 1]); |
|
goto mod; |
} |
} |
|
|
TBL_MSG(tbl, MANDOCERR_TBLLAYOUT, ln, *pos - 1); |
|
return(0); |
|
} |
} |
|
|
static int |
static void |
cell(struct tbl *tbl, struct tbl_row *rp, |
cell(struct tbl_node *tbl, struct tbl_row *rp, |
int ln, const char *p, int *pos) |
int ln, const char *p, int *pos) |
{ |
{ |
struct tbl_cell *cp; |
|
int i; |
int i; |
enum tbl_cellt c; |
enum tbl_cellt c; |
|
|
/* Parse the column position (`r', `R', `|', ...). */ |
/* Handle leading vertical lines */ |
|
|
|
while (p[*pos] == ' ' || p[*pos] == '\t' || p[*pos] == '|') { |
|
if (p[*pos] == '|') { |
|
if (rp->vert < 2) |
|
rp->vert++; |
|
else |
|
mandoc_msg(MANDOCERR_TBLLAYOUT_VERT, |
|
tbl->parse, ln, *pos, NULL); |
|
} |
|
(*pos)++; |
|
} |
|
|
|
again: |
|
while (p[*pos] == ' ' || p[*pos] == '\t') |
|
(*pos)++; |
|
|
|
if (p[*pos] == '.' || p[*pos] == '\0') |
|
return; |
|
|
|
/* Parse the column position (`c', `l', `r', ...). */ |
|
|
for (i = 0; i < KEYS_MAX; i++) |
for (i = 0; i < KEYS_MAX; i++) |
if (tolower(p[*pos]) == keys[i].name) |
if (tolower((unsigned char)p[*pos]) == keys[i].name) |
break; |
break; |
|
|
if (KEYS_MAX == i) { |
if (i == KEYS_MAX) { |
TBL_MSG(tbl, MANDOCERR_TBLLAYOUT, ln, *pos); |
mandoc_vmsg(MANDOCERR_TBLLAYOUT_CHAR, tbl->parse, |
return(0); |
ln, *pos, "%c", p[*pos]); |
|
(*pos)++; |
|
goto again; |
} |
} |
|
|
(*pos)++; |
|
c = keys[i].key; |
c = keys[i].key; |
|
|
/* Extra check for the double-vertical. */ |
/* Special cases of spanners. */ |
|
|
if (TBL_CELL_VERT == c && '|' == p[*pos]) { |
if (c == TBL_CELL_SPAN) { |
(*pos)++; |
if (rp->last == NULL) |
c = TBL_CELL_DVERT; |
mandoc_msg(MANDOCERR_TBLLAYOUT_SPAN, |
} |
tbl->parse, ln, *pos, NULL); |
|
else if (rp->last->pos == TBL_CELL_HORIZ || |
/* Disallow adjacent spacers. */ |
rp->last->pos == TBL_CELL_DHORIZ) |
|
c = rp->last->pos; |
|
} else if (c == TBL_CELL_DOWN && rp == tbl->first_row) |
|
mandoc_msg(MANDOCERR_TBLLAYOUT_DOWN, |
|
tbl->parse, ln, *pos, NULL); |
|
|
if (rp->last && (TBL_CELL_VERT == c || TBL_CELL_DVERT == c) && |
(*pos)++; |
(TBL_CELL_VERT == rp->last->pos || |
|
TBL_CELL_DVERT == rp->last->pos)) { |
|
TBL_MSG(tbl, MANDOCERR_TBLLAYOUT, ln, *pos - 1); |
|
return(0); |
|
} |
|
|
|
/* Allocate cell then parse its modifiers. */ |
/* Allocate cell then parse its modifiers. */ |
|
|
cp = mandoc_calloc(1, sizeof(struct tbl_cell)); |
mods(tbl, cell_alloc(tbl, rp, c), ln, p, pos); |
cp->pos = c; |
|
|
|
if (rp->last) { |
|
rp->last->next = cp; |
|
rp->last = cp; |
|
} else |
|
rp->last = rp->first = cp; |
|
|
|
return(mods(tbl, cp, ln, p, pos)); |
|
} |
} |
|
|
|
void |
static void |
tbl_layout(struct tbl_node *tbl, int ln, const char *p, int pos) |
row(struct tbl *tbl, int ln, const char *p, int *pos) |
|
{ |
{ |
struct tbl_row *rp; |
struct tbl_row *rp; |
|
|
row: /* |
rp = NULL; |
* EBNF describing this section: |
for (;;) { |
* |
/* Skip whitespace before and after each cell. */ |
* row ::= row_list [:space:]* [.]?[\n] |
|
* row_list ::= [:space:]* row_elem row_tail |
|
* row_tail ::= [:space:]*[,] row_list | |
|
* epsilon |
|
* row_elem ::= [\t\ ]*[:alpha:]+ |
|
*/ |
|
|
|
rp = mandoc_calloc(1, sizeof(struct tbl_row)); |
while (p[pos] == ' ' || p[pos] == '\t') |
if (tbl->last_row) { |
pos++; |
tbl->last_row->next = rp; |
|
tbl->last_row = rp; |
|
} else |
|
tbl->last_row = tbl->first_row = rp; |
|
|
|
cell: |
switch (p[pos]) { |
while (isspace((unsigned char)p[*pos])) |
case ',': /* Next row on this input line. */ |
(*pos)++; |
pos++; |
|
rp = NULL; |
|
continue; |
|
case '\0': /* Next row on next input line. */ |
|
return; |
|
case '.': /* End of layout. */ |
|
pos++; |
|
tbl->part = TBL_PART_DATA; |
|
|
/* Safely exit layout context. */ |
/* |
|
* When the layout is completely empty, |
|
* default to one left-justified column. |
|
*/ |
|
|
if ('.' == p[*pos]) { |
if (tbl->first_row == NULL) { |
tbl->part = TBL_PART_DATA; |
tbl->first_row = tbl->last_row = |
if (NULL == tbl->first_row) |
mandoc_calloc(1, sizeof(*rp)); |
TBL_MSG(tbl, MANDOCERR_TBLNOLAYOUT, ln, *pos); |
} |
(*pos)++; |
if (tbl->first_row->first == NULL) { |
return; |
mandoc_msg(MANDOCERR_TBLLAYOUT_NONE, |
} |
tbl->parse, ln, pos, NULL); |
|
cell_alloc(tbl, tbl->first_row, |
|
TBL_CELL_LEFT); |
|
if (tbl->opts.lvert < tbl->first_row->vert) |
|
tbl->opts.lvert = tbl->first_row->vert; |
|
return; |
|
} |
|
|
/* End (and possibly restart) a row. */ |
/* |
|
* Search for the widest line |
|
* along the left and right margins. |
|
*/ |
|
|
if (',' == p[*pos]) { |
for (rp = tbl->first_row; rp; rp = rp->next) { |
(*pos)++; |
if (tbl->opts.lvert < rp->vert) |
goto row; |
tbl->opts.lvert = rp->vert; |
} else if ('\0' == p[*pos]) |
if (rp->last != NULL && |
return; |
rp->last->col + 1 == tbl->opts.cols && |
|
tbl->opts.rvert < rp->last->vert) |
|
tbl->opts.rvert = rp->last->vert; |
|
|
if ( ! cell(tbl, rp, ln, p, pos)) |
/* If the last line is empty, drop it. */ |
return; |
|
|
|
goto cell; |
if (rp->next != NULL && |
/* NOTREACHED */ |
rp->next->first == NULL) { |
} |
free(rp->next); |
|
rp->next = NULL; |
|
tbl->last_row = rp; |
|
} |
|
} |
|
return; |
|
default: /* Cell. */ |
|
break; |
|
} |
|
|
|
/* |
|
* If the last line had at least one cell, |
|
* start a new one; otherwise, continue it. |
|
*/ |
|
|
int |
if (rp == NULL) { |
tbl_layout(struct tbl *tbl, int ln, const char *p) |
if (tbl->last_row == NULL || |
|
tbl->last_row->first != NULL) { |
|
rp = mandoc_calloc(1, sizeof(*rp)); |
|
if (tbl->last_row) |
|
tbl->last_row->next = rp; |
|
else |
|
tbl->first_row = rp; |
|
tbl->last_row = rp; |
|
} else |
|
rp = tbl->last_row; |
|
} |
|
cell(tbl, rp, ln, p, &pos); |
|
} |
|
} |
|
|
|
static struct tbl_cell * |
|
cell_alloc(struct tbl_node *tbl, struct tbl_row *rp, enum tbl_cellt pos) |
{ |
{ |
int pos; |
struct tbl_cell *p, *pp; |
|
|
pos = 0; |
p = mandoc_calloc(1, sizeof(*p)); |
row(tbl, ln, p, &pos); |
p->spacing = SIZE_MAX; |
|
p->pos = pos; |
|
|
/* Always succeed. */ |
if ((pp = rp->last) != NULL) { |
return(1); |
pp->next = p; |
|
p->col = pp->col + 1; |
|
} else |
|
rp->first = p; |
|
rp->last = p; |
|
|
|
if (tbl->opts.cols <= p->col) |
|
tbl->opts.cols = p->col + 1; |
|
|
|
return p; |
} |
} |