version 1.18, 2009/04/12 19:45:26 |
version 1.42, 2009/10/24 05:45:04 |
|
|
/* $Id$ */ |
/* $Id$ */ |
/* |
/* |
* Copyright (c) 2008, 2009 Kristaps Dzonsons <kristaps@openbsd.org> |
* Copyright (c) 2008, 2009 Kristaps Dzonsons <kristaps@kth.se> |
* |
* |
* Permission to use, copy, modify, and distribute this software for any |
* Permission to use, copy, modify, and distribute this software for any |
* purpose with or without fee is hereby granted, provided that the above |
* purpose with or without fee is hereby granted, provided that the above |
|
|
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF |
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF |
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
*/ |
*/ |
|
#include <sys/types.h> |
|
|
#include <assert.h> |
#include <assert.h> |
#include <ctype.h> |
#include <ctype.h> |
#include <stdarg.h> |
#include <stdarg.h> |
|
|
|
|
#include "libman.h" |
#include "libman.h" |
|
|
|
/*
 * Human-readable text for each parser diagnostic.  man_err() indexes
 * this table directly with the numeric value of the diagnostic code, so
 * the entry order must follow the declaration order of the codes; the
 * tag in front of each string names the code that slot is meant for
 * (NOTE(review): confirm against the enum declaration in libman.h).
 */
const char *const __man_merrnames[WERRMAX] = {
	/* WNPRINT */		"invalid character",
	/* WNMEM */		"system: malloc error",
	/* WMSEC */		"invalid manual section",
	/* WDATE */		"invalid date format",
	/* WLNSCOPE */		"scope of prior line violated",
	/* WTSPACE */		"trailing whitespace",
	/* WTQUOTE */		"unterminated quoted parameter",
	/* WNODATA */		"document has no body",
	/* WNOTITLE */		"document has no title/section",
	/* WESCAPE */		"invalid escape sequence",
	/* WNUMFMT */		"invalid number format",
	/* WHEADARGS */		"expected block head arguments",
	/* WBODYARGS */		"expected block body arguments",
	/* WNHEADARGS */	"expected empty block head",
	/* WMACRO */		"unknown macro",
	/* WMACROFORM */	"ill-formed macro",
	/* WEXITSCOPE */	"scope open on exit",
	/* WNOSCOPE */		"no scope context",
	/* WOLITERAL */		"literal context already open",
	/* WNLITERAL */		"no literal context open"
};
|
|
const char *const __man_macronames[MAN_MAX] = { |
const char *const __man_macronames[MAN_MAX] = { |
"\\\"", "TH", "SH", "SS", |
"br", "TH", "SH", "SS", |
"TP", "LP", "PP", "P", |
"TP", "LP", "PP", "P", |
"IP", "HP", "SM", "SB", |
"IP", "HP", "SM", "SB", |
"BI", "IB", "BR", "RB", |
"BI", "IB", "BR", "RB", |
"R", "B", "I", "IR", |
"R", "B", "I", "IR", |
"RI", "br", "na", "i" |
"RI", "na", "i", "sp", |
|
"nf", "fi", "r", "RE", |
|
"RS", "DT", "UC", "PD" |
}; |
}; |
|
|
const char * const *man_macronames = __man_macronames; |
const char * const *man_macronames = __man_macronames; |
Line 42 static int man_ptext(struct man *, int, char *); |
|
Line 69 static int man_ptext(struct man *, int, char *); |
|
static int man_pmacro(struct man *, int, char *); |
static int man_pmacro(struct man *, int, char *); |
static void man_free1(struct man *); |
static void man_free1(struct man *); |
static int man_alloc1(struct man *); |
static int man_alloc1(struct man *); |
|
static int pstring(struct man *, int, int, |
|
const char *, size_t); |
|
|
|
#ifdef __linux__ |
|
extern size_t strlcpy(char *, const char *, size_t); |
|
#endif |
|
|
|
|
const struct man_node * |
const struct man_node * |
man_node(const struct man *m) |
man_node(const struct man *m) |
{ |
{ |
Line 74 man_free(struct man *man) |
|
Line 107 man_free(struct man *man) |
|
{ |
{ |
|
|
man_free1(man); |
man_free1(man); |
|
|
if (man->htab) |
|
man_hash_free(man->htab); |
|
free(man); |
free(man); |
} |
} |
|
|
Line 94 man_alloc(void *data, int pflags, const struct man_cb |
|
Line 124 man_alloc(void *data, int pflags, const struct man_cb |
|
return(NULL); |
return(NULL); |
} |
} |
|
|
|
man_hash_init(); |
|
|
p->data = data; |
p->data = data; |
p->pflags = pflags; |
p->pflags = pflags; |
(void)memcpy(&p->cb, cb, sizeof(struct man_cb)); |
(void)memcpy(&p->cb, cb, sizeof(struct man_cb)); |
|
|
if (NULL == (p->htab = man_hash_alloc())) { |
|
free(p); |
|
return(NULL); |
|
} |
|
return(p); |
return(p); |
} |
} |
|
|
Line 182 man_node_append(struct man *man, struct man_node *p) |
|
Line 209 man_node_append(struct man *man, struct man_node *p) |
|
abort(); |
abort(); |
/* NOTREACHED */ |
/* NOTREACHED */ |
} |
} |
|
|
|
p->parent->nchild++; |
|
|
|
if ( ! man_valid_pre(man, p)) |
|
return(0); |
|
|
|
switch (p->type) { |
|
case (MAN_HEAD): |
|
assert(MAN_BLOCK == p->parent->type); |
|
p->parent->head = p; |
|
break; |
|
case (MAN_BODY): |
|
assert(MAN_BLOCK == p->parent->type); |
|
p->parent->body = p; |
|
break; |
|
default: |
|
break; |
|
} |
|
|
man->last = p; |
man->last = p; |
|
|
switch (p->type) { |
switch (p->type) { |
Line 218 man_node_alloc(int line, int pos, enum man_type type, |
|
Line 263 man_node_alloc(int line, int pos, enum man_type type, |
|
|
|
|
|
int |
int |
man_elem_alloc(struct man *man, int line, int pos, int tok) |
man_elem_alloc(struct man *m, int line, int pos, int tok) |
{ |
{ |
struct man_node *p; |
struct man_node *p; |
|
|
p = man_node_alloc(line, pos, MAN_ELEM, tok); |
p = man_node_alloc(line, pos, MAN_ELEM, tok); |
if (NULL == p) |
if (NULL == p) |
return(0); |
return(0); |
return(man_node_append(man, p)); |
if ( ! man_node_append(m, p)) |
|
return(0); |
|
m->next = MAN_NEXT_CHILD; |
|
return(1); |
} |
} |
|
|
|
|
int |
int |
man_word_alloc(struct man *man, |
man_head_alloc(struct man *m, int line, int pos, int tok) |
int line, int pos, const char *word) |
|
{ |
{ |
struct man_node *p; |
struct man_node *p; |
|
|
p = man_node_alloc(line, pos, MAN_TEXT, -1); |
p = man_node_alloc(line, pos, MAN_HEAD, tok); |
if (NULL == p) |
if (NULL == p) |
return(0); |
return(0); |
if (NULL == (p->string = strdup(word))) |
if ( ! man_node_append(m, p)) |
return(0); |
return(0); |
return(man_node_append(man, p)); |
m->next = MAN_NEXT_CHILD; |
|
return(1); |
} |
} |
|
|
|
|
|
int |
|
man_body_alloc(struct man *m, int line, int pos, int tok) |
|
{ |
|
struct man_node *p; |
|
|
|
p = man_node_alloc(line, pos, MAN_BODY, tok); |
|
if (NULL == p) |
|
return(0); |
|
if ( ! man_node_append(m, p)) |
|
return(0); |
|
m->next = MAN_NEXT_CHILD; |
|
return(1); |
|
} |
|
|
|
|
|
int |
|
man_block_alloc(struct man *m, int line, int pos, int tok) |
|
{ |
|
struct man_node *p; |
|
|
|
p = man_node_alloc(line, pos, MAN_BLOCK, tok); |
|
if (NULL == p) |
|
return(0); |
|
if ( ! man_node_append(m, p)) |
|
return(0); |
|
m->next = MAN_NEXT_CHILD; |
|
return(1); |
|
} |
|
|
|
|
|
static int |
|
pstring(struct man *m, int line, int pos, |
|
const char *p, size_t len) |
|
{ |
|
struct man_node *n; |
|
size_t sv; |
|
|
|
n = man_node_alloc(line, pos, MAN_TEXT, -1); |
|
if (NULL == n) |
|
return(0); |
|
|
|
n->string = malloc(len + 1); |
|
if (NULL == n->string) { |
|
free(n); |
|
return(0); |
|
} |
|
|
|
sv = strlcpy(n->string, p, len + 1); |
|
|
|
/* Prohibit truncation. */ |
|
assert(sv < len + 1); |
|
|
|
if ( ! man_node_append(m, n)) |
|
return(0); |
|
m->next = MAN_NEXT_SIBLING; |
|
return(1); |
|
} |
|
|
|
|
|
/*
 * Append the NUL-terminated string `word' as a text node at
 * (line, pos).  This is pstring() applied to the whole of `word';
 * the return value is pstring()'s (1 on success, 0 on failure).
 */
int
man_word_alloc(struct man *m, int line, int pos, const char *word)
{
	const size_t	 wordlen = strlen(word);

	return pstring(m, line, pos, word, wordlen);
}
|
|
|
|
void |
void |
man_node_free(struct man_node *p) |
man_node_free(struct man_node *p) |
{ |
{ |
|
|
if (p->string) |
if (p->string) |
free(p->string); |
free(p->string); |
|
if (p->parent) |
|
p->parent->nchild--; |
free(p); |
free(p); |
} |
} |
|
|
Line 257 man_node_free(struct man_node *p) |
|
Line 374 man_node_free(struct man_node *p) |
|
void |
void |
man_node_freelist(struct man_node *p) |
man_node_freelist(struct man_node *p) |
{ |
{ |
|
struct man_node *n; |
|
|
if (p->child) |
if (p->child) |
man_node_freelist(p->child); |
man_node_freelist(p->child); |
if (p->next) |
assert(0 == p->nchild); |
man_node_freelist(p->next); |
n = p->next; |
|
|
man_node_free(p); |
man_node_free(p); |
|
if (n) |
|
man_node_freelist(n); |
} |
} |
|
|
|
|
static int |
static int |
man_ptext(struct man *m, int line, char *buf) |
man_ptext(struct man *m, int line, char *buf) |
{ |
{ |
|
int i, j; |
|
|
if ( ! man_word_alloc(m, line, 0, buf)) |
/* Literal free-form text whitespace is preserved. */ |
|
|
|
if (MAN_LITERAL & m->flags) { |
|
if ( ! man_word_alloc(m, line, 0, buf)) |
|
return(0); |
|
goto descope; |
|
} |
|
|
|
/* First de-chunk and allocate words. */ |
|
|
|
for (i = 0; ' ' == buf[i]; i++) |
|
/* Skip leading whitespace. */ ; |
|
if (0 == buf[i]) { |
|
if ( ! pstring(m, line, 0, &buf[i], 0)) |
|
return(0); |
|
goto descope; |
|
} |
|
|
|
for (j = i; buf[i]; i++) { |
|
if (' ' != buf[i]) |
|
continue; |
|
|
|
/* Escaped whitespace. */ |
|
if (i && ' ' == buf[i] && '\\' == buf[i - 1]) |
|
continue; |
|
|
|
buf[i++] = 0; |
|
if ( ! pstring(m, line, j, &buf[j], (size_t)(i - j))) |
|
return(0); |
|
|
|
for ( ; ' ' == buf[i]; i++) |
|
/* Skip trailing whitespace. */ ; |
|
|
|
j = i; |
|
if (0 == buf[i]) |
|
break; |
|
} |
|
|
|
if (j != i && ! pstring(m, line, j, &buf[j], (size_t)(i - j))) |
return(0); |
return(0); |
m->next = MAN_NEXT_SIBLING; |
|
|
|
|
descope: |
|
|
/* |
/* |
* If this is one of the zany NLINE macros that consumes the |
* Co-ordinate what happens with having a next-line scope open: |
* next line of input as being influenced, then close out the |
* first close out the element scope (if applicable), then close |
* existing macro "scope" and continue processing. |
* out the block scope (also if applicable). |
*/ |
*/ |
|
|
if ( ! (MAN_NLINE & m->flags)) |
if (MAN_ELINE & m->flags) { |
|
m->flags &= ~MAN_ELINE; |
|
if ( ! man_unscope(m, m->last->parent)) |
|
return(0); |
|
} |
|
|
|
if ( ! (MAN_BLINE & m->flags)) |
return(1); |
return(1); |
|
m->flags &= ~MAN_BLINE; |
|
|
m->flags &= ~MAN_NLINE; |
if ( ! man_unscope(m, m->last->parent)) |
m->last = m->last->parent; |
|
|
|
assert(MAN_ROOT != m->last->type); |
|
if ( ! man_valid_post(m)) |
|
return(0); |
return(0); |
if ( ! man_action_post(m)) |
return(man_body_alloc(m, line, 0, m->last->tok)); |
return(0); |
|
|
|
return(1); |
|
} |
} |
|
|
|
|
int |
int |
man_pmacro(struct man *m, int ln, char *buf) |
man_pmacro(struct man *m, int ln, char *buf) |
{ |
{ |
int i, j, c, ppos, fl; |
int i, j, c, ppos, fl; |
char mac[5]; |
char mac[5]; |
struct man_node *n; |
struct man_node *n; |
|
|
/* Comments and empties are quickly ignored. */ |
/* Comments and empties are quickly ignored. */ |
|
|
n = m->last; |
fl = m->flags; |
fl = MAN_NLINE & m->flags; |
|
|
|
if (0 == buf[1]) |
if (0 == buf[1]) |
goto out; |
goto out; |
Line 324 man_pmacro(struct man *m, int ln, char *buf) |
|
Line 482 man_pmacro(struct man *m, int ln, char *buf) |
|
|
|
ppos = i; |
ppos = i; |
|
|
if (buf[i] && '\\' == buf[i]) |
|
if (buf[i + 1] && '\"' == buf[i + 1]) |
|
goto out; |
|
|
|
/* Copy the first word into a nil-terminated buffer. */ |
/* Copy the first word into a nil-terminated buffer. */ |
|
|
for (j = 0; j < 4; j++, i++) { |
for (j = 0; j < 4; j++, i++) { |
Line 335 man_pmacro(struct man *m, int ln, char *buf) |
|
Line 489 man_pmacro(struct man *m, int ln, char *buf) |
|
break; |
break; |
else if (' ' == buf[i]) |
else if (' ' == buf[i]) |
break; |
break; |
|
|
|
/* Check for invalid characters. */ |
|
|
|
if (isgraph((u_char)buf[i])) |
|
continue; |
|
return(man_perr(m, ln, i, WNPRINT)); |
} |
} |
|
|
mac[j] = 0; |
mac[j] = 0; |
|
|
if (j == 4 || j < 1) { |
if (j == 4 || j < 1) { |
if ( ! (MAN_IGN_MACRO & m->pflags)) { |
if ( ! (MAN_IGN_MACRO & m->pflags)) { |
(void)man_verr(m, ln, ppos, |
(void)man_perr(m, ln, ppos, WMACROFORM); |
"ill-formed macro: %s", mac); |
|
goto err; |
goto err; |
} |
} |
if ( ! man_vwarn(m, ln, ppos, |
if ( ! man_pwarn(m, ln, ppos, WMACROFORM)) |
"ill-formed macro: %s", mac)) |
|
goto err; |
goto err; |
return(1); |
return(1); |
} |
} |
|
|
if (MAN_MAX == (c = man_hash_find(m->htab, mac))) { |
if (MAN_MAX == (c = man_hash_find(mac))) { |
if ( ! (MAN_IGN_MACRO & m->pflags)) { |
if ( ! (MAN_IGN_MACRO & m->pflags)) { |
(void)man_verr(m, ln, ppos, |
(void)man_perr(m, ln, ppos, WMACRO); |
"unknown macro: %s", mac); |
|
goto err; |
goto err; |
} |
} |
if ( ! man_vwarn(m, ln, ppos, |
if ( ! man_pwarn(m, ln, ppos, WMACRO)) |
"unknown macro: %s", mac)) |
|
goto err; |
goto err; |
return(1); |
return(1); |
} |
} |
Line 368 man_pmacro(struct man *m, int ln, char *buf) |
|
Line 524 man_pmacro(struct man *m, int ln, char *buf) |
|
while (buf[i] && ' ' == buf[i]) |
while (buf[i] && ' ' == buf[i]) |
i++; |
i++; |
|
|
|
/* Remove prior ELINE macro, if applicable. */ |
|
|
|
if (m->flags & MAN_ELINE) { |
|
n = m->last; |
|
assert(NULL == n->child); |
|
assert(0 == n->nchild); |
|
if ( ! man_nwarn(m, n, WLNSCOPE)) |
|
return(0); |
|
|
|
if (n->prev) { |
|
assert(n != n->parent->child); |
|
assert(n == n->prev->next); |
|
n->prev->next = NULL; |
|
m->last = n->prev; |
|
m->next = MAN_NEXT_SIBLING; |
|
} else { |
|
assert(n == n->parent->child); |
|
n->parent->child = NULL; |
|
m->last = n->parent; |
|
m->next = MAN_NEXT_CHILD; |
|
} |
|
|
|
man_node_free(n); |
|
m->flags &= ~MAN_ELINE; |
|
} |
|
|
/* Begin recursive parse sequence. */ |
/* Begin recursive parse sequence. */ |
|
|
if ( ! man_macro(m, c, ln, ppos, &i, buf)) |
assert(man_macros[c].fp); |
|
|
|
if ( ! (*man_macros[c].fp)(m, c, ln, ppos, &i, buf)) |
goto err; |
goto err; |
|
|
out: |
out: |
if (fl) { |
if ( ! (MAN_BLINE & fl)) |
/* |
return(1); |
* A NLINE macro has been immediately followed with |
|
* another. Close out the preceding macro's scope, and |
|
* continue. |
|
*/ |
|
assert(MAN_ROOT != m->last->type); |
|
assert(m->last->parent); |
|
assert(MAN_ROOT != m->last->parent->type); |
|
|
|
if (n != m->last) |
/* |
m->last = m->last->parent; |
* If we've opened a new next-line element scope, then return |
|
* now, as the next line will close out the block scope. |
|
*/ |
|
|
if ( ! man_valid_post(m)) |
if (MAN_ELINE & m->flags) |
return(0); |
return(1); |
if ( ! man_action_post(m)) |
|
return(0); |
|
m->next = MAN_NEXT_SIBLING; |
|
m->flags &= ~MAN_NLINE; |
|
} |
|
|
|
return(1); |
/* Close out the block scope opened in the prior line. */ |
|
|
|
assert(MAN_BLINE & m->flags); |
|
m->flags &= ~MAN_BLINE; |
|
|
|
if ( ! man_unscope(m, m->last->parent)) |
|
return(0); |
|
return(man_body_alloc(m, ln, 0, m->last->tok)); |
|
|
err: /* Error out. */ |
err: /* Error out. */ |
|
|
m->flags |= MAN_HALT; |
m->flags |= MAN_HALT; |
Line 436 man_vwarn(struct man *man, int ln, int pos, const char |
|
Line 617 man_vwarn(struct man *man, int ln, int pos, const char |
|
} |
} |
|
|
|
|
|
int |
|
man_err(struct man *m, int line, int pos, int iserr, enum merr type) |
|
{ |
|
const char *p; |
|
|
|
p = __man_merrnames[(int)type]; |
|
assert(p); |
|
|
|
if (iserr) |
|
return(man_verr(m, line, pos, p)); |
|
|
|
return(man_vwarn(m, line, pos, p)); |
|
} |