version 1.6, 2009/03/25 16:07:36 |
version 1.165, 2015/10/06 18:32:19 |
|
|
/* $Id$ */ |
/* $Id$ */ |
/* |
/* |
* Copyright (c) 2008, 2009 Kristaps Dzonsons <kristaps@openbsd.org> |
* Copyright (c) 2008, 2009, 2010, 2011 Kristaps Dzonsons <kristaps@bsd.lv> |
|
* Copyright (c) 2013, 2014, 2015 Ingo Schwarze <schwarze@openbsd.org> |
|
* Copyright (c) 2011 Joerg Sonnenberger <joerg@netbsd.org> |
* |
* |
* Permission to use, copy, modify, and distribute this software for any |
* Permission to use, copy, modify, and distribute this software for any |
* purpose with or without fee is hereby granted, provided that the |
* purpose with or without fee is hereby granted, provided that the above |
* above copyright notice and this permission notice appear in all |
* copyright notice and this permission notice appear in all copies. |
* copies. |
|
* |
* |
* THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL |
* THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHORS DISCLAIM ALL WARRANTIES |
* WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED |
* WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF |
* WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE |
* MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR |
* AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL |
* ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES |
* DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR |
* WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN |
* PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER |
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF |
* TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR |
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
* PERFORMANCE OF THIS SOFTWARE. |
|
*/ |
*/ |
|
#include "config.h" |
|
|
|
#include <sys/types.h> |
|
|
#include <assert.h> |
#include <assert.h> |
#include <ctype.h> |
#include <ctype.h> |
#include <err.h> |
|
#include <stdarg.h> |
#include <stdarg.h> |
#include <stdlib.h> |
#include <stdlib.h> |
#include <stdio.h> |
#include <stdio.h> |
#include <string.h> |
#include <string.h> |
|
|
|
#include "mandoc_aux.h" |
|
#include "mandoc.h" |
|
#include "roff.h" |
|
#include "man.h" |
|
#include "libmandoc.h" |
|
#include "roff_int.h" |
#include "libman.h" |
#include "libman.h" |
|
|
const char *const __man_macronames[MAN_MAX] = { |
const char *const __man_macronames[MAN_MAX] = { |
"\\\"", "TH", "SH", "SS", |
"br", "TH", "SH", "SS", |
"TP", "LP", "PP", "P", |
"TP", "LP", "PP", "P", |
"IP", "HP", "SM", "SB", |
"IP", "HP", "SM", "SB", |
"BI", "IB", "BR", "RB", |
"BI", "IB", "BR", "RB", |
"R", "B", "I", "IR" |
"R", "B", "I", "IR", |
|
"RI", "sp", "nf", |
|
"fi", "RE", "RS", "DT", |
|
"UC", "PD", "AT", "in", |
|
"ft", "OP", "EX", "EE", |
|
"UR", "UE", "ll" |
}; |
}; |
|
|
const char * const *man_macronames = __man_macronames; |
const char * const *man_macronames = __man_macronames; |
|
|
static struct man_node *man_node_alloc(int, int, enum man_type); |
static void man_descope(struct roff_man *, int, int); |
static int man_node_append(struct man *, |
static int man_ptext(struct roff_man *, int, char *, int); |
struct man_node *); |
static int man_pmacro(struct roff_man *, int, char *, int); |
static int man_ptext(struct man *, int, char *); |
|
static int man_pmacro(struct man *, int, char *); |
|
static void man_free1(struct man *); |
|
static void man_alloc1(struct man *); |
|
|
|
|
|
const struct man_node * |
int |
man_node(const struct man *m) |
man_parseln(struct roff_man *man, int ln, char *buf, int offs) |
{ |
{ |
|
|
return(MAN_HALT & m->flags ? NULL : m->first); |
if (man->last->type != ROFFT_EQN || ln > man->last->line) |
} |
man->flags |= MAN_NEWLINE; |
|
|
|
return roff_getcontrol(man->roff, buf, &offs) ? |
const struct man_meta * |
man_pmacro(man, ln, buf, offs) : |
man_meta(const struct man *m) |
man_ptext(man, ln, buf, offs); |
{ |
|
|
|
return(MAN_HALT & m->flags ? NULL : &m->meta); |
|
} |
} |
|
|
|
static void |
void |
man_descope(struct roff_man *man, int line, int offs) |
man_reset(struct man *man) |
|
{ |
{ |
|
/* |
|
* Co-ordinate what happens with having a next-line scope open: |
|
* first close out the element scope (if applicable), then close |
|
* out the block scope (also if applicable). |
|
*/ |
|
|
man_free1(man); |
if (man->flags & MAN_ELINE) { |
man_alloc1(man); |
man->flags &= ~MAN_ELINE; |
|
man_unscope(man, man->last->parent); |
|
} |
|
if ( ! (man->flags & MAN_BLINE)) |
|
return; |
|
man->flags &= ~MAN_BLINE; |
|
man_unscope(man, man->last->parent); |
|
roff_body_alloc(man, line, offs, man->last->tok); |
} |
} |
|
|
|
static int |
void |
man_ptext(struct roff_man *man, int line, char *buf, int offs) |
man_free(struct man *man) |
|
{ |
{ |
|
int i; |
|
|
man_free1(man); |
/* Literal free-form text whitespace is preserved. */ |
|
|
if (man->htab) |
if (man->flags & MAN_LITERAL) { |
man_hash_free(man->htab); |
roff_word_alloc(man, line, offs, buf + offs); |
free(man); |
man_descope(man, line, offs); |
} |
return 1; |
|
} |
|
|
|
for (i = offs; buf[i] == ' '; i++) |
|
/* Skip leading whitespace. */ ; |
|
|
struct man * |
/* |
man_alloc(void *data, const struct man_cb *cb) |
* Blank lines are ignored right after headings |
{ |
* but add a single vertical space elsewhere. |
struct man *p; |
*/ |
|
|
p = calloc(1, sizeof(struct man)); |
if (buf[i] == '\0') { |
if (NULL == p) |
/* Allocate a blank entry. */ |
err(1, "calloc"); |
if (man->last->tok != MAN_SH && |
|
man->last->tok != MAN_SS) { |
|
roff_elem_alloc(man, line, offs, MAN_sp); |
|
man->next = ROFF_NEXT_SIBLING; |
|
} |
|
return 1; |
|
} |
|
|
man_alloc1(p); |
/* |
|
* Warn if the last un-escaped character is whitespace. Then |
|
* strip away the remaining spaces (tabs stay!). |
|
*/ |
|
|
if (cb) |
i = (int)strlen(buf); |
(void)memcpy(&p->cb, cb, sizeof(struct man_cb)); |
assert(i); |
|
|
p->htab = man_hash_alloc(); |
if (' ' == buf[i - 1] || '\t' == buf[i - 1]) { |
p->data = data; |
if (i > 1 && '\\' != buf[i - 2]) |
return(p); |
mandoc_msg(MANDOCERR_SPACE_EOL, man->parse, |
} |
line, i - 1, NULL); |
|
|
|
for (--i; i && ' ' == buf[i]; i--) |
|
/* Spin back to non-space. */ ; |
|
|
int |
/* Jump ahead of escaped whitespace. */ |
man_endparse(struct man *m) |
i += '\\' == buf[i] ? 2 : 1; |
{ |
|
|
|
if (MAN_HALT & m->flags) |
buf[i] = '\0'; |
return(0); |
} |
else if (man_macroend(m)) |
roff_word_alloc(man, line, offs, buf + offs); |
return(1); |
|
m->flags |= MAN_HALT; |
|
return(0); |
|
} |
|
|
|
|
/* |
|
* End-of-sentence check. If the last character is an unescaped |
|
* EOS character, then flag the node as being the end of a |
|
* sentence. The front-end will know how to interpret this. |
|
*/ |
|
|
int |
assert(i); |
man_parseln(struct man *m, int ln, char *buf) |
if (mandoc_eos(buf, (size_t)i)) |
{ |
man->last->flags |= MAN_EOS; |
|
|
return('.' == *buf ? |
man_descope(man, line, offs); |
man_pmacro(m, ln, buf) : |
return 1; |
man_ptext(m, ln, buf)); |
|
} |
} |
|
|
|
static int |
static void |
man_pmacro(struct roff_man *man, int ln, char *buf, int offs) |
man_free1(struct man *man) |
|
{ |
{ |
|
struct roff_node *n; |
|
const char *cp; |
|
int tok; |
|
int i, ppos; |
|
int bline; |
|
char mac[5]; |
|
|
if (man->first) |
ppos = offs; |
man_node_freelist(man->first); |
|
if (man->meta.title) |
|
free(man->meta.title); |
|
if (man->meta.source) |
|
free(man->meta.source); |
|
if (man->meta.vol) |
|
free(man->meta.vol); |
|
} |
|
|
|
|
/* |
|
* Copy the first word into a nil-terminated buffer. |
|
* Stop when a space, tab, escape, or eoln is encountered. |
|
*/ |
|
|
static void |
i = 0; |
man_alloc1(struct man *m) |
while (i < 4 && strchr(" \t\\", buf[offs]) == NULL) |
{ |
mac[i++] = buf[offs++]; |
|
|
bzero(&m->meta, sizeof(struct man_meta)); |
mac[i] = '\0'; |
m->flags = 0; |
|
m->last = calloc(1, sizeof(struct man_node)); |
|
if (NULL == m->last) |
|
err(1, "calloc"); |
|
m->first = m->last; |
|
m->last->type = MAN_ROOT; |
|
m->next = MAN_NEXT_CHILD; |
|
} |
|
|
|
|
tok = (i > 0 && i < 4) ? man_hash_find(mac) : TOKEN_NONE; |
|
|
static int |
if (tok == TOKEN_NONE) { |
man_node_append(struct man *man, struct man_node *p) |
mandoc_msg(MANDOCERR_MACRO, man->parse, |
{ |
ln, ppos, buf + ppos - 1); |
|
return 1; |
|
} |
|
|
assert(man->last); |
/* Skip a leading escape sequence or tab. */ |
assert(man->first); |
|
assert(MAN_ROOT != p->type); |
|
|
|
switch (man->next) { |
switch (buf[offs]) { |
case (MAN_NEXT_SIBLING): |
case '\\': |
man->last->next = p; |
cp = buf + offs + 1; |
p->prev = man->last; |
mandoc_escape(&cp, NULL, NULL); |
p->parent = man->last->parent; |
offs = cp - buf; |
break; |
break; |
case (MAN_NEXT_CHILD): |
case '\t': |
man->last->child = p; |
offs++; |
p->parent = man->last; |
|
break; |
break; |
default: |
default: |
abort(); |
|
/* NOTREACHED */ |
|
} |
|
|
|
man->last = p; |
|
|
|
switch (p->type) { |
|
case (MAN_TEXT): |
|
if ( ! man_valid_post(man)) |
|
return(0); |
|
if ( ! man_action_post(man)) |
|
return(0); |
|
break; |
break; |
default: |
|
break; |
|
} |
} |
|
|
return(1); |
/* Jump to the next non-whitespace word. */ |
} |
|
|
|
|
while (buf[offs] && buf[offs] == ' ') |
|
offs++; |
|
|
static struct man_node * |
/* |
man_node_alloc(int line, int pos, enum man_type type) |
* Trailing whitespace. Note that tabs are allowed to be passed |
{ |
* into the parser as "text", so we only warn about spaces here. |
struct man_node *p; |
*/ |
|
|
if (NULL == (p = calloc(1, sizeof(struct man_node)))) |
if (buf[offs] == '\0' && buf[offs - 1] == ' ') |
err(1, "malloc"); |
mandoc_msg(MANDOCERR_SPACE_EOL, man->parse, |
p->line = line; |
ln, offs - 1, NULL); |
p->pos = pos; |
|
p->type = type; |
|
|
|
return(p); |
/* |
} |
* Some macros break next-line scopes; otherwise, remember |
|
* whether we are in next-line scope for a block head. |
|
*/ |
|
|
|
man_breakscope(man, tok); |
|
bline = man->flags & MAN_BLINE; |
|
|
int |
/* Call to handler... */ |
man_elem_alloc(struct man *man, int line, int pos, int tok) |
|
{ |
|
struct man_node *p; |
|
|
|
p = man_node_alloc(line, pos, MAN_ELEM); |
assert(man_macros[tok].fp); |
p->tok = tok; |
(*man_macros[tok].fp)(man, tok, ln, ppos, &offs, buf); |
|
|
return(man_node_append(man, p)); |
/* In quick mode (for mandocdb), abort after the NAME section. */ |
} |
|
|
|
|
if (man->quick && tok == MAN_SH) { |
|
n = man->last; |
|
if (n->type == ROFFT_BODY && |
|
strcmp(n->prev->child->string, "NAME")) |
|
return 2; |
|
} |
|
|
int |
/* |
man_word_alloc(struct man *man, |
* If we are in a next-line scope for a block head, |
int line, int pos, const char *word) |
* close it out now and switch to the body, |
{ |
* unless the next-line scope is allowed to continue. |
struct man_node *p; |
*/ |
|
|
p = man_node_alloc(line, pos, MAN_TEXT); |
if ( ! bline || man->flags & MAN_ELINE || |
if (NULL == (p->string = strdup(word))) |
man_macros[tok].flags & MAN_NSCOPED) |
err(1, "strdup"); |
return 1; |
|
|
return(man_node_append(man, p)); |
assert(man->flags & MAN_BLINE); |
} |
man->flags &= ~MAN_BLINE; |
|
|
|
man_unscope(man, man->last->parent); |
void |
roff_body_alloc(man, ln, ppos, man->last->tok); |
man_node_free(struct man_node *p) |
return 1; |
{ |
|
|
|
if (p->string) |
|
free(p->string); |
|
free(p); |
|
} |
} |
|
|
|
|
void |
void |
man_node_freelist(struct man_node *p) |
man_breakscope(struct roff_man *man, int tok) |
{ |
{ |
|
struct roff_node *n; |
|
|
if (p->child) |
/* |
man_node_freelist(p->child); |
* An element next line scope is open, |
if (p->next) |
* and the new macro is not allowed inside elements. |
man_node_freelist(p->next); |
* Delete the element that is being broken. |
|
*/ |
|
|
man_node_free(p); |
if (man->flags & MAN_ELINE && (tok == TOKEN_NONE || |
} |
! (man_macros[tok].flags & MAN_NSCOPED))) { |
|
n = man->last; |
|
assert(n->type != ROFFT_TEXT); |
|
if (man_macros[n->tok].flags & MAN_NSCOPED) |
|
n = n->parent; |
|
|
|
mandoc_vmsg(MANDOCERR_BLK_LINE, man->parse, |
|
n->line, n->pos, "%s breaks %s", |
|
tok == TOKEN_NONE ? "TS" : man_macronames[tok], |
|
man_macronames[n->tok]); |
|
|
static int |
roff_node_delete(man, n); |
man_ptext(struct man *m, int line, char *buf) |
man->flags &= ~MAN_ELINE; |
{ |
|
|
|
if ( ! man_word_alloc(m, line, 0, buf)) |
|
return(0); |
|
m->next = MAN_NEXT_SIBLING; |
|
return(1); |
|
} |
|
|
|
|
|
int |
|
man_pmacro(struct man *m, int ln, char *buf) |
|
{ |
|
int i, c; |
|
char mac[5]; |
|
|
|
/* Comments and empties are quickly ignored. */ |
|
|
|
if (0 == buf[1]) |
|
return(1); |
|
|
|
if (' ' == buf[1]) { |
|
i = 2; |
|
while (buf[i] && ' ' == buf[i]) |
|
i++; |
|
if (0 == buf[i]) |
|
return(1); |
|
warnx("invalid syntax"); |
|
return(0); |
|
} |
} |
|
|
if (buf[1] && '\\' == buf[1]) |
/* |
if (buf[2] && '\"' == buf[2]) |
* Weird special case: |
return(1); |
* Switching fill mode closes section headers. |
|
*/ |
|
|
/* Copy the first word into a nil-terminated buffer. */ |
if (man->flags & MAN_BLINE && |
|
(tok == MAN_nf || tok == MAN_fi) && |
for (i = 1; i < 5; i++) { |
(man->last->tok == MAN_SH || man->last->tok == MAN_SS)) { |
if (0 == (mac[i - 1] = buf[i])) |
n = man->last; |
break; |
man_unscope(man, n); |
else if (' ' == buf[i]) |
roff_body_alloc(man, n->line, n->pos, n->tok); |
break; |
man->flags &= ~MAN_BLINE; |
} |
} |
|
|
mac[i - 1] = 0; |
/* |
|
* A block header next line scope is open, |
|
* and the new macro is not allowed inside block headers. |
|
* Delete the block that is being broken. |
|
*/ |
|
|
if (i == 5 || i <= 1) { |
if (man->flags & MAN_BLINE && (tok == TOKEN_NONE || |
warnx("unknown macro: %s", mac); |
man_macros[tok].flags & MAN_BSCOPE)) { |
goto err; |
n = man->last; |
} |
if (n->type == ROFFT_TEXT) |
|
n = n->parent; |
if (MAN_MAX == (c = man_hash_find(m->htab, mac))) { |
if ( ! (man_macros[n->tok].flags & MAN_BSCOPE)) |
warnx("unknown macro: %s", mac); |
n = n->parent; |
goto err; |
|
} |
|
|
|
/* The macro is sane. Jump to the next word. */ |
assert(n->type == ROFFT_HEAD); |
|
n = n->parent; |
|
assert(n->type == ROFFT_BLOCK); |
|
assert(man_macros[n->tok].flags & MAN_SCOPED); |
|
|
while (buf[i] && ' ' == buf[i]) |
mandoc_vmsg(MANDOCERR_BLK_LINE, man->parse, |
i++; |
n->line, n->pos, "%s breaks %s", |
|
tok == TOKEN_NONE ? "TS" : man_macronames[tok], |
|
man_macronames[n->tok]); |
|
|
/* Begin recursive parse sequence. */ |
roff_node_delete(man, n); |
|
man->flags &= ~MAN_BLINE; |
if ( ! man_macro(m, c, ln, 1, &i, buf)) |
} |
goto err; |
|
|
|
return(1); |
|
|
|
err: /* Error out. */ |
|
|
|
m->flags |= MAN_HALT; |
|
return(0); |
|
} |
} |
|
|
|
const struct mparse * |
int |
man_mparse(const struct roff_man *man) |
man_verr(struct man *man, int ln, int pos, const char *fmt, ...) |
|
{ |
{ |
char buf[256]; |
|
va_list ap; |
|
|
|
if (NULL == man->cb.man_err) |
assert(man && man->parse); |
return(0); |
return man->parse; |
|
|
va_start(ap, fmt); |
|
(void)vsnprintf(buf, sizeof(buf) - 1, fmt, ap); |
|
va_end(ap); |
|
return((*man->cb.man_err)(man->data, ln, pos, buf)); |
|
} |
} |
|
|
|
|
int |
|
man_vwarn(struct man *man, int ln, int pos, const char *fmt, ...) |
|
{ |
|
char buf[256]; |
|
va_list ap; |
|
|
|
if (NULL == man->cb.man_warn) |
|
return(0); |
|
|
|
va_start(ap, fmt); |
|
(void)vsnprintf(buf, sizeof(buf) - 1, fmt, ap); |
|
va_end(ap); |
|
return((*man->cb.man_warn)(man->data, ln, pos, buf)); |
|
} |
|
|
|
|
|