version 1.35, 2013/05/30 03:52:59 |
version 1.44, 2014/03/19 21:51:20 |
|
|
/* $Id$ */ |
/* $Id$ */ |
/* |
/* |
* Copyright (c) 2008, 2009, 2010, 2011 Kristaps Dzonsons <kristaps@bsd.lv> |
* Copyright (c) 2008, 2009, 2010, 2011 Kristaps Dzonsons <kristaps@bsd.lv> |
* Copyright (c) 2010, 2011, 2012, 2013 Ingo Schwarze <schwarze@openbsd.org> |
* Copyright (c) 2010-2014 Ingo Schwarze <schwarze@openbsd.org> |
|
* Copyright (c) 2010, 2012 Joerg Sonnenberger <joerg@netbsd.org> |
* |
* |
* Permission to use, copy, modify, and distribute this software for any |
* Permission to use, copy, modify, and distribute this software for any |
* purpose with or without fee is hereby granted, provided that the above |
* purpose with or without fee is hereby granted, provided that the above |
|
|
|
|
#include <assert.h> |
#include <assert.h> |
#include <ctype.h> |
#include <ctype.h> |
|
#include <errno.h> |
#include <fcntl.h> |
#include <fcntl.h> |
#include <stdarg.h> |
#include <stdarg.h> |
#include <stdint.h> |
#include <stdint.h> |
|
|
#include "man.h" |
#include "man.h" |
#include "main.h" |
#include "main.h" |
|
|
#ifndef MAP_FILE |
|
#define MAP_FILE 0 |
|
#endif |
|
|
|
#define REPARSE_LIMIT 1000 |
#define REPARSE_LIMIT 1000 |
|
|
struct buf { |
struct buf { |
|
|
enum mandoclevel file_status; /* status of current parse */ |
enum mandoclevel file_status; /* status of current parse */ |
enum mandoclevel wlevel; /* ignore messages below this */ |
enum mandoclevel wlevel; /* ignore messages below this */ |
int line; /* line number in the file */ |
int line; /* line number in the file */ |
enum mparset inttype; /* which parser to use */ |
int options; /* parser options */ |
struct man *pman; /* persistent man parser */ |
struct man *pman; /* persistent man parser */ |
struct mdoc *pmdoc; /* persistent mdoc parser */ |
struct mdoc *pmdoc; /* persistent mdoc parser */ |
struct man *man; /* man parser */ |
struct man *man; /* man parser */ |
|
|
struct roff *roff; /* roff parser (!NULL) */ |
struct roff *roff; /* roff parser (!NULL) */ |
int reparse_count; /* finite interp. stack */ |
int reparse_count; /* finite interp. stack */ |
mandocmsg mmsg; /* warning/error message handler */ |
mandocmsg mmsg; /* warning/error message handler */ |
void *arg; /* argument to mmsg */ |
|
const char *file; |
const char *file; |
struct buf *secondary; |
struct buf *secondary; |
char *defos; /* default operating system */ |
char *defos; /* default operating system */ |
|
|
|
|
static void resize_buf(struct buf *, size_t); |
static void resize_buf(struct buf *, size_t); |
static void mparse_buf_r(struct mparse *, struct buf, int); |
static void mparse_buf_r(struct mparse *, struct buf, int); |
static void mparse_readfd_r(struct mparse *, int, const char *, int); |
|
static void pset(const char *, int, struct mparse *); |
static void pset(const char *, int, struct mparse *); |
static int read_whole_file(const char *, int, struct buf *, int *); |
static int read_whole_file(struct mparse *, const char *, int, |
|
struct buf *, int *); |
static void mparse_end(struct mparse *); |
static void mparse_end(struct mparse *); |
|
static void mparse_parse_buffer(struct mparse *, struct buf, |
|
const char *); |
|
|
static const enum mandocerr mandoclimits[MANDOCLEVEL_MAX] = { |
static const enum mandocerr mandoclimits[MANDOCLEVEL_MAX] = { |
MANDOCERR_OK, |
MANDOCERR_OK, |
Line 109 static const char * const mandocerrs[MANDOCERR_MAX] = |
|
Line 108 static const char * const mandocerrs[MANDOCERR_MAX] = |
|
"bad NAME section contents", |
"bad NAME section contents", |
"sections out of conventional order", |
"sections out of conventional order", |
"duplicate section name", |
"duplicate section name", |
"section not in conventional manual section", |
"section header suited to sections 2, 3, and 9 only", |
|
|
/* related to macros and nesting */ |
/* related to macros and nesting */ |
"skipping obsolete macro", |
"skipping obsolete macro", |
Line 188 static const char * const mandocerrs[MANDOCERR_MAX] = |
|
Line 187 static const char * const mandocerrs[MANDOCERR_MAX] = |
|
"macro requires line argument(s)", |
"macro requires line argument(s)", |
"macro requires body argument(s)", |
"macro requires body argument(s)", |
"macro requires argument(s)", |
"macro requires argument(s)", |
|
"request requires a numeric argument", |
"missing list type", |
"missing list type", |
"line argument(s) will be lost", |
"line argument(s) will be lost", |
"body argument(s) will be lost", |
"body argument(s) will be lost", |
|
|
"generic fatal error", |
"generic fatal error", |
|
|
|
"input too large", |
"not a manual", |
"not a manual", |
"column syntax is inconsistent", |
"column syntax is inconsistent", |
"NOT IMPLEMENTED: .Bd -file", |
"NOT IMPLEMENTED: .Bd -file", |
Line 204 static const char * const mandocerrs[MANDOCERR_MAX] = |
|
Line 205 static const char * const mandocerrs[MANDOCERR_MAX] = |
|
"no document body", |
"no document body", |
"no document prologue", |
"no document prologue", |
"static buffer exhausted", |
"static buffer exhausted", |
|
|
|
/* system errors */ |
|
"cannot open file", |
|
"cannot stat file", |
|
"cannot read file", |
}; |
}; |
|
|
static const char * const mandoclevels[MANDOCLEVEL_MAX] = { |
static const char * const mandoclevels[MANDOCLEVEL_MAX] = { |
Line 248 pset(const char *buf, int pos, struct mparse *curp) |
|
Line 254 pset(const char *buf, int pos, struct mparse *curp) |
|
return; |
return; |
} |
} |
|
|
switch (curp->inttype) { |
if (MPARSE_MDOC & curp->options) { |
case (MPARSE_MDOC): |
|
if (NULL == curp->pmdoc) |
if (NULL == curp->pmdoc) |
curp->pmdoc = mdoc_alloc(curp->roff, curp, |
curp->pmdoc = mdoc_alloc( |
curp->defos); |
curp->roff, curp, curp->defos, |
|
MPARSE_QUICK & curp->options ? 1 : 0); |
assert(curp->pmdoc); |
assert(curp->pmdoc); |
curp->mdoc = curp->pmdoc; |
curp->mdoc = curp->pmdoc; |
return; |
return; |
case (MPARSE_MAN): |
} else if (MPARSE_MAN & curp->options) { |
if (NULL == curp->pman) |
if (NULL == curp->pman) |
curp->pman = man_alloc(curp->roff, curp); |
curp->pman = man_alloc(curp->roff, curp, |
|
MPARSE_QUICK & curp->options ? 1 : 0); |
assert(curp->pman); |
assert(curp->pman); |
curp->man = curp->pman; |
curp->man = curp->pman; |
return; |
return; |
default: |
|
break; |
|
} |
} |
|
|
if (pos >= 3 && 0 == memcmp(buf, ".Dd", 3)) { |
if (pos >= 3 && 0 == memcmp(buf, ".Dd", 3)) { |
if (NULL == curp->pmdoc) |
if (NULL == curp->pmdoc) |
curp->pmdoc = mdoc_alloc(curp->roff, curp, |
curp->pmdoc = mdoc_alloc( |
curp->defos); |
curp->roff, curp, curp->defos, |
|
MPARSE_QUICK & curp->options ? 1 : 0); |
assert(curp->pmdoc); |
assert(curp->pmdoc); |
curp->mdoc = curp->pmdoc; |
curp->mdoc = curp->pmdoc; |
return; |
return; |
} |
} |
|
|
if (NULL == curp->pman) |
if (NULL == curp->pman) |
curp->pman = man_alloc(curp->roff, curp); |
curp->pman = man_alloc(curp->roff, curp, |
|
MPARSE_QUICK & curp->options ? 1 : 0); |
assert(curp->pman); |
assert(curp->pman); |
curp->man = curp->pman; |
curp->man = curp->pman; |
} |
} |
|
|
*/ |
*/ |
if (curp->secondary) |
if (curp->secondary) |
curp->secondary->sz -= pos + 1; |
curp->secondary->sz -= pos + 1; |
mparse_readfd_r(curp, -1, ln.buf + of, 1); |
mparse_readfd(curp, -1, ln.buf + of); |
if (MANDOCLEVEL_FATAL <= curp->file_status) |
if (MANDOCLEVEL_FATAL <= curp->file_status) |
break; |
break; |
pos = 0; |
pos = 0; |
|
|
if (0 == rc) { |
if (0 == rc) { |
assert(MANDOCLEVEL_FATAL <= curp->file_status); |
assert(MANDOCLEVEL_FATAL <= curp->file_status); |
break; |
break; |
} |
} else if (2 == rc) |
|
break; |
|
|
/* Temporary buffers typically are not full. */ |
/* Temporary buffers typically are not full. */ |
|
|
|
|
} |
} |
|
|
static int |
static int |
read_whole_file(const char *file, int fd, struct buf *fb, int *with_mmap) |
read_whole_file(struct mparse *curp, const char *file, int fd, |
|
struct buf *fb, int *with_mmap) |
{ |
{ |
size_t off; |
size_t off; |
ssize_t ssz; |
ssize_t ssz; |
Line 578 read_whole_file(const char *file, int fd, struct buf * |
|
Line 587 read_whole_file(const char *file, int fd, struct buf * |
|
#ifdef HAVE_MMAP |
#ifdef HAVE_MMAP |
struct stat st; |
struct stat st; |
if (-1 == fstat(fd, &st)) { |
if (-1 == fstat(fd, &st)) { |
perror(file); |
curp->file_status = MANDOCLEVEL_SYSERR; |
|
if (curp->mmsg) |
|
(*curp->mmsg)(MANDOCERR_SYSSTAT, curp->file_status, |
|
file, 0, 0, strerror(errno)); |
return(0); |
return(0); |
} |
} |
|
|
Line 591 read_whole_file(const char *file, int fd, struct buf * |
|
Line 603 read_whole_file(const char *file, int fd, struct buf * |
|
|
|
if (S_ISREG(st.st_mode)) { |
if (S_ISREG(st.st_mode)) { |
if (st.st_size >= (1U << 31)) { |
if (st.st_size >= (1U << 31)) { |
fprintf(stderr, "%s: input too large\n", file); |
curp->file_status = MANDOCLEVEL_FATAL; |
|
if (curp->mmsg) |
|
(*curp->mmsg)(MANDOCERR_TOOLARGE, |
|
curp->file_status, file, 0, 0, NULL); |
return(0); |
return(0); |
} |
} |
*with_mmap = 1; |
*with_mmap = 1; |
fb->sz = (size_t)st.st_size; |
fb->sz = (size_t)st.st_size; |
fb->buf = mmap(NULL, fb->sz, PROT_READ, |
fb->buf = mmap(NULL, fb->sz, PROT_READ, MAP_SHARED, fd, 0); |
MAP_FILE|MAP_SHARED, fd, 0); |
|
if (fb->buf != MAP_FAILED) |
if (fb->buf != MAP_FAILED) |
return(1); |
return(1); |
} |
} |
Line 615 read_whole_file(const char *file, int fd, struct buf * |
|
Line 629 read_whole_file(const char *file, int fd, struct buf * |
|
for (;;) { |
for (;;) { |
if (off == fb->sz) { |
if (off == fb->sz) { |
if (fb->sz == (1U << 31)) { |
if (fb->sz == (1U << 31)) { |
fprintf(stderr, "%s: input too large\n", file); |
curp->file_status = MANDOCLEVEL_FATAL; |
|
if (curp->mmsg) |
|
(*curp->mmsg)(MANDOCERR_TOOLARGE, |
|
curp->file_status, |
|
file, 0, 0, NULL); |
break; |
break; |
} |
} |
resize_buf(fb, 65536); |
resize_buf(fb, 65536); |
Line 626 read_whole_file(const char *file, int fd, struct buf * |
|
Line 644 read_whole_file(const char *file, int fd, struct buf * |
|
return(1); |
return(1); |
} |
} |
if (ssz == -1) { |
if (ssz == -1) { |
perror(file); |
curp->file_status = MANDOCLEVEL_SYSERR; |
|
if (curp->mmsg) |
|
(*curp->mmsg)(MANDOCERR_SYSREAD, |
|
curp->file_status, file, 0, 0, |
|
strerror(errno)); |
break; |
break; |
} |
} |
off += (size_t)ssz; |
off += (size_t)ssz; |
Line 664 mparse_end(struct mparse *curp) |
|
Line 686 mparse_end(struct mparse *curp) |
|
} |
} |
|
|
static void |
static void |
mparse_parse_buffer(struct mparse *curp, struct buf blk, const char *file, |
mparse_parse_buffer(struct mparse *curp, struct buf blk, const char *file) |
int re) |
|
{ |
{ |
const char *svfile; |
const char *svfile; |
|
static int recursion_depth; |
|
|
|
if (64 < recursion_depth) { |
|
mandoc_msg(MANDOCERR_ROFFLOOP, curp, curp->line, 0, NULL); |
|
return; |
|
} |
|
|
/* Line number is per-file. */ |
/* Line number is per-file. */ |
svfile = curp->file; |
svfile = curp->file; |
curp->file = file; |
curp->file = file; |
curp->line = 1; |
curp->line = 1; |
|
recursion_depth++; |
|
|
mparse_buf_r(curp, blk, 1); |
mparse_buf_r(curp, blk, 1); |
|
|
if (0 == re && MANDOCLEVEL_FATAL > curp->file_status) |
if (0 == --recursion_depth && MANDOCLEVEL_FATAL > curp->file_status) |
mparse_end(curp); |
mparse_end(curp); |
|
|
curp->file = svfile; |
curp->file = svfile; |
Line 691 mparse_readmem(struct mparse *curp, const void *buf, s |
|
Line 719 mparse_readmem(struct mparse *curp, const void *buf, s |
|
blk.buf = UNCONST(buf); |
blk.buf = UNCONST(buf); |
blk.sz = len; |
blk.sz = len; |
|
|
mparse_parse_buffer(curp, blk, file, 0); |
mparse_parse_buffer(curp, blk, file); |
return(curp->file_status); |
return(curp->file_status); |
} |
} |
|
|
static void |
enum mandoclevel |
mparse_readfd_r(struct mparse *curp, int fd, const char *file, int re) |
mparse_readfd(struct mparse *curp, int fd, const char *file) |
{ |
{ |
struct buf blk; |
struct buf blk; |
int with_mmap; |
int with_mmap; |
|
|
if (-1 == fd) |
if (-1 == fd && -1 == (fd = open(file, O_RDONLY, 0))) { |
if (-1 == (fd = open(file, O_RDONLY, 0))) { |
curp->file_status = MANDOCLEVEL_SYSERR; |
perror(file); |
if (curp->mmsg) |
curp->file_status = MANDOCLEVEL_SYSERR; |
(*curp->mmsg)(MANDOCERR_SYSOPEN, |
return; |
curp->file_status, |
} |
file, 0, 0, strerror(errno)); |
|
goto out; |
|
} |
|
|
/* |
/* |
* Run for each opened file; may be called more than once for |
* Run for each opened file; may be called more than once for |
* each full parse sequence if the opened file is nested (i.e., |
* each full parse sequence if the opened file is nested (i.e., |
Line 714 mparse_readfd_r(struct mparse *curp, int fd, const cha |
|
Line 745 mparse_readfd_r(struct mparse *curp, int fd, const cha |
|
* the parse phase for the file. |
* the parse phase for the file. |
*/ |
*/ |
|
|
if ( ! read_whole_file(file, fd, &blk, &with_mmap)) { |
if ( ! read_whole_file(curp, file, fd, &blk, &with_mmap)) |
curp->file_status = MANDOCLEVEL_SYSERR; |
goto out; |
return; |
|
} |
|
|
|
mparse_parse_buffer(curp, blk, file, re); |
mparse_parse_buffer(curp, blk, file); |
|
|
#ifdef HAVE_MMAP |
#ifdef HAVE_MMAP |
if (with_mmap) |
if (with_mmap) |
Line 730 mparse_readfd_r(struct mparse *curp, int fd, const cha |
|
Line 759 mparse_readfd_r(struct mparse *curp, int fd, const cha |
|
|
|
if (STDIN_FILENO != fd && -1 == close(fd)) |
if (STDIN_FILENO != fd && -1 == close(fd)) |
perror(file); |
perror(file); |
} |
out: |
|
|
enum mandoclevel |
|
mparse_readfd(struct mparse *curp, int fd, const char *file) |
|
{ |
|
|
|
mparse_readfd_r(curp, fd, file, 0); |
|
return(curp->file_status); |
return(curp->file_status); |
} |
} |
|
|
struct mparse * |
struct mparse * |
mparse_alloc(enum mparset inttype, enum mandoclevel wlevel, |
mparse_alloc(int options, enum mandoclevel wlevel, |
mandocmsg mmsg, void *arg, char *defos) |
mandocmsg mmsg, char *defos) |
{ |
{ |
struct mparse *curp; |
struct mparse *curp; |
|
|
Line 750 mparse_alloc(enum mparset inttype, enum mandoclevel wl |
|
Line 773 mparse_alloc(enum mparset inttype, enum mandoclevel wl |
|
|
|
curp = mandoc_calloc(1, sizeof(struct mparse)); |
curp = mandoc_calloc(1, sizeof(struct mparse)); |
|
|
|
curp->options = options; |
curp->wlevel = wlevel; |
curp->wlevel = wlevel; |
curp->mmsg = mmsg; |
curp->mmsg = mmsg; |
curp->arg = arg; |
|
curp->inttype = inttype; |
|
curp->defos = defos; |
curp->defos = defos; |
|
|
curp->roff = roff_alloc(inttype, curp); |
curp->roff = roff_alloc(curp, options); |
return(curp); |
return(curp); |
} |
} |
|
|