version 1.108, 2015/01/14 22:02:50 |
version 1.133, 2015/04/02 21:36:50 |
|
|
* purpose with or without fee is hereby granted, provided that the above |
* purpose with or without fee is hereby granted, provided that the above |
* copyright notice and this permission notice appear in all copies. |
* copyright notice and this permission notice appear in all copies. |
* |
* |
* THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES |
* THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHORS DISCLAIM ALL WARRANTIES |
* WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF |
* WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF |
* MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR |
* MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR |
* ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES |
* ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES |
* WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN |
* WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN |
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF |
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF |
|
|
#include <ctype.h> |
#include <ctype.h> |
#include <errno.h> |
#include <errno.h> |
#include <fcntl.h> |
#include <fcntl.h> |
|
#include <signal.h> |
#include <stdarg.h> |
#include <stdarg.h> |
#include <stdint.h> |
#include <stdint.h> |
#include <stdio.h> |
#include <stdio.h> |
|
|
#include <string.h> |
#include <string.h> |
#include <unistd.h> |
#include <unistd.h> |
|
|
#include "mandoc.h" |
|
#include "mandoc_aux.h" |
#include "mandoc_aux.h" |
#include "libmandoc.h" |
#include "mandoc.h" |
|
#include "roff.h" |
#include "mdoc.h" |
#include "mdoc.h" |
#include "man.h" |
#include "man.h" |
|
#include "libmandoc.h" |
|
|
#define REPARSE_LIMIT 1000 |
#define REPARSE_LIMIT 1000 |
|
|
Line 80 static const enum mandocerr mandoclimits[MANDOCLEVEL_M |
|
Line 82 static const enum mandocerr mandoclimits[MANDOCLEVEL_M |
|
MANDOCERR_WARNING, |
MANDOCERR_WARNING, |
MANDOCERR_WARNING, |
MANDOCERR_WARNING, |
MANDOCERR_ERROR, |
MANDOCERR_ERROR, |
MANDOCERR_FATAL, |
MANDOCERR_UNSUPP, |
MANDOCERR_MAX, |
MANDOCERR_MAX, |
MANDOCERR_MAX |
MANDOCERR_MAX |
}; |
}; |
Line 109 static const char * const mandocerrs[MANDOCERR_MAX] = |
|
Line 111 static const char * const mandocerrs[MANDOCERR_MAX] = |
|
"no document body", |
"no document body", |
"content before first section header", |
"content before first section header", |
"first section is not \"NAME\"", |
"first section is not \"NAME\"", |
"bad NAME section contents", |
"NAME section without name", |
|
"NAME section without description", |
|
"description not at the end of NAME", |
|
"bad NAME section content", |
|
"missing description line, using \"\"", |
"sections out of conventional order", |
"sections out of conventional order", |
"duplicate section title", |
"duplicate section title", |
"unexpected section", |
"unexpected section", |
Line 135 static const char * const mandocerrs[MANDOCERR_MAX] = |
|
Line 141 static const char * const mandocerrs[MANDOCERR_MAX] = |
|
"skipping empty request", |
"skipping empty request", |
"conditional request controls empty scope", |
"conditional request controls empty scope", |
"skipping empty macro", |
"skipping empty macro", |
|
"empty block", |
"empty argument, using 0n", |
"empty argument, using 0n", |
"argument count wrong", |
|
"missing display type, using -ragged", |
"missing display type, using -ragged", |
"list type is not the first argument", |
"list type is not the first argument", |
"missing -width in -tag list, using 8n", |
"missing -width in -tag list, using 8n", |
"missing utility name, using \"\"", |
"missing utility name, using \"\"", |
|
"missing function name, using \"\"", |
"empty head in list item", |
"empty head in list item", |
"empty list item", |
"empty list item", |
"missing font type, using \\fR", |
"missing font type, using \\fR", |
"unknown font type, using \\fR", |
"unknown font type, using \\fR", |
"nothing follows prefix", |
"nothing follows prefix", |
|
"empty reference block", |
"missing -std argument, adding it", |
"missing -std argument, adding it", |
|
"missing option string, using \"\"", |
|
"missing resource identifier, using \"\"", |
"missing eqn box, using \"\"", |
"missing eqn box, using \"\"", |
|
|
/* related to bad macro arguments */ |
/* related to bad macro arguments */ |
Line 156 static const char * const mandocerrs[MANDOCERR_MAX] = |
|
Line 166 static const char * const mandocerrs[MANDOCERR_MAX] = |
|
"skipping duplicate display type", |
"skipping duplicate display type", |
"skipping duplicate list type", |
"skipping duplicate list type", |
"skipping -width argument", |
"skipping -width argument", |
|
"wrong number of cells", |
"unknown AT&T UNIX version", |
"unknown AT&T UNIX version", |
"comma in function argument", |
"comma in function argument", |
"parenthesis in function name", |
"parenthesis in function name", |
"invalid content in Rs block", |
"invalid content in Rs block", |
"invalid Boolean argument", |
"invalid Boolean argument", |
"unknown font, skipping request", |
"unknown font, skipping request", |
|
"odd number of characters in request", |
|
|
/* related to plain text */ |
/* related to plain text */ |
"blank line in fill mode, using .sp", |
"blank line in fill mode, using .sp", |
Line 171 static const char * const mandocerrs[MANDOCERR_MAX] = |
|
Line 183 static const char * const mandocerrs[MANDOCERR_MAX] = |
|
"invalid escape sequence", |
"invalid escape sequence", |
"undefined string, using \"\"", |
"undefined string, using \"\"", |
|
|
|
/* related to tables */ |
|
"tbl line starts with span", |
|
"tbl column starts with span", |
|
"skipping vertical bar in tbl layout", |
|
|
"generic error", |
"generic error", |
|
|
/* related to equations */ |
|
"unexpected equation scope closure", |
|
"equation scope open on exit", |
|
"overlapping equation scopes", |
|
"unexpected end of equation", |
|
|
|
/* related to tables */ |
/* related to tables */ |
"bad table syntax", |
"non-alphabetic character in tbl options", |
"bad table option", |
"skipping unknown tbl option", |
"bad table layout", |
"missing tbl option argument", |
"no table layout cells specified", |
"wrong tbl option argument size", |
"no table data cells specified", |
"empty tbl layout", |
"ignore data in cell", |
"invalid character in tbl layout", |
"data block still open", |
"unmatched parenthesis in tbl layout", |
"ignoring extra data cells", |
"tbl without any data cells", |
"ignoring macro in table", |
"ignoring data in spanned tbl cell", |
|
"ignoring extra tbl data cells", |
|
"data block open at end of tbl", |
|
|
/* related to document structure and macros */ |
/* related to document structure and macros */ |
NULL, |
NULL, |
"input stack limit exceeded, infinite loop?", |
"input stack limit exceeded, infinite loop?", |
"skipping bad character", |
"skipping bad character", |
"skipping unknown macro", |
"skipping unknown macro", |
|
"skipping insecure request", |
"skipping item outside list", |
"skipping item outside list", |
"skipping column outside column list", |
"skipping column outside column list", |
"skipping end of block that is not open", |
"skipping end of block that is not open", |
|
"fewer RS blocks open, skipping", |
"inserting missing end of block", |
"inserting missing end of block", |
"appending missing end of block", |
"appending missing end of block", |
|
|
/* related to request and macro arguments */ |
/* related to request and macro arguments */ |
"escaped character not allowed in a name", |
"escaped character not allowed in a name", |
"argument count wrong", |
|
"NOT IMPLEMENTED: Bd -file", |
"NOT IMPLEMENTED: Bd -file", |
"missing list type, using -item", |
"missing list type, using -item", |
"missing manual name, using \"\"", |
"missing manual name, using \"\"", |
"uname(3) system call failed, using UNKNOWN", |
"uname(3) system call failed, using UNKNOWN", |
"unknown standard specifier", |
"unknown standard specifier", |
"skipping request without numeric argument", |
"skipping request without numeric argument", |
|
"NOT IMPLEMENTED: .so with absolute path or \"..\"", |
|
".so request failed", |
"skipping all arguments", |
"skipping all arguments", |
"skipping excess arguments", |
"skipping excess arguments", |
"divide by zero", |
"divide by zero", |
|
|
"generic fatal error", |
"unsupported feature", |
|
|
"input too large", |
"input too large", |
"NOT IMPLEMENTED: .so with absolute path or \"..\"", |
"unsupported control character", |
".so request failed", |
"unsupported roff request", |
|
"eqn delim option in tbl", |
|
"unsupported tbl layout modifier", |
|
"ignoring macro in table", |
}; |
}; |
|
|
static const char * const mandoclevels[MANDOCLEVEL_MAX] = { |
static const char * const mandoclevels[MANDOCLEVEL_MAX] = { |
Line 226 static const char * const mandoclevels[MANDOCLEVEL_MAX |
|
Line 244 static const char * const mandoclevels[MANDOCLEVEL_MAX |
|
"RESERVED", |
"RESERVED", |
"WARNING", |
"WARNING", |
"ERROR", |
"ERROR", |
"FATAL", |
"UNSUPP", |
"BADARG", |
"BADARG", |
"SYSERR" |
"SYSERR" |
}; |
}; |
Line 306 mparse_buf_r(struct mparse *curp, struct buf blk, size |
|
Line 324 mparse_buf_r(struct mparse *curp, struct buf blk, size |
|
{ |
{ |
const struct tbl_span *span; |
const struct tbl_span *span; |
struct buf ln; |
struct buf ln; |
|
const char *save_file; |
|
char *cp; |
size_t pos; /* byte number in the ln buffer */ |
size_t pos; /* byte number in the ln buffer */ |
enum rofferr rr; |
enum rofferr rr; |
int of; |
int of; |
int lnn; /* line number in the real file */ |
int lnn; /* line number in the real file */ |
|
int fd; |
|
pid_t save_child; |
unsigned char c; |
unsigned char c; |
|
|
memset(&ln, 0, sizeof(ln)); |
memset(&ln, 0, sizeof(ln)); |
Line 364 mparse_buf_r(struct mparse *curp, struct buf blk, size |
|
Line 386 mparse_buf_r(struct mparse *curp, struct buf blk, size |
|
if (c & 0x80) { |
if (c & 0x80) { |
if ( ! (curp->filenc && preconv_encode( |
if ( ! (curp->filenc && preconv_encode( |
&blk, &i, &ln, &pos, &curp->filenc))) { |
&blk, &i, &ln, &pos, &curp->filenc))) { |
mandoc_vmsg(MANDOCERR_BADCHAR, |
mandoc_vmsg(MANDOCERR_CHAR_BAD, curp, |
curp, curp->line, pos, |
curp->line, pos, "0x%x", c); |
"0x%x", c); |
|
ln.buf[pos++] = '?'; |
ln.buf[pos++] = '?'; |
i++; |
i++; |
} |
} |
Line 378 mparse_buf_r(struct mparse *curp, struct buf blk, size |
|
Line 399 mparse_buf_r(struct mparse *curp, struct buf blk, size |
|
*/ |
*/ |
|
|
if (c == 0x7f || (c < 0x20 && c != 0x09)) { |
if (c == 0x7f || (c < 0x20 && c != 0x09)) { |
mandoc_vmsg(MANDOCERR_BADCHAR, curp, |
mandoc_vmsg(c == 0x00 || c == 0x04 || |
curp->line, pos, "0x%x", c); |
c > 0x0a ? MANDOCERR_CHAR_BAD : |
|
MANDOCERR_CHAR_UNSUPP, |
|
curp, curp->line, pos, "0x%x", c); |
i++; |
i++; |
ln.buf[pos++] = '?'; |
if (c != '\r') |
|
ln.buf[pos++] = '?'; |
continue; |
continue; |
} |
} |
|
|
Line 435 mparse_buf_r(struct mparse *curp, struct buf blk, size |
|
Line 459 mparse_buf_r(struct mparse *curp, struct buf blk, size |
|
|
|
if ( ! (isascii(c) && |
if ( ! (isascii(c) && |
(isgraph(c) || isblank(c)))) { |
(isgraph(c) || isblank(c)))) { |
mandoc_vmsg(MANDOCERR_BADCHAR, curp, |
mandoc_vmsg(MANDOCERR_CHAR_BAD, curp, |
curp->line, pos, "0x%x", c); |
curp->line, pos, "0x%x", c); |
i += 2; |
i += 2; |
ln.buf[pos++] = '?'; |
ln.buf[pos++] = '?'; |
|
|
case ROFF_IGN: |
case ROFF_IGN: |
pos = 0; |
pos = 0; |
continue; |
continue; |
case ROFF_ERR: |
|
assert(MANDOCLEVEL_FATAL <= curp->file_status); |
|
break; |
|
case ROFF_SO: |
case ROFF_SO: |
if ( ! (curp->options & MPARSE_SO) && |
if ( ! (curp->options & MPARSE_SO) && |
(i >= blk.sz || blk.buf[i] == '\0')) { |
(i >= blk.sz || blk.buf[i] == '\0')) { |
|
|
*/ |
*/ |
if (curp->secondary) |
if (curp->secondary) |
curp->secondary->sz -= pos + 1; |
curp->secondary->sz -= pos + 1; |
mparse_readfd(curp, -1, ln.buf + of); |
save_file = curp->file; |
if (MANDOCLEVEL_FATAL <= curp->file_status) { |
save_child = curp->child; |
|
if (mparse_open(curp, &fd, ln.buf + of) == |
|
MANDOCLEVEL_OK) { |
|
mparse_readfd(curp, fd, ln.buf + of); |
|
curp->file = save_file; |
|
} else { |
|
curp->file = save_file; |
mandoc_vmsg(MANDOCERR_SO_FAIL, |
mandoc_vmsg(MANDOCERR_SO_FAIL, |
curp, curp->line, pos, |
curp, curp->line, pos, |
".so %s", ln.buf + of); |
".so %s", ln.buf + of); |
break; |
ln.sz = mandoc_asprintf(&cp, |
|
".sp\nSee the file %s.\n.sp", |
|
ln.buf + of); |
|
free(ln.buf); |
|
ln.buf = cp; |
|
of = 0; |
|
mparse_buf_r(curp, ln, of, 0); |
} |
} |
|
curp->child = save_child; |
pos = 0; |
pos = 0; |
continue; |
continue; |
default: |
default: |
|
|
} |
} |
|
|
/* |
/* |
* If we encounter errors in the recursive parse, make |
|
* sure we don't continue parsing. |
|
*/ |
|
|
|
if (MANDOCLEVEL_FATAL <= curp->file_status) |
|
break; |
|
|
|
/* |
|
* If input parsers have not been allocated, do so now. |
* If input parsers have not been allocated, do so now. |
* We keep these instanced between parsers, but set them |
* We keep these instanced between parsers, but set them |
* locally per parse routine since we can use different |
* locally per parse routine since we can use different |
Line 612 read_whole_file(struct mparse *curp, const char *file, |
|
Line 638 read_whole_file(struct mparse *curp, const char *file, |
|
*/ |
*/ |
|
|
if (S_ISREG(st.st_mode)) { |
if (S_ISREG(st.st_mode)) { |
if (st.st_size >= (1U << 31)) { |
if (st.st_size > 0x7fffffff) { |
curp->file_status = MANDOCLEVEL_FATAL; |
mandoc_msg(MANDOCERR_TOOLARGE, curp, 0, 0, NULL); |
if (curp->mmsg) |
|
(*curp->mmsg)(MANDOCERR_TOOLARGE, |
|
curp->file_status, file, 0, 0, NULL); |
|
return(0); |
return(0); |
} |
} |
*with_mmap = 1; |
*with_mmap = 1; |
Line 639 read_whole_file(struct mparse *curp, const char *file, |
|
Line 662 read_whole_file(struct mparse *curp, const char *file, |
|
for (;;) { |
for (;;) { |
if (off == fb->sz) { |
if (off == fb->sz) { |
if (fb->sz == (1U << 31)) { |
if (fb->sz == (1U << 31)) { |
curp->file_status = MANDOCLEVEL_FATAL; |
mandoc_msg(MANDOCERR_TOOLARGE, curp, |
if (curp->mmsg) |
0, 0, NULL); |
(*curp->mmsg)(MANDOCERR_TOOLARGE, |
|
curp->file_status, |
|
file, 0, 0, NULL); |
|
break; |
break; |
} |
} |
resize_buf(fb, 65536); |
resize_buf(fb, 65536); |
|
|
mparse_end(struct mparse *curp) |
mparse_end(struct mparse *curp) |
{ |
{ |
|
|
if (MANDOCLEVEL_FATAL <= curp->file_status) |
|
return; |
|
|
|
if (curp->mdoc == NULL && |
if (curp->mdoc == NULL && |
curp->man == NULL && |
curp->man == NULL && |
curp->sodest == NULL) { |
curp->sodest == NULL) { |
Line 685 mparse_end(struct mparse *curp) |
|
Line 702 mparse_end(struct mparse *curp) |
|
curp->man = curp->pman; |
curp->man = curp->pman; |
} |
} |
} |
} |
|
if (curp->mdoc) |
if (curp->mdoc && ! mdoc_endparse(curp->mdoc)) { |
mdoc_endparse(curp->mdoc); |
assert(MANDOCLEVEL_FATAL <= curp->file_status); |
if (curp->man) |
return; |
man_endparse(curp->man); |
} |
|
|
|
if (curp->man && ! man_endparse(curp->man)) { |
|
assert(MANDOCLEVEL_FATAL <= curp->file_status); |
|
return; |
|
} |
|
|
|
roff_endparse(curp->roff); |
roff_endparse(curp->roff); |
} |
} |
|
|
Line 732 mparse_parse_buffer(struct mparse *curp, struct buf bl |
|
Line 742 mparse_parse_buffer(struct mparse *curp, struct buf bl |
|
|
|
mparse_buf_r(curp, blk, offset, 1); |
mparse_buf_r(curp, blk, offset, 1); |
|
|
if (0 == --recursion_depth && MANDOCLEVEL_FATAL > curp->file_status) |
if (--recursion_depth == 0) |
mparse_end(curp); |
mparse_end(curp); |
|
|
curp->primary = svprimary; |
curp->primary = svprimary; |
Line 753 mparse_readmem(struct mparse *curp, void *buf, size_t |
|
Line 763 mparse_readmem(struct mparse *curp, void *buf, size_t |
|
} |
} |
|
|
/* |
/* |
* If a file descriptor is given, use it and assume it points |
|
* to the named file. Otherwise, open the named file. |
|
* Read the whole file into memory and call the parsers. |
* Read the whole file into memory and call the parsers. |
* Called recursively when an .so request is encountered. |
* Called recursively when an .so request is encountered. |
*/ |
*/ |
Line 764 mparse_readfd(struct mparse *curp, int fd, const char |
|
Line 772 mparse_readfd(struct mparse *curp, int fd, const char |
|
struct buf blk; |
struct buf blk; |
int with_mmap; |
int with_mmap; |
int save_filenc; |
int save_filenc; |
pid_t save_child; |
|
|
|
save_child = curp->child; |
|
if (fd != -1) |
|
curp->child = 0; |
|
else if (mparse_open(curp, &fd, file) != MANDOCLEVEL_OK) |
|
goto out; |
|
|
|
if (read_whole_file(curp, file, fd, &blk, &with_mmap)) { |
if (read_whole_file(curp, file, fd, &blk, &with_mmap)) { |
save_filenc = curp->filenc; |
save_filenc = curp->filenc; |
curp->filenc = curp->options & |
curp->filenc = curp->options & |
Line 790 mparse_readfd(struct mparse *curp, int fd, const char |
|
Line 791 mparse_readfd(struct mparse *curp, int fd, const char |
|
perror(file); |
perror(file); |
|
|
mparse_wait(curp); |
mparse_wait(curp); |
out: |
|
curp->child = save_child; |
|
return(curp->file_status); |
return(curp->file_status); |
} |
} |
|
|
Line 849 mparse_open(struct mparse *curp, int *fd, const char * |
|
Line 848 mparse_open(struct mparse *curp, int *fd, const char * |
|
perror("dup"); |
perror("dup"); |
exit((int)MANDOCLEVEL_SYSERR); |
exit((int)MANDOCLEVEL_SYSERR); |
} |
} |
|
signal(SIGPIPE, SIG_DFL); |
execlp("gunzip", "gunzip", "-c", file, NULL); |
execlp("gunzip", "gunzip", "-c", file, NULL); |
perror("exec"); |
perror("exec"); |
exit((int)MANDOCLEVEL_SYSERR); |
exit((int)MANDOCLEVEL_SYSERR); |
Line 871 mparse_wait(struct mparse *curp) |
|
Line 871 mparse_wait(struct mparse *curp) |
|
perror("wait"); |
perror("wait"); |
exit((int)MANDOCLEVEL_SYSERR); |
exit((int)MANDOCLEVEL_SYSERR); |
} |
} |
|
curp->child = 0; |
if (WIFSIGNALED(status)) { |
if (WIFSIGNALED(status)) { |
mandoc_vmsg(MANDOCERR_FILE, curp, 0, 0, |
mandoc_vmsg(MANDOCERR_FILE, curp, 0, 0, |
"gunzip died from signal %d", WTERMSIG(status)); |
"gunzip died from signal %d", WTERMSIG(status)); |
Line 890 mparse_alloc(int options, enum mandoclevel wlevel, man |
|
Line 891 mparse_alloc(int options, enum mandoclevel wlevel, man |
|
{ |
{ |
struct mparse *curp; |
struct mparse *curp; |
|
|
assert(wlevel <= MANDOCLEVEL_FATAL); |
|
|
|
curp = mandoc_calloc(1, sizeof(struct mparse)); |
curp = mandoc_calloc(1, sizeof(struct mparse)); |
|
|
curp->options = options; |
curp->options = options; |
Line 988 mandoc_msg(enum mandocerr er, struct mparse *m, |
|
Line 987 mandoc_msg(enum mandocerr er, struct mparse *m, |
|
{ |
{ |
enum mandoclevel level; |
enum mandoclevel level; |
|
|
level = MANDOCLEVEL_FATAL; |
level = MANDOCLEVEL_UNSUPP; |
while (er < mandoclimits[level]) |
while (er < mandoclimits[level]) |
level--; |
level--; |
|
|