version 1.24, 2009/01/21 17:56:32 |
version 1.56, 2009/03/23 14:22:11 |
|
|
/* $Id$ */ |
/* $Id$ */ |
/* |
/* |
* Copyright (c) 2008 Kristaps Dzonsons <kristaps@kth.se> |
* Copyright (c) 2008, 2009 Kristaps Dzonsons <kristaps@openbsd.org> |
* |
* |
* Permission to use, copy, modify, and distribute this software for any |
* Permission to use, copy, modify, and distribute this software for any |
* purpose with or without fee is hereby granted, provided that the |
* purpose with or without fee is hereby granted, provided that the |
|
|
* TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR |
* TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR |
* PERFORMANCE OF THIS SOFTWARE. |
* PERFORMANCE OF THIS SOFTWARE. |
*/ |
*/ |
|
#include <sys/types.h> |
|
|
#include <assert.h> |
#include <assert.h> |
#include <ctype.h> |
#include <ctype.h> |
#include <err.h> |
#include <err.h> |
|
|
#include <stdio.h> |
#include <stdio.h> |
#include <string.h> |
#include <string.h> |
|
|
#include "private.h" |
#include "libmdoc.h" |
|
|
/* |
/* |
* Parse arguments and parameters of macros. Arguments follow the |
* Routines to parse arguments of macros. Arguments follow the syntax |
* syntax of `-arg [val [valN...]]', while parameters are free-form text |
* of `-arg [val [valN...]]'. Arguments come in all types: quoted |
* following arguments (if any). This file must correctly handle the |
* arguments, multiple arguments per value, no-value arguments, etc. |
* strange punctuation rules dictated by groff. |
* |
|
* There's no limit to the number of arguments that may be allocated. |
*/ |
*/ |
|
|
#define ARGS_QUOTED (1 << 0) |
#define ARGS_QUOTED (1 << 0) |
#define ARGS_DELIM (1 << 1) |
#define ARGS_DELIM (1 << 1) |
#define ARGS_TABSEP (1 << 2) |
#define ARGS_TABSEP (1 << 2) |
|
#define ARGS_ARGVLIKE (1 << 3) |
|
|
static int lookup(int, const char *); |
#define ARGV_NONE (1 << 0) |
static int parse(struct mdoc *, int, |
#define ARGV_SINGLE (1 << 1) |
struct mdoc_arg *, int *, char *); |
#define ARGV_MULTI (1 << 2) |
static int parse_single(struct mdoc *, int, |
#define ARGV_OPT_SINGLE (1 << 3) |
struct mdoc_arg *, int *, char *); |
|
static int parse_multi(struct mdoc *, int, |
|
struct mdoc_arg *, int *, char *); |
|
static int postparse(struct mdoc *, int, |
|
const struct mdoc_arg *, int); |
|
static int pwarn(struct mdoc *, int, int, int); |
|
|
|
#define WQUOTPARM (0) |
#define MULTI_STEP 5 |
#define WARGVPARM (1) |
|
|
|
|
/*
 * Warning codes accepted by pwarn(), which maps each code to a message
 * string and a warning class before reporting it.
 */
enum mwarn { |

/* "unexpected quoted parameter" */
WQUOTPARM, |

/* "argument-like parameter" */
WARGVPARM, |

/* "last list column is empty" */
WCOLEMPTY, |

/* "trailing whitespace" */
WTAILWS |

}; |
|
|
|
/*
 * Error codes accepted by perr(), which maps each code to a message
 * string before reporting it.
 */
enum merr { |

/* "unterminated quoted parameter" */
EQUOTTERM, |

/* "argument requires a value" */
EARGVAL |

}; |
|
|
|
static int argv_a2arg(int, const char *); |
|
static int args(struct mdoc *, int, int *, |
|
char *, int, char **); |
|
static int argv(struct mdoc *, int, |
|
struct mdoc_argv *, int *, char *); |
|
static int argv_single(struct mdoc *, int, |
|
struct mdoc_argv *, int *, char *); |
|
static int argv_opt_single(struct mdoc *, int, |
|
struct mdoc_argv *, int *, char *); |
|
static int argv_multi(struct mdoc *, int, |
|
struct mdoc_argv *, int *, char *); |
|
static int pwarn(struct mdoc *, int, int, enum mwarn); |
|
static int perr(struct mdoc *, int, int, enum merr); |
|
|
|
/* Per-argument flags. */ |
|
|
|
/*
 * Value-arity table, one ARGV_* flag per argument identifier.  argv()
 * indexes this table by the argument identifier to choose between the
 * no-value, single-value, optional-single-value and multi-value
 * parsers.  The trailing comment on each entry names the identifier
 * that the slot is meant to correspond to.
 */
static int mdoc_argvflags[MDOC_ARG_MAX] = { |

ARGV_NONE, /* MDOC_Split */ |

ARGV_NONE, /* MDOC_Nosplit */ |

ARGV_NONE, /* MDOC_Ragged */ |

ARGV_NONE, /* MDOC_Unfilled */ |

ARGV_NONE, /* MDOC_Literal */ |

ARGV_NONE, /* MDOC_File */ |

ARGV_SINGLE, /* MDOC_Offset */ |

ARGV_NONE, /* MDOC_Bullet */ |

ARGV_NONE, /* MDOC_Dash */ |

ARGV_NONE, /* MDOC_Hyphen */ |

ARGV_NONE, /* MDOC_Item */ |

ARGV_NONE, /* MDOC_Enum */ |

ARGV_NONE, /* MDOC_Tag */ |

ARGV_NONE, /* MDOC_Diag */ |

ARGV_NONE, /* MDOC_Hang */ |

ARGV_NONE, /* MDOC_Ohang */ |

ARGV_NONE, /* MDOC_Inset */ |

ARGV_MULTI, /* MDOC_Column */ |

ARGV_SINGLE, /* MDOC_Width */ |

ARGV_NONE, /* MDOC_Compact */ |

ARGV_OPT_SINGLE, /* MDOC_Std */ |

ARGV_NONE, /* MDOC_Filled */ |

ARGV_NONE, /* MDOC_Words */ |

ARGV_NONE, /* MDOC_Emphasis */ |

ARGV_NONE, /* MDOC_Symbolic */ |

ARGV_NONE /* MDOC_Nested? -- label previously duplicated "MDOC_Symbolic"; TODO confirm against the MDOC_* definitions */ |

}; |
|
|
static int mdoc_argflags[MDOC_MAX] = { |
static int mdoc_argflags[MDOC_MAX] = { |
0, /* \" */ |
0, /* \" */ |
0, /* Dd */ |
0, /* Dd */ |
Line 64 static int mdoc_argflags[MDOC_MAX] = { |
|
Line 118 static int mdoc_argflags[MDOC_MAX] = { |
|
0, /* Ed */ |
0, /* Ed */ |
0, /* Bl */ |
0, /* Bl */ |
0, /* El */ |
0, /* El */ |
ARGS_DELIM, /* It */ |
0, /* It */ |
ARGS_DELIM, /* Ad */ |
ARGS_DELIM, /* Ad */ |
ARGS_DELIM, /* An */ |
ARGS_DELIM, /* An */ |
ARGS_DELIM, /* Ar */ |
ARGS_DELIM, /* Ar */ |
Line 88 static int mdoc_argflags[MDOC_MAX] = { |
|
Line 142 static int mdoc_argflags[MDOC_MAX] = { |
|
0, /* Ot */ |
0, /* Ot */ |
ARGS_DELIM, /* Pa */ |
ARGS_DELIM, /* Pa */ |
0, /* Rv */ |
0, /* Rv */ |
ARGS_DELIM, /* St */ |
ARGS_DELIM | ARGS_ARGVLIKE, /* St */ |
ARGS_DELIM, /* Va */ |
ARGS_DELIM, /* Va */ |
ARGS_DELIM, /* Vt */ |
ARGS_DELIM, /* Vt */ |
ARGS_DELIM, /* Xr */ |
ARGS_DELIM, /* Xr */ |
Line 157 static int mdoc_argflags[MDOC_MAX] = { |
|
Line 211 static int mdoc_argflags[MDOC_MAX] = { |
|
0, /* Hf */ |
0, /* Hf */ |
0, /* Fr */ |
0, /* Fr */ |
0, /* Ud */ |
0, /* Ud */ |
|
0, /* Lb */ |
|
0, /* Ap */ |
|
ARGS_DELIM, /* Lp */ |
|
ARGS_DELIM | ARGS_QUOTED, /* Lk */ |
|
ARGS_DELIM | ARGS_QUOTED, /* Mt */ |
|
ARGS_DELIM, /* Brq */ |
|
0, /* Bro */ |
|
ARGS_DELIM, /* Brc */ |
|
ARGS_QUOTED, /* %C */ |
|
0, /* Es */ |
|
0, /* En */ |
|
0, /* Dx */ |
|
ARGS_QUOTED, /* %Q */ |
}; |
}; |
|
|
|
|
|
/* |
|
* Parse an argument from line text. This comes in the form of -key |
|
* [value0...], which may either have a single mandatory value, at least |
|
* one mandatory value, an optional single value, or no value. |
|
*/ |
|
/*
 * Try to parse one `-key [value...]' argument of macro `tok' starting
 * at buf[*pos], appending it to the argument list *v.
 *
 * Returns:
 *   ARGV_EOLN   buf[*pos] is the terminating NUL;
 *   ARGV_WORD   the text does not start with `-', the macro is flagged
 *               ARGS_ARGVLIKE, or the key is not accepted for `tok';
 *   ARGV_ERROR  a warning callback or the value parser reported failure;
 *   ARGV_ARG    an argument was parsed and stored in *v.
 *
 * *v may be NULL on entry, in which case it is allocated here.  buf is
 * modified in place: the key is NUL-terminated.
 */
int |

mdoc_argv(struct mdoc *mdoc, int line, int tok, |

struct mdoc_arg **v, int *pos, char *buf) |

{ |

int i; |

char *p, sv; |

struct mdoc_argv tmp; |

struct mdoc_arg *arg; |



if (0 == buf[*pos]) |

return(ARGV_EOLN); |



/* The caller is expected to have skipped leading spaces already. */
assert(' ' != buf[*pos]); |



if ('-' != buf[*pos] || ARGS_ARGVLIKE & mdoc_argflags[tok]) |

return(ARGV_WORD); |



/* Parse through to the first unescaped space. */ |



/* i remembers the position of the dash for diagnostics; p is the key. */
i = *pos; |

p = &buf[++(*pos)]; |



/* Guarantees that the buf[*pos - 1] look-behind below stays in bounds. */
assert(*pos > 0); |



/* LINTED */ |

while (buf[*pos]) { |

if (' ' == buf[*pos]) |

if ('\\' != buf[*pos - 1]) |

break; |

(*pos)++; |

} |



/* XXX - save zeroed byte, if not an argument. */ |



/*
 * Terminate the key in place.  sv keeps the overwritten byte (0 if the
 * key ran to end of line) so it can be put back if the lookup fails.
 */
sv = 0; |

if (buf[*pos]) { |

sv = buf[*pos]; |

buf[(*pos)++] = 0; |

} |



(void)memset(&tmp, 0, sizeof(struct mdoc_argv)); |

tmp.line = line; |

/* Recorded after the key (and its terminator, if any) was consumed. */
tmp.pos = *pos; |



/* See if our token accepts the argument. */ |



if (MDOC_ARG_MAX == (tmp.arg = argv_a2arg(tok, p))) { |

/* XXX - restore saved zeroed byte. */ |

if (sv) |

buf[*pos - 1] = sv; |

if ( ! pwarn(mdoc, line, i, WARGVPARM)) |

return(ARGV_ERROR); |

/*
 * Note that *pos is not rewound here: it is left past the
 * rejected word.  Presumably the caller restores its own
 * saved position on ARGV_WORD -- verify against callers.
 */
return(ARGV_WORD); |

} |



/* Skip the spaces separating the key from its value(s). */
while (buf[*pos] && ' ' == buf[*pos]) |

(*pos)++; |



/* Parse the value(s) according to the argument's arity. */
if ( ! argv(mdoc, line, &tmp, pos, buf)) |

return(ARGV_ERROR); |



/* Lazily create the argument list on the first parsed argument. */
if (NULL == (arg = *v)) { |

if (NULL == (*v = calloc(1, sizeof(struct mdoc_arg)))) |

err(1, "calloc"); |

arg = *v; |

} |



/* Grow the array by one slot and copy the parsed argument into it. */
arg->argc++; |

arg->argv = xrealloc(arg->argv, arg->argc * |

sizeof(struct mdoc_argv)); |



(void)memcpy(&arg->argv[(int)arg->argc - 1], |

&tmp, sizeof(struct mdoc_argv)); |



return(ARGV_ARG); |

} |
|
|
|
|
|
/*
 * Drop one reference to the argument list `p' and free it once no
 * references remain.  A NULL `p' is ignored.  When released, every
 * value string, every per-argument value array, the argument array
 * and the list itself are freed.
 */
void |

mdoc_argv_free(struct mdoc_arg *p) |

{ |

int i, j; |



if (NULL == p) |

return; |



/*
 * A non-zero count is decremented and the list kept alive while it
 * stays non-zero.  A count that is already zero on entry falls
 * through and is freed immediately.
 */
if (p->refcnt) { |

--(p->refcnt); |

if (p->refcnt) |

return; |

} |



/* A list being released is required to hold at least one argument. */
assert(p->argc); |



/* LINTED */ |

for (i = 0; i < (int)p->argc; i++) { |

/* Arguments without values own no storage. */
if (0 == p->argv[i].sz) |

continue; |

/* LINTED */ |

for (j = 0; j < (int)p->argv[i].sz; j++) |

free(p->argv[i].value[j]); |



free(p->argv[i].value); |

} |



free(p->argv); |

free(p); |

} |
|
|
|
|
|
|
static int |
static int |
pwarn(struct mdoc *mdoc, int line, int pos, int code) |
perr(struct mdoc *mdoc, int line, int pos, enum merr code) |
{ |
{ |
|
char *p; |
|
|
|
p = NULL; |
|
|
|
switch (code) { |
|
case (EQUOTTERM): |
|
p = "unterminated quoted parameter"; |
|
break; |
|
case (EARGVAL): |
|
p = "argument requires a value"; |
|
break; |
|
} |
|
|
|
assert(p); |
|
return(mdoc_perr(mdoc, line, pos, p)); |
|
} |
|
|
|
|
|
static int |
|
pwarn(struct mdoc *mdoc, int line, int pos, enum mwarn code) |
|
{ |
|
char *p; |
int c; |
int c; |
|
|
|
p = NULL; |
|
c = WARN_SYNTAX; |
|
|
switch (code) { |
switch (code) { |
case (WQUOTPARM): |
case (WQUOTPARM): |
c = mdoc_pwarn(mdoc, line, pos, WARN_SYNTAX, |
p = "unexpected quoted parameter"; |
"unexpected quoted parameter"); |
|
break; |
break; |
case (WARGVPARM): |
case (WARGVPARM): |
c = mdoc_pwarn(mdoc, line, pos, WARN_SYNTAX, |
p = "argument-like parameter"; |
"argument-like parameter"); |
|
break; |
break; |
default: |
case (WCOLEMPTY): |
abort(); |
p = "last list column is empty"; |
/* NOTREACHED */ |
c = WARN_COMPAT; |
|
break; |
|
case (WTAILWS): |
|
p = "trailing whitespace"; |
|
c = WARN_COMPAT; |
|
break; |
} |
} |
return(c); |
|
|
assert(p); |
|
return(mdoc_pwarn(mdoc, line, pos, c, p)); |
} |
} |
|
|
|
|
|
|
mdoc_args(struct mdoc *mdoc, int line, |
mdoc_args(struct mdoc *mdoc, int line, |
int *pos, char *buf, int tok, char **v) |
int *pos, char *buf, int tok, char **v) |
{ |
{ |
int i, c, fl; |
int fl, c, i; |
char *p, *pp; |
|
struct mdoc_node *n; |
struct mdoc_node *n; |
|
|
|
fl = (0 == tok) ? 0 : mdoc_argflags[tok]; |
|
|
|
/* |
|
* Override per-macro argument flags with context-specific ones. |
|
* As of now, this is only valid for `It' depending on its list |
|
* context. |
|
*/ |
|
|
|
switch (tok) { |
|
case (MDOC_It): |
|
for (n = mdoc->last; n; n = n->parent) |
|
if (MDOC_BLOCK == n->type && MDOC_Bl == n->tok) |
|
break; |
|
|
|
assert(n); |
|
c = (int)(n->args ? n->args->argc : 0); |
|
assert(c > 0); |
|
|
|
/* |
|
* Using `Bl -column' adds ARGS_TABSEP to the arguments |
|
* and invalidates ARGS_DELIM. Using `Bl -diag' allows |
|
* for quoted arguments. |
|
*/ |
|
|
|
/* LINTED */ |
|
for (i = 0; i < c; i++) { |
|
switch (n->args->argv[i].arg) { |
|
case (MDOC_Column): |
|
fl |= ARGS_TABSEP; |
|
fl &= ~ARGS_DELIM; |
|
i = c; |
|
break; |
|
case (MDOC_Diag): |
|
fl |= ARGS_QUOTED; |
|
i = c; |
|
break; |
|
default: |
|
break; |
|
} |
|
} |
|
break; |
|
default: |
|
break; |
|
} |
|
|
|
return(args(mdoc, line, pos, buf, fl, v)); |
|
} |
|
|
|
|
|
static int |
|
args(struct mdoc *mdoc, int line, |
|
int *pos, char *buf, int fl, char **v) |
|
{ |
|
int i; |
|
char *p, *pp; |
|
|
assert(*pos > 0); |
assert(*pos > 0); |
|
|
if (0 == buf[*pos]) |
if (0 == buf[*pos]) |
return(ARGS_EOLN); |
return(ARGS_EOLN); |
|
|
fl = (0 == tok) ? 0 : mdoc_argflags[tok]; |
|
|
|
if ('\"' == buf[*pos] && ! (fl & ARGS_QUOTED)) |
if ('\"' == buf[*pos] && ! (fl & ARGS_QUOTED)) |
if ( ! pwarn(mdoc, line, *pos, WQUOTPARM)) |
if ( ! pwarn(mdoc, line, *pos, WQUOTPARM)) |
return(ARGS_ERROR); |
return(ARGS_ERROR); |
|
|
if ('-' == buf[*pos]) |
if ( ! (fl & ARGS_ARGVLIKE) && '-' == buf[*pos]) |
if ( ! pwarn(mdoc, line, *pos, WARGVPARM)) |
if ( ! pwarn(mdoc, line, *pos, WARGVPARM)) |
return(ARGS_ERROR); |
return(ARGS_ERROR); |
|
|
/* |
/* |
* First see if we should use TABSEP (Bl -column). This |
|
* invalidates the use of ARGS_DELIM. |
|
*/ |
|
|
|
if (MDOC_It == tok) { |
|
for (n = mdoc->last; n; n = n->parent) |
|
if (MDOC_BLOCK == n->type) |
|
if (MDOC_Bl == n->tok) |
|
break; |
|
assert(n); |
|
c = (int)n->data.block.argc; |
|
assert(c > 0); |
|
for (i = 0; i < c; i++) { |
|
if (MDOC_Column != n->data.block.argv[i].arg) |
|
continue; |
|
fl |= ARGS_TABSEP; |
|
fl &= ~ARGS_DELIM; |
|
} |
|
} |
|
|
|
/* |
|
* If the first character is a delimiter and we're to look for |
* If the first character is a delimiter and we're to look for |
* delimited strings, then pass down the buffer seeing if it |
* delimited strings, then pass down the buffer seeing if it |
* follows the pattern of [[::delim::][ ]+]+. |
* follows the pattern of [[::delim::][ ]+]+. |
*/ |
*/ |
|
|
if ((fl & ARGS_DELIM) && mdoc_iscdelim(buf[*pos])) { |
if ((fl & ARGS_DELIM) && mdoc_iscdelim(buf[*pos])) { |
for (i = *pos; (c = buf[i]); ) { |
for (i = *pos; buf[i]; ) { |
if ( ! mdoc_iscdelim(c)) |
if ( ! mdoc_iscdelim(buf[i])) |
break; |
break; |
i++; |
i++; |
if (0 == buf[i] || ! isspace(c)) |
/* There must be at least one space... */ |
|
if (0 == buf[i] || ' ' != buf[i]) |
break; |
break; |
i++; |
i++; |
while (buf[i] && isspace(c)) |
while (buf[i] && ' ' == buf[i]) |
i++; |
i++; |
} |
} |
if (0 == buf[i]) { |
if (0 == buf[i]) { |
Line 256 mdoc_args(struct mdoc *mdoc, int line, |
|
Line 502 mdoc_args(struct mdoc *mdoc, int line, |
|
|
|
/* |
/* |
* Thar be dragons here! If we're tab-separated, search |
* Thar be dragons here! If we're tab-separated, search |
* ahead for either a tab or the `Ta' macro. If a tab |
* ahead for either a tab or the `Ta' macro. |
* is detected, it mustn't be escaped; if a `Ta' is |
* If a `Ta' is detected, it must be space-buffered before and |
* detected, it must be space-buffered before and after. |
* after. If either of these hold true, then prune out the |
* If either of these hold true, then prune out the |
|
* extra spaces and call it an argument. |
* extra spaces and call it an argument. |
*/ |
*/ |
|
|
if (ARGS_TABSEP & fl) { |
if (ARGS_TABSEP & fl) { |
/* Scan ahead to unescaped tab. */ |
/* Scan ahead to unescaped tab. */ |
|
|
for (p = *v; ; p++) { |
p = strchr(*v, '\t'); |
if (NULL == (p = strchr(p, '\t'))) |
|
break; |
|
if (p == *v) |
|
break; |
|
if ('\\' != *(p - 1)) |
|
break; |
|
} |
|
|
|
/* Scan ahead to unescaped `Ta'. */ |
/* Scan ahead to unescaped `Ta'. */ |
|
|
Line 318 mdoc_args(struct mdoc *mdoc, int line, |
|
Line 556 mdoc_args(struct mdoc *mdoc, int line, |
|
p++; |
p++; |
if (0 != *p) |
if (0 != *p) |
*(p - 1) = 0; |
*(p - 1) = 0; |
else if (0 == *p) |
*pos += (int)(p - *v); |
if ( ! mdoc_pwarn(mdoc, line, *pos, WARN_SYNTAX, "empty final token")) /* FIXME: verbiage */ |
|
return(0); |
|
*pos += p - *v; |
|
} |
} |
|
|
/* Configure the eoln case, too. */ |
if (p && 0 == *p) |
|
if ( ! pwarn(mdoc, line, *pos, WCOLEMPTY)) |
|
return(0); |
|
if (p && 0 == *p && p > *v && ' ' == *(p - 1)) |
|
if ( ! pwarn(mdoc, line, *pos, WTAILWS)) |
|
return(0); |
|
|
if (NULL == p) { |
if (p) |
p = strchr(*v, 0); |
return(ARGS_PHRASE); |
assert(p); |
|
|
|
/*if (p > *v && ' ' == *(p - 1)) |
/* Configure the eoln case, too. */ |
Warn about whitespace. */ |
|
|
|
*pos += p - *v; |
p = strchr(*v, 0); |
} |
assert(p); |
|
|
return(ARGS_WORD); |
if (p > *v && ' ' == *(p - 1)) |
} |
if ( ! pwarn(mdoc, line, *pos, WTAILWS)) |
|
return(0); |
|
*pos += (int)(p - *v); |
|
|
|
return(ARGS_PHRASE); |
|
} |
|
|
/* Do non-tabsep look-ahead here. */ |
/* Do non-tabsep look-ahead here. */ |
|
|
if ( ! (ARGS_TABSEP & fl)) |
if ( ! (ARGS_TABSEP & fl)) |
while ((c = buf[*pos])) { |
while (buf[*pos]) { |
if (isspace(c)) |
if (' ' == buf[*pos]) |
if ('\\' != buf[*pos - 1]) |
if ('\\' != buf[*pos - 1]) |
break; |
break; |
(*pos)++; |
(*pos)++; |
Line 358 mdoc_args(struct mdoc *mdoc, int line, |
|
Line 601 mdoc_args(struct mdoc *mdoc, int line, |
|
return(ARGS_WORD); |
return(ARGS_WORD); |
|
|
if ( ! (ARGS_TABSEP & fl)) |
if ( ! (ARGS_TABSEP & fl)) |
while (buf[*pos] && isspace((int)buf[*pos])) |
while (buf[*pos] && ' ' == buf[*pos]) |
(*pos)++; |
(*pos)++; |
|
|
if (buf[*pos]) |
if (buf[*pos]) |
return(ARGS_WORD); |
return(ARGS_WORD); |
|
|
if ( ! mdoc_pwarn(mdoc, line, *pos, WARN_COMPAT, "whitespace at end-of-line")) |
if ( ! pwarn(mdoc, line, *pos, WTAILWS)) |
return(ARGS_ERROR); |
return(ARGS_ERROR); |
|
|
return(ARGS_WORD); |
return(ARGS_WORD); |
Line 382 mdoc_args(struct mdoc *mdoc, int line, |
|
Line 625 mdoc_args(struct mdoc *mdoc, int line, |
|
(*pos)++; |
(*pos)++; |
|
|
if (0 == buf[*pos]) { |
if (0 == buf[*pos]) { |
(void)mdoc_perr(mdoc, line, *pos, "unterminated quoted parameter"); |
(void)perr(mdoc, line, *pos, EQUOTTERM); |
return(ARGS_ERROR); |
return(ARGS_ERROR); |
} |
} |
|
|
Line 390 mdoc_args(struct mdoc *mdoc, int line, |
|
Line 633 mdoc_args(struct mdoc *mdoc, int line, |
|
if (0 == buf[*pos]) |
if (0 == buf[*pos]) |
return(ARGS_QWORD); |
return(ARGS_QWORD); |
|
|
while (buf[*pos] && isspace((int)buf[*pos])) |
while (buf[*pos] && ' ' == buf[*pos]) |
(*pos)++; |
(*pos)++; |
|
|
if (buf[*pos]) |
if (buf[*pos]) |
return(ARGS_QWORD); |
return(ARGS_QWORD); |
|
|
if ( ! mdoc_pwarn(mdoc, line, *pos, WARN_COMPAT, "whitespace at end-of-line")) |
if ( ! pwarn(mdoc, line, *pos, WTAILWS)) |
return(ARGS_ERROR); |
return(ARGS_ERROR); |
|
|
return(ARGS_QWORD); |
return(ARGS_QWORD); |
Line 404 mdoc_args(struct mdoc *mdoc, int line, |
|
Line 647 mdoc_args(struct mdoc *mdoc, int line, |
|
|
|
|
|
static int |
static int |
lookup(int tok, const char *argv) |
argv_a2arg(int tok, const char *argv) |
{ |
{ |
|
|
|
/* |
|
* Parse an argument identifier from its text. XXX - this |
|
* should really be table-driven to clarify the code. |
|
* |
|
* If you add an argument to the list, make sure that you |
|
* register it here with its one or more macros! |
|
*/ |
|
|
switch (tok) { |
switch (tok) { |
case (MDOC_An): |
case (MDOC_An): |
if (xstrcmp(argv, "split")) |
if (xstrcmp(argv, "split")) |
Line 428 lookup(int tok, const char *argv) |
|
Line 679 lookup(int tok, const char *argv) |
|
return(MDOC_File); |
return(MDOC_File); |
else if (xstrcmp(argv, "offset")) |
else if (xstrcmp(argv, "offset")) |
return(MDOC_Offset); |
return(MDOC_Offset); |
|
else if (xstrcmp(argv, "compact")) |
|
return(MDOC_Compact); |
break; |
break; |
|
|
case (MDOC_Bf): |
case (MDOC_Bf): |
Line 473 lookup(int tok, const char *argv) |
|
Line 726 lookup(int tok, const char *argv) |
|
return(MDOC_Offset); |
return(MDOC_Offset); |
else if (xstrcmp(argv, "compact")) |
else if (xstrcmp(argv, "compact")) |
return(MDOC_Compact); |
return(MDOC_Compact); |
|
else if (xstrcmp(argv, "nested")) |
|
return(MDOC_Nested); |
break; |
break; |
|
|
case (MDOC_Rv): |
case (MDOC_Rv): |
Line 481 lookup(int tok, const char *argv) |
|
Line 736 lookup(int tok, const char *argv) |
|
if (xstrcmp(argv, "std")) |
if (xstrcmp(argv, "std")) |
return(MDOC_Std); |
return(MDOC_Std); |
break; |
break; |
|
|
case (MDOC_St): |
|
if (xstrcmp(argv, "p1003.1-88")) |
|
return(MDOC_p1003_1_88); |
|
else if (xstrcmp(argv, "p1003.1-90")) |
|
return(MDOC_p1003_1_90); |
|
else if (xstrcmp(argv, "p1003.1-96")) |
|
return(MDOC_p1003_1_96); |
|
else if (xstrcmp(argv, "p1003.1-2001")) |
|
return(MDOC_p1003_1_2001); |
|
else if (xstrcmp(argv, "p1003.1-2004")) |
|
return(MDOC_p1003_1_2004); |
|
else if (xstrcmp(argv, "p1003.1")) |
|
return(MDOC_p1003_1); |
|
else if (xstrcmp(argv, "p1003.1b")) |
|
return(MDOC_p1003_1b); |
|
else if (xstrcmp(argv, "p1003.1b-93")) |
|
return(MDOC_p1003_1b_93); |
|
else if (xstrcmp(argv, "p1003.1c-95")) |
|
return(MDOC_p1003_1c_95); |
|
else if (xstrcmp(argv, "p1003.1g-2000")) |
|
return(MDOC_p1003_1g_2000); |
|
else if (xstrcmp(argv, "p1003.2-92")) |
|
return(MDOC_p1003_2_92); |
|
else if (xstrcmp(argv, "p1003.2-95")) |
|
return(MDOC_p1387_2_95); |
|
else if (xstrcmp(argv, "p1003.2")) |
|
return(MDOC_p1003_2); |
|
else if (xstrcmp(argv, "p1387.2-95")) |
|
return(MDOC_p1387_2); |
|
else if (xstrcmp(argv, "isoC-90")) |
|
return(MDOC_isoC_90); |
|
else if (xstrcmp(argv, "isoC-amd1")) |
|
return(MDOC_isoC_amd1); |
|
else if (xstrcmp(argv, "isoC-tcor1")) |
|
return(MDOC_isoC_tcor1); |
|
else if (xstrcmp(argv, "isoC-tcor2")) |
|
return(MDOC_isoC_tcor2); |
|
else if (xstrcmp(argv, "isoC-99")) |
|
return(MDOC_isoC_99); |
|
else if (xstrcmp(argv, "ansiC")) |
|
return(MDOC_ansiC); |
|
else if (xstrcmp(argv, "ansiC-89")) |
|
return(MDOC_ansiC_89); |
|
else if (xstrcmp(argv, "ansiC-99")) |
|
return(MDOC_ansiC_99); |
|
else if (xstrcmp(argv, "ieee754")) |
|
return(MDOC_ieee754); |
|
else if (xstrcmp(argv, "iso8802-3")) |
|
return(MDOC_iso8802_3); |
|
else if (xstrcmp(argv, "xpg3")) |
|
return(MDOC_xpg3); |
|
else if (xstrcmp(argv, "xpg4")) |
|
return(MDOC_xpg4); |
|
else if (xstrcmp(argv, "xpg4.2")) |
|
return(MDOC_xpg4_2); |
|
else if (xstrcmp(argv, "xpg4.3")) |
|
return(MDOC_xpg4_3); |
|
else if (xstrcmp(argv, "xbd5")) |
|
return(MDOC_xbd5); |
|
else if (xstrcmp(argv, "xcu5")) |
|
return(MDOC_xcu5); |
|
else if (xstrcmp(argv, "xsh5")) |
|
return(MDOC_xsh5); |
|
else if (xstrcmp(argv, "xns5")) |
|
return(MDOC_xns5); |
|
else if (xstrcmp(argv, "xns5.2d2.0")) |
|
return(MDOC_xns5_2d2_0); |
|
else if (xstrcmp(argv, "xcurses4.2")) |
|
return(MDOC_xcurses4_2); |
|
else if (xstrcmp(argv, "susv2")) |
|
return(MDOC_susv2); |
|
else if (xstrcmp(argv, "susv3")) |
|
return(MDOC_susv3); |
|
else if (xstrcmp(argv, "svid4")) |
|
return(MDOC_svid4); |
|
break; |
|
|
|
default: |
default: |
break; |
break; |
} |
} |
Line 568 lookup(int tok, const char *argv) |
|
Line 745 lookup(int tok, const char *argv) |
|
|
|
|
|
static int |
static int |
postparse(struct mdoc *mdoc, int line, const struct mdoc_arg *v, int pos) |
argv_multi(struct mdoc *mdoc, int line, |
|
struct mdoc_argv *v, int *pos, char *buf) |
{ |
{ |
|
int c, ppos; |
|
char *p; |
|
|
switch (v->arg) { |
ppos = *pos; |
case (MDOC_Offset): |
|
assert(v->value); |
for (v->sz = 0; ; v->sz++) { |
assert(v->value[0]); |
if ('-' == buf[*pos]) |
if (xstrcmp(v->value[0], "left")) |
|
break; |
break; |
if (xstrcmp(v->value[0], "right")) |
c = args(mdoc, line, pos, buf, ARGS_QUOTED, &p); |
|
if (ARGS_ERROR == c) |
|
return(0); |
|
else if (ARGS_EOLN == c) |
break; |
break; |
if (xstrcmp(v->value[0], "center")) |
|
break; |
if (0 == v->sz % MULTI_STEP) |
if (xstrcmp(v->value[0], "indent")) |
v->value = xrealloc(v->value, |
break; |
(v->sz + MULTI_STEP) * sizeof(char *)); |
if (xstrcmp(v->value[0], "indent-two")) |
|
break; |
v->value[(int)v->sz] = xstrdup(p); |
return(mdoc_perr(mdoc, line, pos, "invalid offset value")); |
|
default: |
|
break; |
|
} |
} |
|
|
return(1); |
if (v->sz) |
|
return(1); |
|
|
|
return(perr(mdoc, line, ppos, EARGVAL)); |
} |
} |
|
|
|
|
static int |
static int |
parse_multi(struct mdoc *mdoc, int line, |
argv_opt_single(struct mdoc *mdoc, int line, |
struct mdoc_arg *v, int *pos, char *buf) |
struct mdoc_argv *v, int *pos, char *buf) |
{ |
{ |
int c, ppos; |
int c; |
char *p; |
char *p; |
|
|
v->sz = 0; |
if ('-' == buf[*pos]) |
v->value = xcalloc(MDOC_LINEARG_MAX, sizeof(char *)); |
return(1); |
|
|
ppos = *pos; |
c = args(mdoc, line, pos, buf, ARGS_QUOTED, &p); |
|
if (ARGS_ERROR == c) |
for (v->sz = 0; v->sz < MDOC_LINEARG_MAX; v->sz++) { |
return(0); |
if ('-' == buf[*pos]) |
if (ARGS_EOLN == c) |
break; |
|
c = mdoc_args(mdoc, line, pos, buf, ARGS_QUOTED, &p); |
|
if (ARGS_ERROR == c) { |
|
free(v->value); |
|
return(0); |
|
} else if (ARGS_EOLN == c) |
|
break; |
|
v->value[v->sz] = p; |
|
} |
|
|
|
if (0 < v->sz && v->sz < MDOC_LINEARG_MAX) |
|
return(1); |
return(1); |
|
|
free(v->value); |
v->sz = 1; |
return(mdoc_perr(mdoc, line, ppos, 0 == v->sz ? |
if (NULL == (v->value = calloc(1, sizeof(char *)))) |
"argument requires a value" : |
err(1, "calloc"); |
"too many values to argument")); |
if (NULL == (v->value[0] = strdup(p))) |
|
err(1, "strdup"); |
|
return(1); |
} |
} |
|
|
|
|
|
/* |
|
* Parse a single, mandatory value from the stream. |
|
*/ |
static int |
static int |
parse_single(struct mdoc *mdoc, int line, |
argv_single(struct mdoc *mdoc, int line, |
struct mdoc_arg *v, int *pos, char *buf) |
struct mdoc_argv *v, int *pos, char *buf) |
{ |
{ |
int c, ppos; |
int c, ppos; |
char *p; |
char *p; |
|
|
ppos = *pos; |
ppos = *pos; |
|
|
c = mdoc_args(mdoc, line, pos, buf, ARGS_QUOTED, &p); |
c = args(mdoc, line, pos, buf, ARGS_QUOTED, &p); |
if (ARGS_ERROR == c) |
if (ARGS_ERROR == c) |
return(0); |
return(0); |
if (ARGS_EOLN == c) |
if (ARGS_EOLN == c) |
return(mdoc_perr(mdoc, line, ppos, "argument requires a value")); |
return(perr(mdoc, line, ppos, EARGVAL)); |
|
|
v->sz = 1; |
v->sz = 1; |
v->value = xcalloc(1, sizeof(char *)); |
if (NULL == (v->value = calloc(1, sizeof(char *)))) |
v->value[0] = p; |
err(1, "calloc"); |
|
if (NULL == (v->value[0] = strdup(p))) |
|
err(1, "strdup"); |
return(1); |
return(1); |
} |
} |
|
|
|
|
|
/* |
|
* Determine rules for parsing arguments. Arguments can either accept |
|
* no parameters, an optional single parameter, one parameter, or |
|
* multiple parameters. |
|
*/ |
static int |
static int |
parse(struct mdoc *mdoc, int line, |
argv(struct mdoc *mdoc, int line, |
struct mdoc_arg *v, int *pos, char *buf) |
struct mdoc_argv *v, int *pos, char *buf) |
{ |
{ |
|
|
v->sz = 0; |
v->sz = 0; |
v->value = NULL; |
v->value = NULL; |
|
|
switch (v->arg) { |
switch (mdoc_argvflags[v->arg]) { |
case(MDOC_Std): |
case (ARGV_SINGLE): |
/* FALLTHROUGH */ |
return(argv_single(mdoc, line, v, pos, buf)); |
case(MDOC_Width): |
case (ARGV_MULTI): |
/* FALLTHROUGH */ |
return(argv_multi(mdoc, line, v, pos, buf)); |
case(MDOC_Offset): |
case (ARGV_OPT_SINGLE): |
return(parse_single(mdoc, line, v, pos, buf)); |
return(argv_opt_single(mdoc, line, v, pos, buf)); |
case(MDOC_Column): |
|
return(parse_multi(mdoc, line, v, pos, buf)); |
|
default: |
default: |
|
/* ARGV_NONE */ |
break; |
break; |
} |
} |
|
|
return(1); |
return(1); |
} |
} |
|
|
|
|
/*
 * Earlier revision of the argument parser: try to parse one
 * `-key [value...]' argument of macro `tok' at buf[*pos] into the
 * caller-supplied structure `v', which is zeroed first.
 *
 * Returns ARGV_EOLN at end of line, ARGV_WORD if the text does not
 * start with `-' or the key is unknown for `tok', ARGV_ERROR if a
 * warning callback, the value parser or the post-parse check fails,
 * and ARGV_ARG on success.
 *
 * NOTE(review): isspace() is called on a plain char cast to int; on
 * platforms where char is signed, a negative value is outside the range
 * that the <ctype.h> functions accept.
 */
int |

mdoc_argv(struct mdoc *mdoc, int line, int tok, |

struct mdoc_arg *v, int *pos, char *buf) |

{ |

int i, ppos; |

char *argv; |



(void)memset(v, 0, sizeof(struct mdoc_arg)); |



if (0 == buf[*pos]) |

return(ARGV_EOLN); |



assert( ! isspace((int)buf[*pos])); |



if ('-' != buf[*pos]) |

return(ARGV_WORD); |



/* i remembers the position of the dash; argv is the key after it. */
i = *pos; |

argv = &buf[++(*pos)]; |



v->line = line; |

v->pos = *pos; |



/* Scan to the first whitespace not preceded by a backslash. */
assert(*pos > 0); |

while (buf[*pos]) { |

if (isspace((int)buf[*pos])) |

if ('\\' != buf[*pos - 1]) |

break; |

(*pos)++; |

} |



/* Terminate the key in place; the overwritten byte is not saved. */
if (buf[*pos]) |

buf[(*pos)++] = 0; |



if (MDOC_ARG_MAX == (v->arg = lookup(tok, argv))) { |

/* The terminator written above is left in buf on this path. */
if ( ! mdoc_pwarn(mdoc, line, i, WARN_SYNTAX, "argument-like parameter")) |

return(ARGV_ERROR); |

return(ARGV_WORD); |

} |



/* Skip whitespace separating the key from its value(s). */
while (buf[*pos] && isspace((int)buf[*pos])) |

(*pos)++; |



/* FIXME: whitespace if no value. */ |



/* ppos is the start of the value text, passed on to postparse(). */
ppos = *pos; |

if ( ! parse(mdoc, line, v, pos, buf)) |

return(ARGV_ERROR); |

if ( ! postparse(mdoc, line, v, ppos)) |

return(ARGV_ERROR); |



return(ARGV_ARG); |

} |
|
|
|
|
|
/*
 * Earlier revision: release the value arrays of the `sz' arguments in
 * the array `arg'.  Only each element's `value' array is freed; the
 * strings it points to and the `arg' array itself are not freed here.
 */
void |

mdoc_argv_free(int sz, struct mdoc_arg *arg) |

{ |

int i; |



for (i = 0; i < sz; i++) { |

/* An argument without values must not carry a value array. */
if (0 == arg[i].sz) { |

assert(NULL == arg[i].value); |

continue; |

} |

assert(arg[i].value); |

free(arg[i].value); |

} |

} |
|
|
|