Annotation of mandoc/argv.c, Revision 1.49
1.49 ! kristaps 1: /* $Id: argv.c,v 1.48 2009/03/11 00:39:58 kristaps Exp $ */
1.1 kristaps 2: /*
3: * Copyright (c) 2008 Kristaps Dzonsons <kristaps@kth.se>
4: *
5: * Permission to use, copy, modify, and distribute this software for any
6: * purpose with or without fee is hereby granted, provided that the
7: * above copyright notice and this permission notice appear in all
8: * copies.
9: *
10: * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL
11: * WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED
12: * WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE
13: * AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL
14: * DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR
15: * PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER
16: * TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
17: * PERFORMANCE OF THIS SOFTWARE.
18: */
1.44 kristaps 19: #include <sys/types.h>
20:
1.1 kristaps 21: #include <assert.h>
22: #include <ctype.h>
23: #include <err.h>
24: #include <stdlib.h>
25: #include <stdio.h>
26: #include <string.h>
27:
28: #include "private.h"
29:
1.20 kristaps 30: /*
1.27 kristaps 31: * Routines to parse arguments of macros. Arguments follow the syntax
32: * of `-arg [val [valN...]]'. Arguments come in all types: quoted
33: * arguments, multiple arguments per value, no-value arguments, etc.
1.39 kristaps 34: *
35: * There's no limit to the number of arguments that may be allocated.
1.20 kristaps 36: */
37:
/*
 * Flags steering how args() splits the parameters of a macro line.
 */
#define	ARGS_QUOTED	0x01	/* double-quoted parameters are accepted */
#define	ARGS_DELIM	0x02	/* a tail of lone delimiters is punctuation */
#define	ARGS_TABSEP	0x04	/* parameters are split on tabs or `Ta' */
#define	ARGS_ARGVLIKE	0x08	/* no warning for a leading `-' */
1.15 kristaps 42:
/*
 * How many values a `-key' argument takes; consumed by argv().
 */
#define	ARGV_NONE	0x01	/* no value at all */
#define	ARGV_SINGLE	0x02	/* exactly one, mandatory, value */
#define	ARGV_MULTI	0x04	/* one or more values */
#define	ARGV_OPT_SINGLE	0x08	/* at most one, optional, value */
47:
/* Warning codes accepted by pwarn(). */
enum	mwarn {
	WQUOTPARM = 0,	/* "unexpected quoted parameter" */
	WARGVPARM,	/* "argument-like parameter" */
	WCOLEMPTY,	/* "last list column is empty" */
	WTAILWS		/* "trailing whitespace" */
};
54:
/* Error codes accepted by perr(). */
enum	merr {
	EQUOTTERM = 0,	/* "unterminated quoted parameter" */
	EARGVAL		/* "argument requires a value" */
};
59:
/* Forward declarations of the file-local helpers. */
static	int	  argv_a2arg(int tok, const char *argv);
static	int	  args(struct mdoc *mdoc, int line, int *pos,
			char *buf, int fl, char **v);
static	int	  argv(struct mdoc *mdoc, int tok, int line,
			struct mdoc_argv *v, int *pos, char *buf);
static	int	  argv_single(struct mdoc *mdoc, int line,
			struct mdoc_argv *v, int *pos, char *buf);
static	int	  argv_opt_single(struct mdoc *mdoc, int line,
			struct mdoc_argv *v, int *pos, char *buf);
static	int	  argv_multi(struct mdoc *mdoc, int line,
			struct mdoc_argv *v, int *pos, char *buf);
static	int	  pwarn(struct mdoc *mdoc, int line, int pos,
			enum mwarn code);
static	int	  perr(struct mdoc *mdoc, int line, int pos,
			enum merr code);
1.22 kristaps 73:
1.36 kristaps 74: /* Per-argument flags. */
75:
76: static int mdoc_argvflags[MDOC_ARG_MAX] = {
77: ARGV_NONE, /* MDOC_Split */
78: ARGV_NONE, /* MDOC_Nosplit */
79: ARGV_NONE, /* MDOC_Ragged */
80: ARGV_NONE, /* MDOC_Unfilled */
81: ARGV_NONE, /* MDOC_Literal */
82: ARGV_NONE, /* MDOC_File */
83: ARGV_SINGLE, /* MDOC_Offset */
84: ARGV_NONE, /* MDOC_Bullet */
85: ARGV_NONE, /* MDOC_Dash */
86: ARGV_NONE, /* MDOC_Hyphen */
87: ARGV_NONE, /* MDOC_Item */
88: ARGV_NONE, /* MDOC_Enum */
89: ARGV_NONE, /* MDOC_Tag */
90: ARGV_NONE, /* MDOC_Diag */
91: ARGV_NONE, /* MDOC_Hang */
92: ARGV_NONE, /* MDOC_Ohang */
93: ARGV_NONE, /* MDOC_Inset */
94: ARGV_MULTI, /* MDOC_Column */
95: ARGV_SINGLE, /* MDOC_Width */
96: ARGV_NONE, /* MDOC_Compact */
1.37 kristaps 97: ARGV_SINGLE, /* MDOC_Std */
1.36 kristaps 98: ARGV_NONE, /* MDOC_Filled */
99: ARGV_NONE, /* MDOC_Words */
100: ARGV_NONE, /* MDOC_Emphasis */
101: ARGV_NONE /* MDOC_Symbolic */
102: };
103:
1.22 kristaps 104: static int mdoc_argflags[MDOC_MAX] = {
105: 0, /* \" */
106: 0, /* Dd */
107: 0, /* Dt */
108: 0, /* Os */
109: 0, /* Sh */
110: 0, /* Ss */
111: ARGS_DELIM, /* Pp */
112: ARGS_DELIM, /* D1 */
113: ARGS_DELIM, /* Dl */
114: 0, /* Bd */
115: 0, /* Ed */
116: 0, /* Bl */
117: 0, /* El */
1.32 kristaps 118: 0, /* It */
1.22 kristaps 119: ARGS_DELIM, /* Ad */
120: ARGS_DELIM, /* An */
121: ARGS_DELIM, /* Ar */
122: ARGS_QUOTED, /* Cd */
123: ARGS_DELIM, /* Cm */
124: ARGS_DELIM, /* Dv */
125: ARGS_DELIM, /* Er */
126: ARGS_DELIM, /* Ev */
127: 0, /* Ex */
128: ARGS_DELIM | ARGS_QUOTED, /* Fa */
129: 0, /* Fd */
130: ARGS_DELIM, /* Fl */
131: ARGS_DELIM | ARGS_QUOTED, /* Fn */
132: ARGS_DELIM | ARGS_QUOTED, /* Ft */
133: ARGS_DELIM, /* Ic */
134: 0, /* In */
135: ARGS_DELIM, /* Li */
136: 0, /* Nd */
137: ARGS_DELIM, /* Nm */
138: ARGS_DELIM, /* Op */
139: 0, /* Ot */
140: ARGS_DELIM, /* Pa */
141: 0, /* Rv */
1.38 kristaps 142: ARGS_DELIM | ARGS_ARGVLIKE, /* St */
1.22 kristaps 143: ARGS_DELIM, /* Va */
144: ARGS_DELIM, /* Vt */
145: ARGS_DELIM, /* Xr */
146: ARGS_QUOTED, /* %A */
147: ARGS_QUOTED, /* %B */
148: ARGS_QUOTED, /* %D */
149: ARGS_QUOTED, /* %I */
150: ARGS_QUOTED, /* %J */
151: ARGS_QUOTED, /* %N */
152: ARGS_QUOTED, /* %O */
153: ARGS_QUOTED, /* %P */
154: ARGS_QUOTED, /* %R */
155: ARGS_QUOTED, /* %T */
156: ARGS_QUOTED, /* %V */
157: ARGS_DELIM, /* Ac */
158: 0, /* Ao */
159: ARGS_DELIM, /* Aq */
160: ARGS_DELIM, /* At */
161: ARGS_DELIM, /* Bc */
162: 0, /* Bf */
163: 0, /* Bo */
164: ARGS_DELIM, /* Bq */
165: ARGS_DELIM, /* Bsx */
166: ARGS_DELIM, /* Bx */
167: 0, /* Db */
168: ARGS_DELIM, /* Dc */
169: 0, /* Do */
170: ARGS_DELIM, /* Dq */
171: ARGS_DELIM, /* Ec */
172: 0, /* Ef */
173: ARGS_DELIM, /* Em */
174: 0, /* Eo */
175: ARGS_DELIM, /* Fx */
176: ARGS_DELIM, /* Ms */
177: ARGS_DELIM, /* No */
178: ARGS_DELIM, /* Ns */
179: ARGS_DELIM, /* Nx */
180: ARGS_DELIM, /* Ox */
181: ARGS_DELIM, /* Pc */
182: ARGS_DELIM, /* Pf */
183: 0, /* Po */
184: ARGS_DELIM, /* Pq */
185: ARGS_DELIM, /* Qc */
186: ARGS_DELIM, /* Ql */
187: 0, /* Qo */
188: ARGS_DELIM, /* Qq */
189: 0, /* Re */
190: 0, /* Rs */
191: ARGS_DELIM, /* Sc */
192: 0, /* So */
193: ARGS_DELIM, /* Sq */
194: 0, /* Sm */
195: ARGS_DELIM, /* Sx */
196: ARGS_DELIM, /* Sy */
197: ARGS_DELIM, /* Tn */
198: ARGS_DELIM, /* Ux */
199: ARGS_DELIM, /* Xc */
200: 0, /* Xo */
201: 0, /* Fo */
202: 0, /* Fc */
203: 0, /* Oo */
204: ARGS_DELIM, /* Oc */
205: 0, /* Bk */
206: 0, /* Ek */
207: 0, /* Bt */
208: 0, /* Hf */
209: 0, /* Fr */
210: 0, /* Ud */
1.38 kristaps 211: 0, /* Lb */
1.42 kristaps 212: 0, /* Ap */
1.45 kristaps 213: ARGS_DELIM, /* Lp */
214: ARGS_DELIM | ARGS_QUOTED, /* Lk */
215: ARGS_DELIM | ARGS_QUOTED, /* Mt */
1.48 kristaps 216: ARGS_DELIM, /* Brq */
217: 0, /* Bro */
218: ARGS_DELIM, /* Brc */
1.22 kristaps 219: };
220:
1.1 kristaps 221:
1.39 kristaps 222: /*
223: * Parse an argument from line text. This comes in the form of -key
224: * [value0...], which may either have a single mandatory value, at least
225: * one mandatory value, an optional single value, or no value.
226: */
227: int
228: mdoc_argv(struct mdoc *mdoc, int line, int tok,
229: struct mdoc_arg **v, int *pos, char *buf)
230: {
231: int i;
1.46 kristaps 232: char *p, sv;
1.39 kristaps 233: struct mdoc_argv tmp;
234: struct mdoc_arg *arg;
235:
236: if (0 == buf[*pos])
237: return(ARGV_EOLN);
238:
239: assert( ! isspace((u_char)buf[*pos]));
240:
241: if ('-' != buf[*pos])
242: return(ARGV_WORD);
243:
244: i = *pos;
245: p = &buf[++(*pos)];
246:
247: assert(*pos > 0);
248:
249: /* LINTED */
250: while (buf[*pos]) {
251: if (isspace((u_char)buf[*pos]))
252: if ('\\' != buf[*pos - 1])
253: break;
254: (*pos)++;
255: }
256:
1.46 kristaps 257: /*
258: * XXX: save the nullified byte as we'll restore it if this
1.47 kristaps 259: * doesn't end up being a command after all. This is a little
260: * bit hacky. I don't like it, but it works for now.
1.46 kristaps 261: */
262:
1.47 kristaps 263: sv = 0;
1.46 kristaps 264: if (buf[*pos]) {
265: sv = buf[*pos];
1.39 kristaps 266: buf[(*pos)++] = 0;
1.46 kristaps 267: }
1.39 kristaps 268:
269: (void)memset(&tmp, 0, sizeof(struct mdoc_argv));
270: tmp.line = line;
271: tmp.pos = *pos;
272:
273: /*
274: * We now parse out the per-macro arguments. XXX - this can be
275: * made much cleaner using per-argument tables. See argv_a2arg
276: * for details.
277: */
278:
279: if (MDOC_ARG_MAX == (tmp.arg = argv_a2arg(tok, p))) {
1.47 kristaps 280: /* XXX - restore saved byte. */
281: if (sv)
282: buf[*pos - 1] = sv;
1.39 kristaps 283: if ( ! pwarn(mdoc, line, i, WARGVPARM))
284: return(ARGV_ERROR);
285: return(ARGV_WORD);
286: }
287:
288: while (buf[*pos] && isspace((u_char)buf[*pos]))
289: (*pos)++;
290:
291: /* FIXME: whitespace if no value. */
292:
293: if ( ! argv(mdoc, tok, line, &tmp, pos, buf))
294: return(ARGV_ERROR);
295:
296: if (NULL == (arg = *v)) {
1.40 kristaps 297: *v = xcalloc(1, sizeof(struct mdoc_arg));
1.39 kristaps 298: arg = *v;
1.40 kristaps 299: }
1.39 kristaps 300:
301: arg->argc++;
302: arg->argv = xrealloc(arg->argv, arg->argc *
1.40 kristaps 303: sizeof(struct mdoc_argv));
1.39 kristaps 304:
305: (void)memcpy(&arg->argv[(int)arg->argc - 1],
306: &tmp, sizeof(struct mdoc_argv));
307:
308: return(ARGV_ARG);
309: }
310:
311:
312: void
313: mdoc_argv_free(struct mdoc_arg *p)
314: {
315: int i, j;
316:
1.41 kristaps 317: if (NULL == p)
318: return;
319:
1.40 kristaps 320: if (p->refcnt) {
321: --(p->refcnt);
322: if (p->refcnt)
323: return;
324: }
325:
326: assert(p->argc);
1.39 kristaps 327:
328: /* LINTED */
329: for (i = 0; i < (int)p->argc; i++) {
330: if (0 == p->argv[i].sz)
331: continue;
332: /* LINTED */
333: for (j = 0; j < (int)p->argv[i].sz; j++)
334: free(p->argv[i].value[j]);
1.40 kristaps 335:
1.39 kristaps 336: free(p->argv[i].value);
337: }
338:
1.40 kristaps 339: free(p->argv);
1.39 kristaps 340: free(p);
341: }
342:
343:
344:
1.24 kristaps 345: static int
1.39 kristaps 346: perr(struct mdoc *mdoc, int line, int pos, enum merr code)
1.25 kristaps 347: {
1.39 kristaps 348: char *p;
349:
350: p = NULL;
1.25 kristaps 351:
352: switch (code) {
353: case (EQUOTTERM):
1.39 kristaps 354: p = "unterminated quoted parameter";
1.25 kristaps 355: break;
356: case (EARGVAL):
1.39 kristaps 357: p = "argument requires a value";
1.25 kristaps 358: break;
359: }
1.39 kristaps 360:
361: assert(p);
362: return(mdoc_perr(mdoc, line, pos, p));
1.25 kristaps 363: }
364:
365:
366: static int
1.39 kristaps 367: pwarn(struct mdoc *mdoc, int line, int pos, enum mwarn code)
1.24 kristaps 368: {
1.39 kristaps 369: char *p;
1.24 kristaps 370: int c;
371:
1.39 kristaps 372: p = NULL;
373: c = WARN_SYNTAX;
374:
1.24 kristaps 375: switch (code) {
376: case (WQUOTPARM):
1.39 kristaps 377: p = "unexpected quoted parameter";
1.24 kristaps 378: break;
379: case (WARGVPARM):
1.39 kristaps 380: p = "argument-like parameter";
1.24 kristaps 381: break;
1.25 kristaps 382: case (WCOLEMPTY):
1.39 kristaps 383: p = "last list column is empty";
384: c = WARN_COMPAT;
1.25 kristaps 385: break;
386: case (WTAILWS):
1.39 kristaps 387: p = "trailing whitespace";
388: c = WARN_COMPAT;
1.25 kristaps 389: break;
1.24 kristaps 390: }
1.39 kristaps 391:
392: assert(p);
393: return(mdoc_pwarn(mdoc, line, pos, c, p));
1.24 kristaps 394: }
395:
396:
1.2 kristaps 397: int
1.22 kristaps 398: mdoc_args(struct mdoc *mdoc, int line,
399: int *pos, char *buf, int tok, char **v)
1.1 kristaps 400: {
1.26 kristaps 401: int fl, c, i;
1.22 kristaps 402: struct mdoc_node *n;
403:
1.24 kristaps 404: fl = (0 == tok) ? 0 : mdoc_argflags[tok];
405:
406: /*
1.36 kristaps 407: * Override per-macro argument flags with context-specific ones.
408: * As of now, this is only valid for `It' depending on its list
409: * context.
1.24 kristaps 410: */
411:
1.36 kristaps 412: switch (tok) {
413: case (MDOC_It):
1.24 kristaps 414: for (n = mdoc->last; n; n = n->parent)
1.36 kristaps 415: if (MDOC_BLOCK == n->type && MDOC_Bl == n->tok)
416: break;
417:
1.24 kristaps 418: assert(n);
1.39 kristaps 419: c = (int)(n->args ? n->args->argc : 0);
1.24 kristaps 420: assert(c > 0);
1.26 kristaps 421:
1.36 kristaps 422: /*
423: * Using `Bl -column' adds ARGS_TABSEP to the arguments
424: * and invalidates ARGS_DELIM. Using `Bl -diag' allows
425: * for quoted arguments.
426: */
427:
1.26 kristaps 428: /* LINTED */
1.24 kristaps 429: for (i = 0; i < c; i++) {
1.39 kristaps 430: switch (n->args->argv[i].arg) {
1.35 kristaps 431: case (MDOC_Column):
432: fl |= ARGS_TABSEP;
433: fl &= ~ARGS_DELIM;
434: i = c;
435: break;
436: case (MDOC_Diag):
437: fl |= ARGS_QUOTED;
438: i = c;
439: break;
440: default:
441: break;
442: }
1.24 kristaps 443: }
1.39 kristaps 444: break;
1.36 kristaps 445: default:
446: break;
1.24 kristaps 447: }
448:
1.36 kristaps 449: /* Continue parsing the arguments themselves... */
450:
1.26 kristaps 451: return(args(mdoc, line, pos, buf, fl, v));
452: }
453:
454:
455: static int
456: args(struct mdoc *mdoc, int line,
457: int *pos, char *buf, int fl, char **v)
458: {
1.31 kristaps 459: int i;
1.26 kristaps 460: char *p, *pp;
461:
462: assert(*pos > 0);
463:
464: if (0 == buf[*pos])
465: return(ARGS_EOLN);
466:
467: if ('\"' == buf[*pos] && ! (fl & ARGS_QUOTED))
468: if ( ! pwarn(mdoc, line, *pos, WQUOTPARM))
469: return(ARGS_ERROR);
470:
1.38 kristaps 471: if ( ! (fl & ARGS_ARGVLIKE) && '-' == buf[*pos])
1.26 kristaps 472: if ( ! pwarn(mdoc, line, *pos, WARGVPARM))
473: return(ARGS_ERROR);
474:
1.24 kristaps 475: /*
476: * If the first character is a delimiter and we're to look for
477: * delimited strings, then pass down the buffer seeing if it
478: * follows the pattern of [[::delim::][ ]+]+.
479: */
480:
1.2 kristaps 481: if ((fl & ARGS_DELIM) && mdoc_iscdelim(buf[*pos])) {
1.31 kristaps 482: for (i = *pos; buf[i]; ) {
483: if ( ! mdoc_iscdelim(buf[i]))
1.2 kristaps 484: break;
485: i++;
1.34 kristaps 486: /* There must be at least one space... */
1.37 kristaps 487: if (0 == buf[i] || ! isspace((u_char)buf[i]))
1.34 kristaps 488: break;
489: i++;
1.37 kristaps 490: while (buf[i] && isspace((u_char)buf[i]))
1.2 kristaps 491: i++;
492: }
493: if (0 == buf[i]) {
494: *v = &buf[*pos];
495: return(ARGS_PUNCT);
496: }
497: }
498:
1.24 kristaps 499: /* First parse non-quoted strings. */
1.1 kristaps 500:
1.17 kristaps 501: if ('\"' != buf[*pos] || ! (ARGS_QUOTED & fl)) {
1.1 kristaps 502: *v = &buf[*pos];
503:
1.24 kristaps 504: /*
505: * Thar be dragons here! If we're tab-separated, search
506: * ahead for either a tab or the `Ta' macro. If a tab
507: * is detected, it mustn't be escaped; if a `Ta' is
508: * detected, it must be space-buffered before and after.
509: * If either of these hold true, then prune out the
510: * extra spaces and call it an argument.
511: */
512:
513: if (ARGS_TABSEP & fl) {
514: /* Scan ahead to unescaped tab. */
1.12 kristaps 515:
1.24 kristaps 516: for (p = *v; ; p++) {
517: if (NULL == (p = strchr(p, '\t')))
518: break;
519: if (p == *v)
520: break;
521: if ('\\' != *(p - 1))
1.12 kristaps 522: break;
523: }
1.24 kristaps 524:
525: /* Scan ahead to unescaped `Ta'. */
526:
527: for (pp = *v; ; pp++) {
528: if (NULL == (pp = strstr(pp, "Ta")))
529: break;
530: if (pp > *v && ' ' != *(pp - 1))
531: continue;
532: if (' ' == *(pp + 2) || 0 == *(pp + 2))
533: break;
534: }
535:
536: /* Choose delimiter tab/Ta. */
537:
538: if (p && pp)
539: p = (p < pp ? p : pp);
540: else if ( ! p && pp)
541: p = pp;
542:
543: /* Strip delimiter's preceding whitespace. */
544:
545: if (p && p > *v) {
546: pp = p - 1;
547: while (pp > *v && ' ' == *pp)
548: pp--;
549: if (pp == *v && ' ' == *pp)
550: *pp = 0;
551: else if (' ' == *pp)
552: *(pp + 1) = 0;
553: }
554:
555: /* ...in- and proceding whitespace. */
556:
557: if (p && ('\t' != *p)) {
558: *p++ = 0;
559: *p++ = 0;
560: } else if (p)
561: *p++ = 0;
562:
563: if (p) {
564: while (' ' == *p)
565: p++;
566: if (0 != *p)
567: *(p - 1) = 0;
1.33 kristaps 568: *pos += (int)(p - *v);
1.24 kristaps 569: }
570:
1.25 kristaps 571: if (p && 0 == *p)
572: if ( ! pwarn(mdoc, line, *pos, WCOLEMPTY))
573: return(0);
574: if (p && 0 == *p && p > *v && ' ' == *(p - 1))
575: if ( ! pwarn(mdoc, line, *pos, WTAILWS))
576: return(0);
577:
1.26 kristaps 578: if (p)
1.49 ! kristaps 579: return(ARGS_PHRASE);
1.26 kristaps 580:
1.24 kristaps 581: /* Configure the eoln case, too. */
582:
1.26 kristaps 583: p = strchr(*v, 0);
584: assert(p);
585:
586: if (p > *v && ' ' == *(p - 1))
587: if ( ! pwarn(mdoc, line, *pos, WTAILWS))
588: return(0);
1.33 kristaps 589: *pos += (int)(p - *v);
1.24 kristaps 590:
1.49 ! kristaps 591: return(ARGS_PHRASE);
1.24 kristaps 592: }
1.46 kristaps 593:
1.24 kristaps 594: /* Do non-tabsep look-ahead here. */
595:
596: if ( ! (ARGS_TABSEP & fl))
1.31 kristaps 597: while (buf[*pos]) {
1.37 kristaps 598: if (isspace((u_char)buf[*pos]))
1.17 kristaps 599: if ('\\' != buf[*pos - 1])
600: break;
1.12 kristaps 601: (*pos)++;
1.17 kristaps 602: }
1.1 kristaps 603:
604: if (0 == buf[*pos])
1.2 kristaps 605: return(ARGS_WORD);
1.1 kristaps 606:
607: buf[(*pos)++] = 0;
1.12 kristaps 608:
1.1 kristaps 609: if (0 == buf[*pos])
1.2 kristaps 610: return(ARGS_WORD);
1.1 kristaps 611:
1.12 kristaps 612: if ( ! (ARGS_TABSEP & fl))
1.37 kristaps 613: while (buf[*pos] && isspace((u_char)buf[*pos]))
1.12 kristaps 614: (*pos)++;
1.1 kristaps 615:
616: if (buf[*pos])
1.2 kristaps 617: return(ARGS_WORD);
1.1 kristaps 618:
1.25 kristaps 619: if ( ! pwarn(mdoc, line, *pos, WTAILWS))
1.2 kristaps 620: return(ARGS_ERROR);
1.1 kristaps 621:
1.2 kristaps 622: return(ARGS_WORD);
623: }
624:
625: /*
626: * If we're a quoted string (and quoted strings are allowed),
627: * then parse ahead to the next quote. If none's found, it's an
1.4 kristaps 628: * error. After, parse to the next word.
1.2 kristaps 629: */
1.1 kristaps 630:
631: *v = &buf[++(*pos)];
632:
633: while (buf[*pos] && '\"' != buf[*pos])
634: (*pos)++;
635:
636: if (0 == buf[*pos]) {
1.25 kristaps 637: (void)perr(mdoc, line, *pos, EQUOTTERM);
1.2 kristaps 638: return(ARGS_ERROR);
1.1 kristaps 639: }
640:
641: buf[(*pos)++] = 0;
642: if (0 == buf[*pos])
1.19 kristaps 643: return(ARGS_QWORD);
1.1 kristaps 644:
1.37 kristaps 645: while (buf[*pos] && isspace((u_char)buf[*pos]))
1.1 kristaps 646: (*pos)++;
647:
648: if (buf[*pos])
1.19 kristaps 649: return(ARGS_QWORD);
1.1 kristaps 650:
1.25 kristaps 651: if ( ! pwarn(mdoc, line, *pos, WTAILWS))
1.2 kristaps 652: return(ARGS_ERROR);
653:
1.19 kristaps 654: return(ARGS_QWORD);
1.1 kristaps 655: }
656:
657:
1.2 kristaps 658: static int
1.30 kristaps 659: argv_a2arg(int tok, const char *argv)
1.1 kristaps 660: {
661:
1.36 kristaps 662: /*
663: * Parse an argument identifier from its text. XXX - this
664: * should really be table-driven to clarify the code.
665: *
666: * If you add an argument to the list, make sure that you
667: * register it here with its one or more macros!
668: */
669:
1.1 kristaps 670: switch (tok) {
1.6 kristaps 671: case (MDOC_An):
672: if (xstrcmp(argv, "split"))
673: return(MDOC_Split);
674: else if (xstrcmp(argv, "nosplit"))
675: return(MDOC_Nosplit);
676: break;
677:
1.2 kristaps 678: case (MDOC_Bd):
1.1 kristaps 679: if (xstrcmp(argv, "ragged"))
680: return(MDOC_Ragged);
681: else if (xstrcmp(argv, "unfilled"))
682: return(MDOC_Unfilled);
1.13 kristaps 683: else if (xstrcmp(argv, "filled"))
684: return(MDOC_Filled);
1.1 kristaps 685: else if (xstrcmp(argv, "literal"))
686: return(MDOC_Literal);
687: else if (xstrcmp(argv, "file"))
688: return(MDOC_File);
689: else if (xstrcmp(argv, "offset"))
690: return(MDOC_Offset);
1.49 ! kristaps 691: else if (xstrcmp(argv, "compact"))
! 692: return(MDOC_Compact);
1.2 kristaps 693: break;
694:
1.8 kristaps 695: case (MDOC_Bf):
696: if (xstrcmp(argv, "emphasis"))
697: return(MDOC_Emphasis);
698: else if (xstrcmp(argv, "literal"))
699: return(MDOC_Literal);
700: else if (xstrcmp(argv, "symbolic"))
701: return(MDOC_Symbolic);
702: break;
703:
1.7 kristaps 704: case (MDOC_Bk):
705: if (xstrcmp(argv, "words"))
706: return(MDOC_Words);
707: break;
708:
1.2 kristaps 709: case (MDOC_Bl):
710: if (xstrcmp(argv, "bullet"))
1.1 kristaps 711: return(MDOC_Bullet);
712: else if (xstrcmp(argv, "dash"))
713: return(MDOC_Dash);
714: else if (xstrcmp(argv, "hyphen"))
715: return(MDOC_Hyphen);
716: else if (xstrcmp(argv, "item"))
717: return(MDOC_Item);
718: else if (xstrcmp(argv, "enum"))
719: return(MDOC_Enum);
720: else if (xstrcmp(argv, "tag"))
721: return(MDOC_Tag);
722: else if (xstrcmp(argv, "diag"))
723: return(MDOC_Diag);
724: else if (xstrcmp(argv, "hang"))
725: return(MDOC_Hang);
726: else if (xstrcmp(argv, "ohang"))
727: return(MDOC_Ohang);
728: else if (xstrcmp(argv, "inset"))
729: return(MDOC_Inset);
730: else if (xstrcmp(argv, "column"))
731: return(MDOC_Column);
732: else if (xstrcmp(argv, "width"))
733: return(MDOC_Width);
1.2 kristaps 734: else if (xstrcmp(argv, "offset"))
735: return(MDOC_Offset);
1.1 kristaps 736: else if (xstrcmp(argv, "compact"))
737: return(MDOC_Compact);
1.2 kristaps 738: break;
1.3 kristaps 739:
740: case (MDOC_Rv):
741: /* FALLTHROUGH */
742: case (MDOC_Ex):
743: if (xstrcmp(argv, "std"))
744: return(MDOC_Std);
745: break;
1.1 kristaps 746: default:
1.8 kristaps 747: break;
1.1 kristaps 748: }
749:
750: return(MDOC_ARG_MAX);
751: }
752:
753:
1.2 kristaps 754: static int
1.26 kristaps 755: argv_multi(struct mdoc *mdoc, int line,
1.39 kristaps 756: struct mdoc_argv *v, int *pos, char *buf)
1.12 kristaps 757: {
758: int c, ppos;
759: char *p;
760:
761: ppos = *pos;
762:
1.39 kristaps 763: for (v->sz = 0; ; v->sz++) {
1.12 kristaps 764: if ('-' == buf[*pos])
765: break;
1.26 kristaps 766: c = args(mdoc, line, pos, buf, ARGS_QUOTED, &p);
1.39 kristaps 767: if (ARGS_ERROR == c)
1.12 kristaps 768: return(0);
1.39 kristaps 769: else if (ARGS_EOLN == c)
1.12 kristaps 770: break;
1.39 kristaps 771:
772: if (0 == v->sz % 5)
773: v->value = xrealloc(v->value,
774: (v->sz + 5) * sizeof(char *));
775:
1.40 kristaps 776: v->value[(int)v->sz] = xstrdup(p);
1.12 kristaps 777: }
778:
1.39 kristaps 779: if (v->sz)
1.12 kristaps 780: return(1);
781:
1.39 kristaps 782: return(perr(mdoc, line, ppos, EARGVAL));
1.12 kristaps 783: }
784:
785:
786: static int
1.36 kristaps 787: argv_opt_single(struct mdoc *mdoc, int line,
1.39 kristaps 788: struct mdoc_argv *v, int *pos, char *buf)
1.36 kristaps 789: {
1.39 kristaps 790: int c;
1.36 kristaps 791: char *p;
792:
793: if ('-' == buf[*pos])
794: return(1);
795:
796: c = args(mdoc, line, pos, buf, ARGS_QUOTED, &p);
797: if (ARGS_ERROR == c)
798: return(0);
799: if (ARGS_EOLN == c)
800: return(1);
801:
802: v->sz = 1;
803: v->value = xcalloc(1, sizeof(char *));
1.40 kristaps 804: v->value[0] = xstrdup(p);
1.36 kristaps 805: return(1);
806: }
807:
808:
809: /*
810: * Parse a single, mandatory value from the stream.
811: */
812: static int
1.26 kristaps 813: argv_single(struct mdoc *mdoc, int line,
1.39 kristaps 814: struct mdoc_argv *v, int *pos, char *buf)
1.1 kristaps 815: {
1.12 kristaps 816: int c, ppos;
1.1 kristaps 817: char *p;
818:
819: ppos = *pos;
820:
1.26 kristaps 821: c = args(mdoc, line, pos, buf, ARGS_QUOTED, &p);
1.12 kristaps 822: if (ARGS_ERROR == c)
823: return(0);
824: if (ARGS_EOLN == c)
1.36 kristaps 825: return(perr(mdoc, line, ppos, EARGVAL));
1.12 kristaps 826:
827: v->sz = 1;
828: v->value = xcalloc(1, sizeof(char *));
1.40 kristaps 829: v->value[0] = xstrdup(p);
1.12 kristaps 830: return(1);
831: }
832:
833:
1.36 kristaps 834: /*
835: * Determine rules for parsing arguments. Arguments can either accept
836: * no parameters, an optional single parameter, one parameter, or
837: * multiple parameters.
838: */
1.12 kristaps 839: static int
1.37 kristaps 840: argv(struct mdoc *mdoc, int tok, int line,
1.39 kristaps 841: struct mdoc_argv *v, int *pos, char *buf)
1.12 kristaps 842: {
1.37 kristaps 843: int fl;
1.12 kristaps 844:
845: v->sz = 0;
846: v->value = NULL;
1.37 kristaps 847: fl = mdoc_argvflags[v->arg];
1.12 kristaps 848:
1.37 kristaps 849: /*
850: * Override the default per-argument value.
851: */
852:
853: switch (tok) {
854: case (MDOC_Ex):
855: fl = ARGV_OPT_SINGLE;
856: break;
857: default:
858: break;
859: }
860:
861: switch (fl) {
1.36 kristaps 862: case (ARGV_SINGLE):
1.26 kristaps 863: return(argv_single(mdoc, line, v, pos, buf));
1.36 kristaps 864: case (ARGV_MULTI):
1.26 kristaps 865: return(argv_multi(mdoc, line, v, pos, buf));
1.36 kristaps 866: case (ARGV_OPT_SINGLE):
867: return(argv_opt_single(mdoc, line, v, pos, buf));
1.1 kristaps 868: default:
1.36 kristaps 869: /* ARGV_NONE */
1.6 kristaps 870: break;
1.1 kristaps 871: }
872:
873: return(1);
874: }
CVSweb