Annotation of mandoc/argv.c, Revision 1.53
1.53 ! kristaps 1: /* $Id: argv.c,v 1.52 2009/03/16 22:19:19 kristaps Exp $ */
1.1 kristaps 2: /*
1.53 ! kristaps 3: * Copyright (c) 2008, 2009 Kristaps Dzonsons <kristaps@openbsd.org>
1.1 kristaps 4: *
5: * Permission to use, copy, modify, and distribute this software for any
6: * purpose with or without fee is hereby granted, provided that the
7: * above copyright notice and this permission notice appear in all
8: * copies.
9: *
10: * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL
11: * WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED
12: * WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE
13: * AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL
14: * DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR
15: * PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER
16: * TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
17: * PERFORMANCE OF THIS SOFTWARE.
18: */
1.44 kristaps 19: #include <sys/types.h>
20:
1.1 kristaps 21: #include <assert.h>
22: #include <ctype.h>
23: #include <err.h>
24: #include <stdlib.h>
25: #include <stdio.h>
26: #include <string.h>
27:
28: #include "private.h"
29:
1.20 kristaps 30: /*
1.27 kristaps 31: * Routines to parse arguments of macros. Arguments follow the syntax
32: * of `-arg [val [valN...]]'. Arguments come in all types: quoted
33: * arguments, multiple arguments per value, no-value arguments, etc.
1.39 kristaps 34: *
35: * There's no limit to the number of arguments that may be allocated.
1.20 kristaps 36: */
37:
1.24 kristaps 38: #define ARGS_QUOTED (1 << 0) /* args(): a leading `"' opens a quoted word (ARGS_QWORD) */
39: #define ARGS_DELIM (1 << 1) /* args(): a remainder made only of delimiters yields ARGS_PUNCT */
40: #define ARGS_TABSEP (1 << 2) /* args(): split on a tab or a free-standing `Ta' (ARGS_PHRASE) */
1.38 kristaps 41: #define ARGS_ARGVLIKE (1 << 3) /* a leading `-' is an ordinary word: not parsed as an argument, not warned about */
1.15 kristaps 42:
1.36 kristaps 43: #define ARGV_NONE (1 << 0) /* argv(): argument takes no value */
44: #define ARGV_SINGLE (1 << 1) /* argv(): exactly one mandatory value, see argv_single() */
45: #define ARGV_MULTI (1 << 2) /* argv(): one or more values, see argv_multi() */
46: #define ARGV_OPT_SINGLE (1 << 3) /* argv(): at most one value, see argv_opt_single() */
47:
1.52 kristaps 48: #define MULTI_STEP 5 /* argv_multi() grows its value array by this many slots at a time */
49:
1.39 kristaps 50: enum mwarn { /* warning codes understood by pwarn() */
51: WQUOTPARM, /* "unexpected quoted parameter" */
52: WARGVPARM, /* "argument-like parameter" */
53: WCOLEMPTY, /* "last list column is empty" */
54: WTAILWS /* "trailing whitespace" */
55: };
56:
57: enum merr { /* error codes understood by perr() */
58: EQUOTTERM, /* "unterminated quoted parameter" */
59: EARGVAL /* "argument requires a value" */
60: };
61: /* Forward declarations of the file-local helpers defined further down. */
1.30 kristaps 62: static int argv_a2arg(int, const char *);
1.26 kristaps 63: static int args(struct mdoc *, int, int *,
64: char *, int, char **);
1.51 kristaps 65: static int argv(struct mdoc *, int,
1.39 kristaps 66: struct mdoc_argv *, int *, char *);
1.26 kristaps 67: static int argv_single(struct mdoc *, int,
1.39 kristaps 68: struct mdoc_argv *, int *, char *);
1.36 kristaps 69: static int argv_opt_single(struct mdoc *, int,
1.39 kristaps 70: struct mdoc_argv *, int *, char *);
1.26 kristaps 71: static int argv_multi(struct mdoc *, int,
1.39 kristaps 72: struct mdoc_argv *, int *, char *);
73: static int pwarn(struct mdoc *, int, int, enum mwarn);
74: static int perr(struct mdoc *, int, int, enum merr);
1.22 kristaps 75:
1.36 kristaps 76: /* Per-argument value rules (one ARGV_* constant each), indexed by argument identifier; argv() dispatches on the entry for v->arg. */
77:
78: static int mdoc_argvflags[MDOC_ARG_MAX] = {
79: ARGV_NONE, /* MDOC_Split */
80: ARGV_NONE, /* MDOC_Nosplit */
81: ARGV_NONE, /* MDOC_Ragged */
82: ARGV_NONE, /* MDOC_Unfilled */
83: ARGV_NONE, /* MDOC_Literal */
84: ARGV_NONE, /* MDOC_File */
85: ARGV_SINGLE, /* MDOC_Offset */
86: ARGV_NONE, /* MDOC_Bullet */
87: ARGV_NONE, /* MDOC_Dash */
88: ARGV_NONE, /* MDOC_Hyphen */
89: ARGV_NONE, /* MDOC_Item */
90: ARGV_NONE, /* MDOC_Enum */
91: ARGV_NONE, /* MDOC_Tag */
92: ARGV_NONE, /* MDOC_Diag */
93: ARGV_NONE, /* MDOC_Hang */
94: ARGV_NONE, /* MDOC_Ohang */
95: ARGV_NONE, /* MDOC_Inset */
96: ARGV_MULTI, /* MDOC_Column */
97: ARGV_SINGLE, /* MDOC_Width */
98: ARGV_NONE, /* MDOC_Compact */
1.50 kristaps 99: ARGV_OPT_SINGLE, /* MDOC_Std */
1.36 kristaps 100: ARGV_NONE, /* MDOC_Filled */
101: ARGV_NONE, /* MDOC_Words */
102: ARGV_NONE, /* MDOC_Emphasis */
1.50 kristaps 103: ARGV_NONE, /* MDOC_Symbolic */
1.36 kristaps 104: ARGV_NONE /* MDOC_Nested (presumably -- verify against the argument enum) */
105: };
106:
/* Per-macro ARGS_* flags, indexed by macro token; mdoc_args() and mdoc_argv() look a macro's flags up here. */
1.22 kristaps 107: static int mdoc_argflags[MDOC_MAX] = {
108: 0, /* \" */
109: 0, /* Dd */
110: 0, /* Dt */
111: 0, /* Os */
112: 0, /* Sh */
113: 0, /* Ss */
114: ARGS_DELIM, /* Pp */
115: ARGS_DELIM, /* D1 */
116: ARGS_DELIM, /* Dl */
117: 0, /* Bd */
118: 0, /* Ed */
119: 0, /* Bl */
120: 0, /* El */
1.32 kristaps 121: 0, /* It */
1.22 kristaps 122: ARGS_DELIM, /* Ad */
123: ARGS_DELIM, /* An */
124: ARGS_DELIM, /* Ar */
125: ARGS_QUOTED, /* Cd */
126: ARGS_DELIM, /* Cm */
127: ARGS_DELIM, /* Dv */
128: ARGS_DELIM, /* Er */
129: ARGS_DELIM, /* Ev */
130: 0, /* Ex */
131: ARGS_DELIM | ARGS_QUOTED, /* Fa */
132: 0, /* Fd */
133: ARGS_DELIM, /* Fl */
134: ARGS_DELIM | ARGS_QUOTED, /* Fn */
135: ARGS_DELIM | ARGS_QUOTED, /* Ft */
136: ARGS_DELIM, /* Ic */
137: 0, /* In */
138: ARGS_DELIM, /* Li */
139: 0, /* Nd */
140: ARGS_DELIM, /* Nm */
141: ARGS_DELIM, /* Op */
142: 0, /* Ot */
143: ARGS_DELIM, /* Pa */
144: 0, /* Rv */
1.38 kristaps 145: ARGS_DELIM | ARGS_ARGVLIKE, /* St */
1.22 kristaps 146: ARGS_DELIM, /* Va */
147: ARGS_DELIM, /* Vt */
148: ARGS_DELIM, /* Xr */
149: ARGS_QUOTED, /* %A */
150: ARGS_QUOTED, /* %B */
151: ARGS_QUOTED, /* %D */
152: ARGS_QUOTED, /* %I */
153: ARGS_QUOTED, /* %J */
154: ARGS_QUOTED, /* %N */
155: ARGS_QUOTED, /* %O */
156: ARGS_QUOTED, /* %P */
157: ARGS_QUOTED, /* %R */
158: ARGS_QUOTED, /* %T */
159: ARGS_QUOTED, /* %V */
160: ARGS_DELIM, /* Ac */
161: 0, /* Ao */
162: ARGS_DELIM, /* Aq */
163: ARGS_DELIM, /* At */
164: ARGS_DELIM, /* Bc */
165: 0, /* Bf */
166: 0, /* Bo */
167: ARGS_DELIM, /* Bq */
168: ARGS_DELIM, /* Bsx */
169: ARGS_DELIM, /* Bx */
170: 0, /* Db */
171: ARGS_DELIM, /* Dc */
172: 0, /* Do */
173: ARGS_DELIM, /* Dq */
174: ARGS_DELIM, /* Ec */
175: 0, /* Ef */
176: ARGS_DELIM, /* Em */
177: 0, /* Eo */
178: ARGS_DELIM, /* Fx */
179: ARGS_DELIM, /* Ms */
180: ARGS_DELIM, /* No */
181: ARGS_DELIM, /* Ns */
182: ARGS_DELIM, /* Nx */
183: ARGS_DELIM, /* Ox */
184: ARGS_DELIM, /* Pc */
185: ARGS_DELIM, /* Pf */
186: 0, /* Po */
187: ARGS_DELIM, /* Pq */
188: ARGS_DELIM, /* Qc */
189: ARGS_DELIM, /* Ql */
190: 0, /* Qo */
191: ARGS_DELIM, /* Qq */
192: 0, /* Re */
193: 0, /* Rs */
194: ARGS_DELIM, /* Sc */
195: 0, /* So */
196: ARGS_DELIM, /* Sq */
197: 0, /* Sm */
198: ARGS_DELIM, /* Sx */
199: ARGS_DELIM, /* Sy */
200: ARGS_DELIM, /* Tn */
201: ARGS_DELIM, /* Ux */
202: ARGS_DELIM, /* Xc */
203: 0, /* Xo */
204: 0, /* Fo */
205: 0, /* Fc */
206: 0, /* Oo */
207: ARGS_DELIM, /* Oc */
208: 0, /* Bk */
209: 0, /* Ek */
210: 0, /* Bt */
211: 0, /* Hf */
212: 0, /* Fr */
213: 0, /* Ud */
1.38 kristaps 214: 0, /* Lb */
1.42 kristaps 215: 0, /* Ap */
1.45 kristaps 216: ARGS_DELIM, /* Lp */
217: ARGS_DELIM | ARGS_QUOTED, /* Lk */
218: ARGS_DELIM | ARGS_QUOTED, /* Mt */
1.48 kristaps 219: ARGS_DELIM, /* Brq */
220: 0, /* Bro */
221: ARGS_DELIM, /* Brc */
1.50 kristaps 222: ARGS_QUOTED, /* %C */
1.52 kristaps 223: 0, /* Es */
224: 0, /* En */
1.53 ! kristaps 225: 0, /* Dx */
1.22 kristaps 226: };
227:
1.1 kristaps 228:
1.39 kristaps 229: /*
230: * Parse an argument from line text. This comes in the form of -key
231: * [value0...], which may either have a single mandatory value, at least
232: * one mandatory value, an optional single value, or no value.
233: */
234: int
235: mdoc_argv(struct mdoc *mdoc, int line, int tok,
236: struct mdoc_arg **v, int *pos, char *buf)
237: {
238: int i;
1.46 kristaps 239: char *p, sv;
1.39 kristaps 240: struct mdoc_argv tmp;
241: struct mdoc_arg *arg;
242:
243: if (0 == buf[*pos])
244: return(ARGV_EOLN);
245:
1.52 kristaps 246: assert(' ' != buf[*pos]);
1.39 kristaps 247:
1.52 kristaps 248: if ('-' != buf[*pos] || ARGS_ARGVLIKE & mdoc_argflags[tok])
1.39 kristaps 249: return(ARGV_WORD);
250:
1.52 kristaps 251: /* Parse through to the first unescaped space. */
252:
1.39 kristaps 253: i = *pos;
254: p = &buf[++(*pos)];
255:
256: assert(*pos > 0);
257:
258: /* LINTED */
259: while (buf[*pos]) {
1.52 kristaps 260: if (' ' == buf[*pos])
1.39 kristaps 261: if ('\\' != buf[*pos - 1])
262: break;
263: (*pos)++;
264: }
265:
1.52 kristaps 266: /* XXX - save zeroed byte, if not an argument. */
1.46 kristaps 267:
1.47 kristaps 268: sv = 0;
1.46 kristaps 269: if (buf[*pos]) {
270: sv = buf[*pos];
1.39 kristaps 271: buf[(*pos)++] = 0;
1.46 kristaps 272: }
1.39 kristaps 273:
274: (void)memset(&tmp, 0, sizeof(struct mdoc_argv));
275: tmp.line = line;
276: tmp.pos = *pos;
277:
1.52 kristaps 278: /* See if our token accepts the argument. */
1.39 kristaps 279:
280: if (MDOC_ARG_MAX == (tmp.arg = argv_a2arg(tok, p))) {
1.52 kristaps 281: /* XXX - restore saved zeroed byte. */
1.47 kristaps 282: if (sv)
283: buf[*pos - 1] = sv;
1.39 kristaps 284: if ( ! pwarn(mdoc, line, i, WARGVPARM))
285: return(ARGV_ERROR);
286: return(ARGV_WORD);
287: }
288:
1.52 kristaps 289: while (buf[*pos] && ' ' == buf[*pos])
1.39 kristaps 290: (*pos)++;
291:
1.51 kristaps 292: if ( ! argv(mdoc, line, &tmp, pos, buf))
1.39 kristaps 293: return(ARGV_ERROR);
294:
295: if (NULL == (arg = *v)) {
1.40 kristaps 296: *v = xcalloc(1, sizeof(struct mdoc_arg));
1.39 kristaps 297: arg = *v;
1.40 kristaps 298: }
1.39 kristaps 299:
300: arg->argc++;
301: arg->argv = xrealloc(arg->argv, arg->argc *
1.40 kristaps 302: sizeof(struct mdoc_argv));
1.39 kristaps 303:
304: (void)memcpy(&arg->argv[(int)arg->argc - 1],
305: &tmp, sizeof(struct mdoc_argv));
306:
307: return(ARGV_ARG);
308: }
309:
310:
311: void
312: mdoc_argv_free(struct mdoc_arg *p)
313: {
314: int i, j;
315:
1.41 kristaps 316: if (NULL == p)
317: return;
318:
1.40 kristaps 319: if (p->refcnt) {
320: --(p->refcnt);
321: if (p->refcnt)
322: return;
323: }
324:
325: assert(p->argc);
1.39 kristaps 326:
327: /* LINTED */
328: for (i = 0; i < (int)p->argc; i++) {
329: if (0 == p->argv[i].sz)
330: continue;
331: /* LINTED */
332: for (j = 0; j < (int)p->argv[i].sz; j++)
333: free(p->argv[i].value[j]);
1.40 kristaps 334:
1.39 kristaps 335: free(p->argv[i].value);
336: }
337:
1.40 kristaps 338: free(p->argv);
1.39 kristaps 339: free(p);
340: }
341:
342:
343:
1.24 kristaps 344: static int
1.39 kristaps 345: perr(struct mdoc *mdoc, int line, int pos, enum merr code)
1.25 kristaps 346: {
1.39 kristaps 347: char *p;
348:
349: p = NULL;
1.25 kristaps 350:
351: switch (code) {
352: case (EQUOTTERM):
1.39 kristaps 353: p = "unterminated quoted parameter";
1.25 kristaps 354: break;
355: case (EARGVAL):
1.39 kristaps 356: p = "argument requires a value";
1.25 kristaps 357: break;
358: }
1.39 kristaps 359:
360: assert(p);
361: return(mdoc_perr(mdoc, line, pos, p));
1.25 kristaps 362: }
363:
364:
365: static int
1.39 kristaps 366: pwarn(struct mdoc *mdoc, int line, int pos, enum mwarn code)
1.24 kristaps 367: {
1.39 kristaps 368: char *p;
1.24 kristaps 369: int c;
370:
1.39 kristaps 371: p = NULL;
372: c = WARN_SYNTAX;
373:
1.24 kristaps 374: switch (code) {
375: case (WQUOTPARM):
1.39 kristaps 376: p = "unexpected quoted parameter";
1.24 kristaps 377: break;
378: case (WARGVPARM):
1.39 kristaps 379: p = "argument-like parameter";
1.24 kristaps 380: break;
1.25 kristaps 381: case (WCOLEMPTY):
1.39 kristaps 382: p = "last list column is empty";
383: c = WARN_COMPAT;
1.25 kristaps 384: break;
385: case (WTAILWS):
1.39 kristaps 386: p = "trailing whitespace";
387: c = WARN_COMPAT;
1.25 kristaps 388: break;
1.24 kristaps 389: }
1.39 kristaps 390:
391: assert(p);
392: return(mdoc_pwarn(mdoc, line, pos, c, p));
1.24 kristaps 393: }
394:
395:
1.2 kristaps 396: int
1.22 kristaps 397: mdoc_args(struct mdoc *mdoc, int line,
398: int *pos, char *buf, int tok, char **v)
1.1 kristaps 399: {
1.26 kristaps 400: int fl, c, i;
1.22 kristaps 401: struct mdoc_node *n;
402:
1.24 kristaps 403: fl = (0 == tok) ? 0 : mdoc_argflags[tok];
404:
405: /*
1.36 kristaps 406: * Override per-macro argument flags with context-specific ones.
407: * As of now, this is only valid for `It' depending on its list
408: * context.
1.24 kristaps 409: */
410:
1.36 kristaps 411: switch (tok) {
412: case (MDOC_It):
1.24 kristaps 413: for (n = mdoc->last; n; n = n->parent)
1.36 kristaps 414: if (MDOC_BLOCK == n->type && MDOC_Bl == n->tok)
415: break;
416:
1.24 kristaps 417: assert(n);
1.39 kristaps 418: c = (int)(n->args ? n->args->argc : 0);
1.24 kristaps 419: assert(c > 0);
1.26 kristaps 420:
1.36 kristaps 421: /*
422: * Using `Bl -column' adds ARGS_TABSEP to the arguments
423: * and invalidates ARGS_DELIM. Using `Bl -diag' allows
424: * for quoted arguments.
425: */
426:
1.26 kristaps 427: /* LINTED */
1.24 kristaps 428: for (i = 0; i < c; i++) {
1.39 kristaps 429: switch (n->args->argv[i].arg) {
1.35 kristaps 430: case (MDOC_Column):
431: fl |= ARGS_TABSEP;
432: fl &= ~ARGS_DELIM;
433: i = c;
434: break;
435: case (MDOC_Diag):
436: fl |= ARGS_QUOTED;
437: i = c;
438: break;
439: default:
440: break;
441: }
1.24 kristaps 442: }
1.39 kristaps 443: break;
1.36 kristaps 444: default:
445: break;
1.24 kristaps 446: }
447:
1.26 kristaps 448: return(args(mdoc, line, pos, buf, fl, v));
449: }
450:
451:
452: static int
453: args(struct mdoc *mdoc, int line,
454: int *pos, char *buf, int fl, char **v)
455: {
1.31 kristaps 456: int i;
1.26 kristaps 457: char *p, *pp;
458:
459: assert(*pos > 0);
460:
461: if (0 == buf[*pos])
462: return(ARGS_EOLN);
463:
464: if ('\"' == buf[*pos] && ! (fl & ARGS_QUOTED))
465: if ( ! pwarn(mdoc, line, *pos, WQUOTPARM))
466: return(ARGS_ERROR);
467:
1.38 kristaps 468: if ( ! (fl & ARGS_ARGVLIKE) && '-' == buf[*pos])
1.26 kristaps 469: if ( ! pwarn(mdoc, line, *pos, WARGVPARM))
470: return(ARGS_ERROR);
471:
1.24 kristaps 472: /*
473: * If the first character is a delimiter and we're to look for
474: * delimited strings, then pass down the buffer seeing if it
475: * follows the pattern of [[::delim::][ ]+]+.
476: */
477:
1.2 kristaps 478: if ((fl & ARGS_DELIM) && mdoc_iscdelim(buf[*pos])) {
1.31 kristaps 479: for (i = *pos; buf[i]; ) {
480: if ( ! mdoc_iscdelim(buf[i]))
1.2 kristaps 481: break;
482: i++;
1.34 kristaps 483: /* There must be at least one space... */
1.52 kristaps 484: if (0 == buf[i] || ' ' != buf[i])
1.34 kristaps 485: break;
486: i++;
1.52 kristaps 487: while (buf[i] && ' ' == buf[i])
1.2 kristaps 488: i++;
489: }
490: if (0 == buf[i]) {
491: *v = &buf[*pos];
492: return(ARGS_PUNCT);
493: }
494: }
495:
1.24 kristaps 496: /* First parse non-quoted strings. */
1.1 kristaps 497:
1.17 kristaps 498: if ('\"' != buf[*pos] || ! (ARGS_QUOTED & fl)) {
1.1 kristaps 499: *v = &buf[*pos];
500:
1.24 kristaps 501: /*
502: * Thar be dragons here! If we're tab-separated, search
1.52 kristaps 503: * ahead for either a tab or the `Ta' macro.
504: * If a `Ta' is detected, it must be space-buffered before and
505: * after. If either of these hold true, then prune out the
1.24 kristaps 506: * extra spaces and call it an argument.
507: */
508:
509: if (ARGS_TABSEP & fl) {
510: /* Scan ahead to unescaped tab. */
1.12 kristaps 511:
1.52 kristaps 512: p = strchr(*v, '\t');
1.24 kristaps 513:
514: /* Scan ahead to unescaped `Ta'. */
515:
516: for (pp = *v; ; pp++) {
517: if (NULL == (pp = strstr(pp, "Ta")))
518: break;
519: if (pp > *v && ' ' != *(pp - 1))
520: continue;
521: if (' ' == *(pp + 2) || 0 == *(pp + 2))
522: break;
523: }
524:
525: /* Choose delimiter tab/Ta. */
526:
527: if (p && pp)
528: p = (p < pp ? p : pp);
529: else if ( ! p && pp)
530: p = pp;
531:
532: /* Strip delimiter's preceding whitespace. */
533:
534: if (p && p > *v) {
535: pp = p - 1;
536: while (pp > *v && ' ' == *pp)
537: pp--;
538: if (pp == *v && ' ' == *pp)
539: *pp = 0;
540: else if (' ' == *pp)
541: *(pp + 1) = 0;
542: }
543:
544: /* ...in- and proceding whitespace. */
545:
546: if (p && ('\t' != *p)) {
547: *p++ = 0;
548: *p++ = 0;
549: } else if (p)
550: *p++ = 0;
551:
552: if (p) {
553: while (' ' == *p)
554: p++;
555: if (0 != *p)
556: *(p - 1) = 0;
1.33 kristaps 557: *pos += (int)(p - *v);
1.24 kristaps 558: }
559:
1.25 kristaps 560: if (p && 0 == *p)
561: if ( ! pwarn(mdoc, line, *pos, WCOLEMPTY))
562: return(0);
563: if (p && 0 == *p && p > *v && ' ' == *(p - 1))
564: if ( ! pwarn(mdoc, line, *pos, WTAILWS))
565: return(0);
566:
1.26 kristaps 567: if (p)
1.49 kristaps 568: return(ARGS_PHRASE);
1.26 kristaps 569:
1.24 kristaps 570: /* Configure the eoln case, too. */
571:
1.26 kristaps 572: p = strchr(*v, 0);
573: assert(p);
574:
575: if (p > *v && ' ' == *(p - 1))
576: if ( ! pwarn(mdoc, line, *pos, WTAILWS))
577: return(0);
1.33 kristaps 578: *pos += (int)(p - *v);
1.24 kristaps 579:
1.49 kristaps 580: return(ARGS_PHRASE);
1.24 kristaps 581: }
1.46 kristaps 582:
1.24 kristaps 583: /* Do non-tabsep look-ahead here. */
584:
585: if ( ! (ARGS_TABSEP & fl))
1.31 kristaps 586: while (buf[*pos]) {
1.52 kristaps 587: if (' ' == buf[*pos])
1.17 kristaps 588: if ('\\' != buf[*pos - 1])
589: break;
1.12 kristaps 590: (*pos)++;
1.17 kristaps 591: }
1.1 kristaps 592:
593: if (0 == buf[*pos])
1.2 kristaps 594: return(ARGS_WORD);
1.1 kristaps 595:
596: buf[(*pos)++] = 0;
1.12 kristaps 597:
1.1 kristaps 598: if (0 == buf[*pos])
1.2 kristaps 599: return(ARGS_WORD);
1.1 kristaps 600:
1.12 kristaps 601: if ( ! (ARGS_TABSEP & fl))
1.52 kristaps 602: while (buf[*pos] && ' ' == buf[*pos])
1.12 kristaps 603: (*pos)++;
1.1 kristaps 604:
605: if (buf[*pos])
1.2 kristaps 606: return(ARGS_WORD);
1.1 kristaps 607:
1.25 kristaps 608: if ( ! pwarn(mdoc, line, *pos, WTAILWS))
1.2 kristaps 609: return(ARGS_ERROR);
1.1 kristaps 610:
1.2 kristaps 611: return(ARGS_WORD);
612: }
613:
614: /*
615: * If we're a quoted string (and quoted strings are allowed),
616: * then parse ahead to the next quote. If none's found, it's an
1.4 kristaps 617: * error. After, parse to the next word.
1.2 kristaps 618: */
1.1 kristaps 619:
620: *v = &buf[++(*pos)];
621:
622: while (buf[*pos] && '\"' != buf[*pos])
623: (*pos)++;
624:
625: if (0 == buf[*pos]) {
1.25 kristaps 626: (void)perr(mdoc, line, *pos, EQUOTTERM);
1.2 kristaps 627: return(ARGS_ERROR);
1.1 kristaps 628: }
629:
630: buf[(*pos)++] = 0;
631: if (0 == buf[*pos])
1.19 kristaps 632: return(ARGS_QWORD);
1.1 kristaps 633:
1.52 kristaps 634: while (buf[*pos] && ' ' == buf[*pos])
1.1 kristaps 635: (*pos)++;
636:
637: if (buf[*pos])
1.19 kristaps 638: return(ARGS_QWORD);
1.1 kristaps 639:
1.25 kristaps 640: if ( ! pwarn(mdoc, line, *pos, WTAILWS))
1.2 kristaps 641: return(ARGS_ERROR);
642:
1.19 kristaps 643: return(ARGS_QWORD);
1.1 kristaps 644: }
645:
646:
1.2 kristaps 647: static int
1.30 kristaps 648: argv_a2arg(int tok, const char *argv)
1.1 kristaps 649: {
650:
1.36 kristaps 651: /*
652: * Parse an argument identifier from its text. XXX - this
653: * should really be table-driven to clarify the code.
654: *
655: * If you add an argument to the list, make sure that you
656: * register it here with its one or more macros!
657: */
658:
1.1 kristaps 659: switch (tok) {
1.6 kristaps 660: case (MDOC_An):
661: if (xstrcmp(argv, "split"))
662: return(MDOC_Split);
663: else if (xstrcmp(argv, "nosplit"))
664: return(MDOC_Nosplit);
665: break;
666:
1.2 kristaps 667: case (MDOC_Bd):
1.1 kristaps 668: if (xstrcmp(argv, "ragged"))
669: return(MDOC_Ragged);
670: else if (xstrcmp(argv, "unfilled"))
671: return(MDOC_Unfilled);
1.13 kristaps 672: else if (xstrcmp(argv, "filled"))
673: return(MDOC_Filled);
1.1 kristaps 674: else if (xstrcmp(argv, "literal"))
675: return(MDOC_Literal);
676: else if (xstrcmp(argv, "file"))
677: return(MDOC_File);
678: else if (xstrcmp(argv, "offset"))
679: return(MDOC_Offset);
1.49 kristaps 680: else if (xstrcmp(argv, "compact"))
681: return(MDOC_Compact);
1.2 kristaps 682: break;
683:
1.8 kristaps 684: case (MDOC_Bf):
685: if (xstrcmp(argv, "emphasis"))
686: return(MDOC_Emphasis);
687: else if (xstrcmp(argv, "literal"))
688: return(MDOC_Literal);
689: else if (xstrcmp(argv, "symbolic"))
690: return(MDOC_Symbolic);
691: break;
692:
1.7 kristaps 693: case (MDOC_Bk):
694: if (xstrcmp(argv, "words"))
695: return(MDOC_Words);
696: break;
697:
1.2 kristaps 698: case (MDOC_Bl):
699: if (xstrcmp(argv, "bullet"))
1.1 kristaps 700: return(MDOC_Bullet);
701: else if (xstrcmp(argv, "dash"))
702: return(MDOC_Dash);
703: else if (xstrcmp(argv, "hyphen"))
704: return(MDOC_Hyphen);
705: else if (xstrcmp(argv, "item"))
706: return(MDOC_Item);
707: else if (xstrcmp(argv, "enum"))
708: return(MDOC_Enum);
709: else if (xstrcmp(argv, "tag"))
710: return(MDOC_Tag);
711: else if (xstrcmp(argv, "diag"))
712: return(MDOC_Diag);
713: else if (xstrcmp(argv, "hang"))
714: return(MDOC_Hang);
715: else if (xstrcmp(argv, "ohang"))
716: return(MDOC_Ohang);
717: else if (xstrcmp(argv, "inset"))
718: return(MDOC_Inset);
719: else if (xstrcmp(argv, "column"))
720: return(MDOC_Column);
721: else if (xstrcmp(argv, "width"))
722: return(MDOC_Width);
1.2 kristaps 723: else if (xstrcmp(argv, "offset"))
724: return(MDOC_Offset);
1.1 kristaps 725: else if (xstrcmp(argv, "compact"))
726: return(MDOC_Compact);
1.50 kristaps 727: else if (xstrcmp(argv, "nested"))
728: return(MDOC_Nested);
1.2 kristaps 729: break;
1.3 kristaps 730:
731: case (MDOC_Rv):
732: /* FALLTHROUGH */
733: case (MDOC_Ex):
734: if (xstrcmp(argv, "std"))
735: return(MDOC_Std);
736: break;
1.1 kristaps 737: default:
1.8 kristaps 738: break;
1.1 kristaps 739: }
740:
741: return(MDOC_ARG_MAX);
742: }
743:
744:
1.2 kristaps 745: static int
1.26 kristaps 746: argv_multi(struct mdoc *mdoc, int line,
1.39 kristaps 747: struct mdoc_argv *v, int *pos, char *buf)
1.12 kristaps 748: {
749: int c, ppos;
750: char *p;
751:
752: ppos = *pos;
753:
1.39 kristaps 754: for (v->sz = 0; ; v->sz++) {
1.12 kristaps 755: if ('-' == buf[*pos])
756: break;
1.26 kristaps 757: c = args(mdoc, line, pos, buf, ARGS_QUOTED, &p);
1.39 kristaps 758: if (ARGS_ERROR == c)
1.12 kristaps 759: return(0);
1.39 kristaps 760: else if (ARGS_EOLN == c)
1.12 kristaps 761: break;
1.39 kristaps 762:
1.52 kristaps 763: if (0 == v->sz % MULTI_STEP)
1.39 kristaps 764: v->value = xrealloc(v->value,
1.52 kristaps 765: (v->sz + MULTI_STEP) * sizeof(char *));
1.39 kristaps 766:
1.40 kristaps 767: v->value[(int)v->sz] = xstrdup(p);
1.12 kristaps 768: }
769:
1.39 kristaps 770: if (v->sz)
1.12 kristaps 771: return(1);
772:
1.39 kristaps 773: return(perr(mdoc, line, ppos, EARGVAL));
1.12 kristaps 774: }
775:
776:
777: static int
1.36 kristaps 778: argv_opt_single(struct mdoc *mdoc, int line,
1.39 kristaps 779: struct mdoc_argv *v, int *pos, char *buf)
1.36 kristaps 780: {
1.39 kristaps 781: int c;
1.36 kristaps 782: char *p;
783:
784: if ('-' == buf[*pos])
785: return(1);
786:
787: c = args(mdoc, line, pos, buf, ARGS_QUOTED, &p);
788: if (ARGS_ERROR == c)
789: return(0);
790: if (ARGS_EOLN == c)
791: return(1);
792:
793: v->sz = 1;
794: v->value = xcalloc(1, sizeof(char *));
1.40 kristaps 795: v->value[0] = xstrdup(p);
1.36 kristaps 796: return(1);
797: }
798:
799:
800: /*
801: * Parse a single, mandatory value from the stream.
802: */
803: static int
1.26 kristaps 804: argv_single(struct mdoc *mdoc, int line,
1.39 kristaps 805: struct mdoc_argv *v, int *pos, char *buf)
1.1 kristaps 806: {
1.12 kristaps 807: int c, ppos;
1.1 kristaps 808: char *p;
809:
810: ppos = *pos;
811:
1.26 kristaps 812: c = args(mdoc, line, pos, buf, ARGS_QUOTED, &p);
1.12 kristaps 813: if (ARGS_ERROR == c)
814: return(0);
815: if (ARGS_EOLN == c)
1.36 kristaps 816: return(perr(mdoc, line, ppos, EARGVAL));
1.12 kristaps 817:
818: v->sz = 1;
819: v->value = xcalloc(1, sizeof(char *));
1.40 kristaps 820: v->value[0] = xstrdup(p);
1.12 kristaps 821: return(1);
822: }
823:
824:
1.36 kristaps 825: /*
826: * Determine rules for parsing arguments. Arguments can either accept
827: * no parameters, an optional single parameter, one parameter, or
828: * multiple parameters.
829: */
1.12 kristaps 830: static int
1.51 kristaps 831: argv(struct mdoc *mdoc, int line,
1.39 kristaps 832: struct mdoc_argv *v, int *pos, char *buf)
1.12 kristaps 833: {
834:
835: v->sz = 0;
836: v->value = NULL;
837:
1.50 kristaps 838: switch (mdoc_argvflags[v->arg]) {
1.36 kristaps 839: case (ARGV_SINGLE):
1.26 kristaps 840: return(argv_single(mdoc, line, v, pos, buf));
1.36 kristaps 841: case (ARGV_MULTI):
1.26 kristaps 842: return(argv_multi(mdoc, line, v, pos, buf));
1.36 kristaps 843: case (ARGV_OPT_SINGLE):
844: return(argv_opt_single(mdoc, line, v, pos, buf));
1.1 kristaps 845: default:
1.36 kristaps 846: /* ARGV_NONE */
1.6 kristaps 847: break;
1.1 kristaps 848: }
849:
850: return(1);
851: }
CVSweb