Annotation of mandoc/mdoc_argv.c, Revision 1.75
1.75 ! kristaps 1: /* $Id: mdoc_argv.c,v 1.74 2011/04/07 01:08:42 joerg Exp $ */
1.1 kristaps 2: /*
1.56 schwarze 3: * Copyright (c) 2008, 2009, 2010 Kristaps Dzonsons <kristaps@bsd.lv>
1.1 kristaps 4: *
5: * Permission to use, copy, modify, and distribute this software for any
1.3 kristaps 6: * purpose with or without fee is hereby granted, provided that the above
7: * copyright notice and this permission notice appear in all copies.
1.1 kristaps 8: *
1.3 kristaps 9: * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
10: * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
11: * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
12: * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
13: * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
14: * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
15: * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
1.1 kristaps 16: */
1.33 kristaps 17: #ifdef HAVE_CONFIG_H
18: #include "config.h"
19: #endif
20:
1.1 kristaps 21: #include <sys/types.h>
22:
23: #include <assert.h>
24: #include <ctype.h>
25: #include <stdlib.h>
26: #include <stdio.h>
27: #include <string.h>
28:
1.72 kristaps 29: #include "mdoc.h"
1.49 kristaps 30: #include "mandoc.h"
1.1 kristaps 31: #include "libmdoc.h"
1.31 kristaps 32: #include "libmandoc.h"
1.1 kristaps 33:
#define	MULTI_STEP	 5 /* pre-allocate argument values */

/*
 * File-local helpers.  All of the argv*() parsers share one signature:
 * parse state, input line number, the argument being filled in, the
 * current offset into the line buffer, and the line buffer itself.
 */
static	enum mdocargt	 argv_a2arg(enum mdoct tok, const char *p);
static	enum margserr	 args(struct mdoc *m, int line, int *pos,
				char *buf, int fl, char **v);
static	int		 args_checkpunct(struct mdoc *m,
				const char *buf, int i, int ln, int fl);
static	int		 argv(struct mdoc *mdoc, int line,
				struct mdoc_argv *v, int *pos, char *buf);
static	int		 argv_single(struct mdoc *m, int line,
				struct mdoc_argv *v, int *pos, char *buf);
static	int		 argv_opt_single(struct mdoc *m, int line,
				struct mdoc_argv *v, int *pos, char *buf);
static	int		 argv_multi(struct mdoc *m, int line,
				struct mdoc_argv *v, int *pos, char *buf);
static	void		 argn_free(struct mdoc_arg *p, int iarg);

/*
 * How many values a given `-flag' takes.  ARGV_NONE is explicitly
 * zero, so it is also what a zero-initialised table slot means.
 */
enum	argvflag {
	ARGV_NONE = 0, /* no args to flag (e.g., -split) */
	ARGV_SINGLE, /* one arg to flag (e.g., -file xxx) */
	ARGV_MULTI, /* multiple args (e.g., -column xxx yyy) */
	ARGV_OPT_SINGLE /* optional arg (e.g., -offset [xxx]) */
};
1.1 kristaps 57:
1.68 kristaps 58: static const enum argvflag argvflags[MDOC_ARG_MAX] = {
1.1 kristaps 59: ARGV_NONE, /* MDOC_Split */
60: ARGV_NONE, /* MDOC_Nosplit */
61: ARGV_NONE, /* MDOC_Ragged */
62: ARGV_NONE, /* MDOC_Unfilled */
63: ARGV_NONE, /* MDOC_Literal */
1.29 kristaps 64: ARGV_SINGLE, /* MDOC_File */
1.26 kristaps 65: ARGV_OPT_SINGLE, /* MDOC_Offset */
1.1 kristaps 66: ARGV_NONE, /* MDOC_Bullet */
67: ARGV_NONE, /* MDOC_Dash */
68: ARGV_NONE, /* MDOC_Hyphen */
69: ARGV_NONE, /* MDOC_Item */
70: ARGV_NONE, /* MDOC_Enum */
71: ARGV_NONE, /* MDOC_Tag */
72: ARGV_NONE, /* MDOC_Diag */
73: ARGV_NONE, /* MDOC_Hang */
74: ARGV_NONE, /* MDOC_Ohang */
75: ARGV_NONE, /* MDOC_Inset */
76: ARGV_MULTI, /* MDOC_Column */
77: ARGV_SINGLE, /* MDOC_Width */
78: ARGV_NONE, /* MDOC_Compact */
1.25 kristaps 79: ARGV_NONE, /* MDOC_Std */
1.1 kristaps 80: ARGV_NONE, /* MDOC_Filled */
81: ARGV_NONE, /* MDOC_Words */
82: ARGV_NONE, /* MDOC_Emphasis */
83: ARGV_NONE, /* MDOC_Symbolic */
84: ARGV_NONE /* MDOC_Symbolic */
85: };
86:
1.68 kristaps 87: static const int argflags[MDOC_MAX] = {
1.5 kristaps 88: 0, /* Ap */
1.1 kristaps 89: 0, /* Dd */
90: 0, /* Dt */
91: 0, /* Os */
1.17 kristaps 92: 0, /* Sh */
93: 0, /* Ss */
1.59 kristaps 94: 0, /* Pp */
1.1 kristaps 95: ARGS_DELIM, /* D1 */
1.17 kristaps 96: ARGS_DELIM, /* Dl */
1.1 kristaps 97: 0, /* Bd */
98: 0, /* Ed */
1.17 kristaps 99: 0, /* Bl */
1.1 kristaps 100: 0, /* El */
101: 0, /* It */
102: ARGS_DELIM, /* Ad */
103: ARGS_DELIM, /* An */
1.17 kristaps 104: ARGS_DELIM, /* Ar */
105: 0, /* Cd */
1.1 kristaps 106: ARGS_DELIM, /* Cm */
107: ARGS_DELIM, /* Dv */
108: ARGS_DELIM, /* Er */
109: ARGS_DELIM, /* Ev */
110: 0, /* Ex */
1.17 kristaps 111: ARGS_DELIM, /* Fa */
1.1 kristaps 112: 0, /* Fd */
113: ARGS_DELIM, /* Fl */
1.17 kristaps 114: ARGS_DELIM, /* Fn */
115: ARGS_DELIM, /* Ft */
1.1 kristaps 116: ARGS_DELIM, /* Ic */
117: 0, /* In */
1.17 kristaps 118: ARGS_DELIM, /* Li */
119: 0, /* Nd */
1.1 kristaps 120: ARGS_DELIM, /* Nm */
121: ARGS_DELIM, /* Op */
122: 0, /* Ot */
123: ARGS_DELIM, /* Pa */
124: 0, /* Rv */
1.15 kristaps 125: ARGS_DELIM, /* St */
1.1 kristaps 126: ARGS_DELIM, /* Va */
127: ARGS_DELIM, /* Vt */
128: ARGS_DELIM, /* Xr */
1.17 kristaps 129: 0, /* %A */
130: 0, /* %B */
131: 0, /* %D */
132: 0, /* %I */
133: 0, /* %J */
134: 0, /* %N */
135: 0, /* %O */
136: 0, /* %P */
137: 0, /* %R */
138: 0, /* %T */
139: 0, /* %V */
1.1 kristaps 140: ARGS_DELIM, /* Ac */
141: 0, /* Ao */
142: ARGS_DELIM, /* Aq */
143: ARGS_DELIM, /* At */
144: ARGS_DELIM, /* Bc */
145: 0, /* Bf */
146: 0, /* Bo */
147: ARGS_DELIM, /* Bq */
148: ARGS_DELIM, /* Bsx */
149: ARGS_DELIM, /* Bx */
150: 0, /* Db */
151: ARGS_DELIM, /* Dc */
152: 0, /* Do */
153: ARGS_DELIM, /* Dq */
154: ARGS_DELIM, /* Ec */
155: 0, /* Ef */
156: ARGS_DELIM, /* Em */
157: 0, /* Eo */
158: ARGS_DELIM, /* Fx */
159: ARGS_DELIM, /* Ms */
160: ARGS_DELIM, /* No */
161: ARGS_DELIM, /* Ns */
162: ARGS_DELIM, /* Nx */
163: ARGS_DELIM, /* Ox */
164: ARGS_DELIM, /* Pc */
165: ARGS_DELIM, /* Pf */
166: 0, /* Po */
167: ARGS_DELIM, /* Pq */
168: ARGS_DELIM, /* Qc */
169: ARGS_DELIM, /* Ql */
170: 0, /* Qo */
171: ARGS_DELIM, /* Qq */
172: 0, /* Re */
173: 0, /* Rs */
174: ARGS_DELIM, /* Sc */
175: 0, /* So */
176: ARGS_DELIM, /* Sq */
177: 0, /* Sm */
178: ARGS_DELIM, /* Sx */
1.17 kristaps 179: ARGS_DELIM, /* Sy */
1.1 kristaps 180: ARGS_DELIM, /* Tn */
181: ARGS_DELIM, /* Ux */
182: ARGS_DELIM, /* Xc */
183: 0, /* Xo */
1.17 kristaps 184: 0, /* Fo */
1.1 kristaps 185: 0, /* Fc */
186: 0, /* Oo */
187: ARGS_DELIM, /* Oc */
188: 0, /* Bk */
189: 0, /* Ek */
190: 0, /* Bt */
191: 0, /* Hf */
192: 0, /* Fr */
193: 0, /* Ud */
194: 0, /* Lb */
1.60 schwarze 195: 0, /* Lp */
1.17 kristaps 196: ARGS_DELIM, /* Lk */
197: ARGS_DELIM, /* Mt */
1.1 kristaps 198: ARGS_DELIM, /* Brq */
199: 0, /* Bro */
200: ARGS_DELIM, /* Brc */
1.17 kristaps 201: 0, /* %C */
1.1 kristaps 202: 0, /* Es */
203: 0, /* En */
204: 0, /* Dx */
1.17 kristaps 205: 0, /* %Q */
1.14 kristaps 206: 0, /* br */
207: 0, /* sp */
1.30 kristaps 208: 0, /* %U */
1.51 kristaps 209: 0, /* Ta */
1.1 kristaps 210: };
211:
1.73 kristaps 212: static const enum mdocargt args_Ex[] = {
213: MDOC_Std,
214: MDOC_ARG_MAX
215: };
216:
217: static const enum mdocargt args_An[] = {
218: MDOC_Split,
219: MDOC_Nosplit,
220: MDOC_ARG_MAX
221: };
222:
223: static const enum mdocargt args_Bd[] = {
224: MDOC_Ragged,
225: MDOC_Unfilled,
226: MDOC_Filled,
227: MDOC_Literal,
228: MDOC_File,
229: MDOC_Offset,
230: MDOC_Compact,
231: MDOC_Centred,
232: MDOC_ARG_MAX
233: };
234:
235: static const enum mdocargt args_Bf[] = {
236: MDOC_Emphasis,
237: MDOC_Literal,
238: MDOC_Symbolic,
239: MDOC_ARG_MAX
240: };
241:
242: static const enum mdocargt args_Bk[] = {
243: MDOC_Words,
244: MDOC_ARG_MAX
245: };
246:
247: static const enum mdocargt args_Bl[] = {
248: MDOC_Bullet,
249: MDOC_Dash,
250: MDOC_Hyphen,
251: MDOC_Item,
252: MDOC_Enum,
253: MDOC_Tag,
254: MDOC_Diag,
255: MDOC_Hang,
256: MDOC_Ohang,
257: MDOC_Inset,
258: MDOC_Column,
259: MDOC_Width,
260: MDOC_Offset,
261: MDOC_Compact,
262: MDOC_Nested,
263: MDOC_ARG_MAX
264: };
265:
1.1 kristaps 266: /*
267: * Parse an argument from line text. This comes in the form of -key
268: * [value0...], which may either have a single mandatory value, at least
269: * one mandatory value, an optional single value, or no value.
270: */
1.40 kristaps 271: enum margverr
1.35 kristaps 272: mdoc_argv(struct mdoc *m, int line, enum mdoct tok,
1.1 kristaps 273: struct mdoc_arg **v, int *pos, char *buf)
274: {
275: char *p, sv;
276: struct mdoc_argv tmp;
277: struct mdoc_arg *arg;
278:
1.52 kristaps 279: if ('\0' == buf[*pos])
1.1 kristaps 280: return(ARGV_EOLN);
281:
282: assert(' ' != buf[*pos]);
283:
284: /* Parse through to the first unescaped space. */
285:
286: p = &buf[++(*pos)];
287:
288: assert(*pos > 0);
289:
290: /* LINTED */
291: while (buf[*pos]) {
292: if (' ' == buf[*pos])
293: if ('\\' != buf[*pos - 1])
294: break;
295: (*pos)++;
296: }
297:
298: /* XXX - save zeroed byte, if not an argument. */
299:
1.52 kristaps 300: sv = '\0';
1.1 kristaps 301: if (buf[*pos]) {
302: sv = buf[*pos];
1.52 kristaps 303: buf[(*pos)++] = '\0';
1.1 kristaps 304: }
305:
1.68 kristaps 306: memset(&tmp, 0, sizeof(struct mdoc_argv));
1.1 kristaps 307: tmp.line = line;
308: tmp.pos = *pos;
309:
310: /* See if our token accepts the argument. */
311:
312: if (MDOC_ARG_MAX == (tmp.arg = argv_a2arg(tok, p))) {
313: /* XXX - restore saved zeroed byte. */
314: if (sv)
315: buf[*pos - 1] = sv;
316: return(ARGV_WORD);
317: }
318:
319: while (buf[*pos] && ' ' == buf[*pos])
320: (*pos)++;
321:
1.11 kristaps 322: if ( ! argv(m, line, &tmp, pos, buf))
1.1 kristaps 323: return(ARGV_ERROR);
324:
1.31 kristaps 325: if (NULL == (arg = *v))
1.32 kristaps 326: arg = *v = mandoc_calloc(1, sizeof(struct mdoc_arg));
1.1 kristaps 327:
328: arg->argc++;
1.31 kristaps 329: arg->argv = mandoc_realloc
330: (arg->argv, arg->argc * sizeof(struct mdoc_argv));
1.2 kristaps 331:
1.68 kristaps 332: memcpy(&arg->argv[(int)arg->argc - 1],
1.1 kristaps 333: &tmp, sizeof(struct mdoc_argv));
334:
335: return(ARGV_ARG);
336: }
337:
338: void
339: mdoc_argv_free(struct mdoc_arg *p)
340: {
1.37 kristaps 341: int i;
1.1 kristaps 342:
343: if (NULL == p)
344: return;
345:
346: if (p->refcnt) {
347: --(p->refcnt);
348: if (p->refcnt)
349: return;
350: }
351: assert(p->argc);
352:
1.37 kristaps 353: for (i = (int)p->argc - 1; i >= 0; i--)
1.71 kristaps 354: argn_free(p, i);
1.37 kristaps 355:
356: free(p->argv);
357: free(p);
358: }
359:
1.71 kristaps 360: static void
361: argn_free(struct mdoc_arg *p, int iarg)
1.37 kristaps 362: {
1.58 kristaps 363: struct mdoc_argv *arg;
1.37 kristaps 364: int j;
1.58 kristaps 365:
366: arg = &p->argv[iarg];
1.1 kristaps 367:
1.37 kristaps 368: if (arg->sz && arg->value) {
369: for (j = (int)arg->sz - 1; j >= 0; j--)
370: free(arg->value[j]);
371: free(arg->value);
1.1 kristaps 372: }
373:
1.37 kristaps 374: for (--p->argc; iarg < (int)p->argc; iarg++)
375: p->argv[iarg] = p->argv[iarg+1];
1.1 kristaps 376: }
377:
1.39 kristaps 378: enum margserr
1.23 kristaps 379: mdoc_zargs(struct mdoc *m, int line, int *pos,
380: char *buf, int flags, char **v)
1.19 kristaps 381: {
382:
1.23 kristaps 383: return(args(m, line, pos, buf, flags, v));
1.19 kristaps 384: }
385:
1.39 kristaps 386: enum margserr
1.35 kristaps 387: mdoc_args(struct mdoc *m, int line, int *pos,
388: char *buf, enum mdoct tok, char **v)
1.1 kristaps 389: {
1.50 kristaps 390: int fl;
1.1 kristaps 391: struct mdoc_node *n;
392:
1.68 kristaps 393: fl = argflags[tok];
1.1 kristaps 394:
1.17 kristaps 395: if (MDOC_It != tok)
396: return(args(m, line, pos, buf, fl, v));
397:
1.51 kristaps 398: /*
399: * We know that we're in an `It', so it's reasonable to expect
400: * us to be sitting in a `Bl'. Someday this may not be the case
401: * (if we allow random `It's sitting out there), so provide a
402: * safe fall-back into the default behaviour.
403: */
404:
1.17 kristaps 405: for (n = m->last; n; n = n->parent)
1.50 kristaps 406: if (MDOC_Bl == n->tok)
1.17 kristaps 407: break;
1.1 kristaps 408:
1.62 kristaps 409: if (n && LIST_column == n->norm->Bl.type) {
1.17 kristaps 410: fl |= ARGS_TABSEP;
411: fl &= ~ARGS_DELIM;
1.1 kristaps 412: }
413:
1.11 kristaps 414: return(args(m, line, pos, buf, fl, v));
1.1 kristaps 415: }
416:
1.39 kristaps 417: static enum margserr
1.13 kristaps 418: args(struct mdoc *m, int line, int *pos,
419: char *buf, int fl, char **v)
1.1 kristaps 420: {
1.52 kristaps 421: char *p, *pp;
422: enum margserr rc;
1.1 kristaps 423:
1.24 kristaps 424: /*
425: * Parse out the terms (like `val' in `.Xx -arg val' or simply
426: * `.Xx val'), which can have all sorts of properties:
427: *
428: * ARGS_DELIM: use special handling if encountering trailing
429: * delimiters in the form of [[::delim::][ ]+]+.
430: *
431: * ARGS_NOWARN: don't post warnings. This is only used when
432: * re-parsing delimiters, as the warnings have already been
433: * posted.
434: *
435: * ARGS_TABSEP: use special handling for tab/`Ta' separated
436: * phrases like in `Bl -column'.
437: */
438:
1.17 kristaps 439: assert(' ' != buf[*pos]);
1.1 kristaps 440:
1.46 kristaps 441: if ('\0' == buf[*pos]) {
1.47 kristaps 442: if (MDOC_PPHRASE & m->flags)
1.46 kristaps 443: return(ARGS_EOLN);
444: /*
445: * If we're not in a partial phrase and the flag for
446: * being a phrase literal is still set, the punctuation
447: * is unterminated.
448: */
449: if (MDOC_PHRASELIT & m->flags)
1.67 kristaps 450: mdoc_pmsg(m, line, *pos, MANDOCERR_BADQUOTE);
1.46 kristaps 451:
452: m->flags &= ~MDOC_PHRASELIT;
1.1 kristaps 453: return(ARGS_EOLN);
1.46 kristaps 454: }
1.1 kristaps 455:
1.64 kristaps 456: *v = &buf[*pos];
1.17 kristaps 457:
1.69 kristaps 458: if (ARGS_DELIM & fl && args_checkpunct(m, buf, *pos, line, fl))
1.64 kristaps 459: return(ARGS_PUNCT);
1.1 kristaps 460:
1.17 kristaps 461: /*
462: * First handle TABSEP items, restricted to `Bl -column'. This
463: * ignores conventional token parsing and instead uses tabs or
464: * `Ta' macros to separate phrases. Phrases are parsed again
465: * for arguments at a later phase.
466: */
1.1 kristaps 467:
1.17 kristaps 468: if (ARGS_TABSEP & fl) {
1.20 kristaps 469: /* Scan ahead to tab (can't be escaped). */
1.17 kristaps 470: p = strchr(*v, '\t');
1.46 kristaps 471: pp = NULL;
1.17 kristaps 472:
473: /* Scan ahead to unescaped `Ta'. */
1.46 kristaps 474: if ( ! (MDOC_PHRASELIT & m->flags))
475: for (pp = *v; ; pp++) {
476: if (NULL == (pp = strstr(pp, "Ta")))
477: break;
478: if (pp > *v && ' ' != *(pp - 1))
479: continue;
1.51 kristaps 480: if (' ' == *(pp + 2) || '\0' == *(pp + 2))
1.46 kristaps 481: break;
482: }
1.17 kristaps 483:
1.42 kristaps 484: /* By default, assume a phrase. */
485: rc = ARGS_PHRASE;
486:
1.21 kristaps 487: /*
488: * Adjust new-buffer position to be beyond delimiter
489: * mark (e.g., Ta -> end + 2).
490: */
1.20 kristaps 491: if (p && pp) {
492: *pos += pp < p ? 2 : 1;
1.42 kristaps 493: rc = pp < p ? ARGS_PHRASE : ARGS_PPHRASE;
1.20 kristaps 494: p = pp < p ? pp : p;
495: } else if (p && ! pp) {
1.42 kristaps 496: rc = ARGS_PPHRASE;
1.20 kristaps 497: *pos += 1;
498: } else if (pp && ! p) {
1.17 kristaps 499: p = pp;
1.20 kristaps 500: *pos += 2;
1.44 kristaps 501: } else {
502: rc = ARGS_PEND;
1.20 kristaps 503: p = strchr(*v, 0);
1.44 kristaps 504: }
1.20 kristaps 505:
1.21 kristaps 506: /* Whitespace check for eoln case... */
1.52 kristaps 507: if ('\0' == *p && ' ' == *(p - 1) && ! (ARGS_NOWARN & fl))
1.67 kristaps 508: mdoc_pmsg(m, line, *pos, MANDOCERR_EOLNSPACE);
1.20 kristaps 509:
510: *pos += (int)(p - *v);
1.17 kristaps 511:
512: /* Strip delimiter's preceding whitespace. */
1.20 kristaps 513: pp = p - 1;
514: while (pp > *v && ' ' == *pp) {
515: if (pp > *v && '\\' == *(pp - 1))
516: break;
517: pp--;
1.17 kristaps 518: }
1.20 kristaps 519: *(pp + 1) = 0;
1.17 kristaps 520:
1.20 kristaps 521: /* Strip delimiter's proceeding whitespace. */
522: for (pp = &buf[*pos]; ' ' == *pp; pp++, (*pos)++)
523: /* Skip ahead. */ ;
1.1 kristaps 524:
1.41 kristaps 525: return(rc);
1.17 kristaps 526: }
1.1 kristaps 527:
1.17 kristaps 528: /*
529: * Process a quoted literal. A quote begins with a double-quote
530: * and ends with a double-quote NOT preceded by a double-quote.
531: * Whitespace is NOT involved in literal termination.
532: */
1.1 kristaps 533:
1.46 kristaps 534: if (MDOC_PHRASELIT & m->flags || '\"' == buf[*pos]) {
535: if ( ! (MDOC_PHRASELIT & m->flags))
536: *v = &buf[++(*pos)];
537:
1.47 kristaps 538: if (MDOC_PPHRASE & m->flags)
1.46 kristaps 539: m->flags |= MDOC_PHRASELIT;
1.1 kristaps 540:
1.17 kristaps 541: for ( ; buf[*pos]; (*pos)++) {
542: if ('\"' != buf[*pos])
543: continue;
544: if ('\"' != buf[*pos + 1])
545: break;
546: (*pos)++;
547: }
1.1 kristaps 548:
1.46 kristaps 549: if ('\0' == buf[*pos]) {
1.47 kristaps 550: if (ARGS_NOWARN & fl || MDOC_PPHRASE & m->flags)
1.23 kristaps 551: return(ARGS_QWORD);
1.67 kristaps 552: mdoc_pmsg(m, line, *pos, MANDOCERR_BADQUOTE);
1.18 kristaps 553: return(ARGS_QWORD);
1.17 kristaps 554: }
1.1 kristaps 555:
1.46 kristaps 556: m->flags &= ~MDOC_PHRASELIT;
557: buf[(*pos)++] = '\0';
1.1 kristaps 558:
1.46 kristaps 559: if ('\0' == buf[*pos])
1.17 kristaps 560: return(ARGS_QWORD);
1.1 kristaps 561:
1.17 kristaps 562: while (' ' == buf[*pos])
563: (*pos)++;
1.1 kristaps 564:
1.23 kristaps 565: if (0 == buf[*pos] && ! (ARGS_NOWARN & fl))
1.67 kristaps 566: mdoc_pmsg(m, line, *pos, MANDOCERR_EOLNSPACE);
1.1 kristaps 567:
1.17 kristaps 568: return(ARGS_QWORD);
1.1 kristaps 569: }
570:
1.75 ! kristaps 571: p = &buf[*pos];
! 572: *v = mandoc_getarg(m->parse, &p, line,
! 573: ! (ARGS_NOWARN & fl), pos);
1.1 kristaps 574:
1.17 kristaps 575: return(ARGS_WORD);
1.64 kristaps 576: }
577:
578: /*
579: * Check if the string consists only of space-separated closing
1.65 kristaps 580: * delimiters. This is a bit of a dance: the first must be a close
581: * delimiter, but it may be followed by middle delimiters. Arbitrary
582: * whitespace may separate these tokens.
1.64 kristaps 583: */
584: static int
1.69 kristaps 585: args_checkpunct(struct mdoc *m, const char *buf, int i, int ln, int fl)
1.64 kristaps 586: {
1.69 kristaps 587: int j;
588: char dbuf[DELIMSZ];
1.64 kristaps 589: enum mdelim d;
590:
1.65 kristaps 591: /* First token must be a close-delimiter. */
592:
1.69 kristaps 593: for (j = 0; buf[i] && ' ' != buf[i] && j < DELIMSZ; j++, i++)
594: dbuf[j] = buf[i];
1.65 kristaps 595:
596: if (DELIMSZ == j)
597: return(0);
598:
1.69 kristaps 599: dbuf[j] = '\0';
1.70 kristaps 600: if (DELIM_CLOSE != mdoc_isdelim(dbuf))
1.64 kristaps 601: return(0);
602:
1.69 kristaps 603: while (' ' == buf[i])
1.65 kristaps 604: i++;
605:
606: /* Remaining must NOT be open/none. */
607:
1.69 kristaps 608: while (buf[i]) {
1.65 kristaps 609: j = 0;
1.69 kristaps 610: while (buf[i] && ' ' != buf[i] && j < DELIMSZ)
611: dbuf[j++] = buf[i++];
1.65 kristaps 612:
613: if (DELIMSZ == j)
614: return(0);
615:
1.69 kristaps 616: dbuf[j] = '\0';
1.70 kristaps 617: d = mdoc_isdelim(dbuf);
1.64 kristaps 618: if (DELIM_NONE == d || DELIM_OPEN == d)
1.65 kristaps 619: return(0);
620:
1.69 kristaps 621: while (' ' == buf[i])
1.64 kristaps 622: i++;
623: }
624:
1.69 kristaps 625: if ( ! (ARGS_NOWARN & fl) && i && ' ' == buf[i - 1])
626: mdoc_pmsg(m, ln, i - 1, MANDOCERR_EOLNSPACE);
627:
628: return('\0' == buf[i]);
1.1 kristaps 629: }
630:
1.63 kristaps 631: /*
632: * Match up an argument string (e.g., `-foo bar' having "foo") with the
633: * correrct identifier. It must apply to the given macro. If none was
634: * found (including bad matches), return MDOC_ARG_MAX.
635: */
1.57 kristaps 636: static enum mdocargt
1.35 kristaps 637: argv_a2arg(enum mdoct tok, const char *p)
1.1 kristaps 638: {
1.74 joerg 639: const enum mdocargt *argsp;
1.1 kristaps 640:
1.74 joerg 641: argsp = NULL;
1.1 kristaps 642:
643: switch (tok) {
644: case (MDOC_An):
1.74 joerg 645: argsp = args_An;
1.1 kristaps 646: break;
647: case (MDOC_Bd):
1.74 joerg 648: argsp = args_Bd;
1.1 kristaps 649: break;
650: case (MDOC_Bf):
1.74 joerg 651: argsp = args_Bf;
1.1 kristaps 652: break;
653: case (MDOC_Bk):
1.74 joerg 654: argsp = args_Bk;
1.1 kristaps 655: break;
656: case (MDOC_Bl):
1.74 joerg 657: argsp = args_Bl;
1.1 kristaps 658: break;
659: case (MDOC_Rv):
660: /* FALLTHROUGH */
661: case (MDOC_Ex):
1.74 joerg 662: argsp = args_Ex;
1.1 kristaps 663: break;
664: default:
1.73 kristaps 665: return(MDOC_ARG_MAX);
1.1 kristaps 666: }
1.63 kristaps 667:
1.74 joerg 668: assert(argsp);
1.73 kristaps 669:
1.74 joerg 670: for ( ; MDOC_ARG_MAX != *argsp ; argsp++)
671: if (0 == strcmp(p, mdoc_argnames[*argsp]))
672: return(*argsp);
1.1 kristaps 673:
674: return(MDOC_ARG_MAX);
675: }
676:
677: static int
1.11 kristaps 678: argv_multi(struct mdoc *m, int line,
1.1 kristaps 679: struct mdoc_argv *v, int *pos, char *buf)
680: {
1.43 kristaps 681: enum margserr ac;
1.1 kristaps 682: char *p;
683:
684: for (v->sz = 0; ; v->sz++) {
685: if ('-' == buf[*pos])
686: break;
1.43 kristaps 687: ac = args(m, line, pos, buf, 0, &p);
688: if (ARGS_ERROR == ac)
1.1 kristaps 689: return(0);
1.43 kristaps 690: else if (ARGS_EOLN == ac)
1.1 kristaps 691: break;
692:
1.31 kristaps 693: if (0 == v->sz % MULTI_STEP)
694: v->value = mandoc_realloc(v->value,
1.1 kristaps 695: (v->sz + MULTI_STEP) * sizeof(char *));
1.31 kristaps 696:
697: v->value[(int)v->sz] = mandoc_strdup(p);
1.1 kristaps 698: }
699:
1.7 kristaps 700: return(1);
1.1 kristaps 701: }
702:
703: static int
1.11 kristaps 704: argv_opt_single(struct mdoc *m, int line,
1.1 kristaps 705: struct mdoc_argv *v, int *pos, char *buf)
706: {
1.43 kristaps 707: enum margserr ac;
1.1 kristaps 708: char *p;
709:
710: if ('-' == buf[*pos])
711: return(1);
712:
1.43 kristaps 713: ac = args(m, line, pos, buf, 0, &p);
714: if (ARGS_ERROR == ac)
1.1 kristaps 715: return(0);
1.43 kristaps 716: if (ARGS_EOLN == ac)
1.1 kristaps 717: return(1);
718:
719: v->sz = 1;
1.31 kristaps 720: v->value = mandoc_malloc(sizeof(char *));
721: v->value[0] = mandoc_strdup(p);
1.2 kristaps 722:
1.1 kristaps 723: return(1);
724: }
725:
726: /*
727: * Parse a single, mandatory value from the stream.
728: */
729: static int
1.11 kristaps 730: argv_single(struct mdoc *m, int line,
1.1 kristaps 731: struct mdoc_argv *v, int *pos, char *buf)
732: {
1.43 kristaps 733: int ppos;
734: enum margserr ac;
1.1 kristaps 735: char *p;
736:
737: ppos = *pos;
738:
1.43 kristaps 739: ac = args(m, line, pos, buf, 0, &p);
1.49 kristaps 740: if (ARGS_EOLN == ac) {
741: mdoc_pmsg(m, line, ppos, MANDOCERR_SYNTARGVCOUNT);
742: return(0);
743: } else if (ARGS_ERROR == ac)
1.1 kristaps 744: return(0);
745:
746: v->sz = 1;
1.31 kristaps 747: v->value = mandoc_malloc(sizeof(char *));
748: v->value[0] = mandoc_strdup(p);
1.2 kristaps 749:
1.1 kristaps 750: return(1);
751: }
752:
753: /*
754: * Determine rules for parsing arguments. Arguments can either accept
755: * no parameters, an optional single parameter, one parameter, or
756: * multiple parameters.
757: */
758: static int
759: argv(struct mdoc *mdoc, int line,
760: struct mdoc_argv *v, int *pos, char *buf)
761: {
762:
763: v->sz = 0;
764: v->value = NULL;
765:
1.68 kristaps 766: switch (argvflags[v->arg]) {
1.1 kristaps 767: case (ARGV_SINGLE):
768: return(argv_single(mdoc, line, v, pos, buf));
769: case (ARGV_MULTI):
770: return(argv_multi(mdoc, line, v, pos, buf));
771: case (ARGV_OPT_SINGLE):
772: return(argv_opt_single(mdoc, line, v, pos, buf));
1.68 kristaps 773: case (ARGV_NONE):
774: break;
1.1 kristaps 775: default:
1.68 kristaps 776: abort();
777: /* NOTREACHED */
1.1 kristaps 778: }
779:
780: return(1);
781: }
CVSweb