Annotation of mandoc/argv.c, Revision 1.14
1.14 ! kristaps 1: /* $Id: argv.c,v 1.13 2009/01/15 15:46:45 kristaps Exp $ */
1.1 kristaps 2: /*
3: * Copyright (c) 2008 Kristaps Dzonsons <kristaps@kth.se>
4: *
5: * Permission to use, copy, modify, and distribute this software for any
6: * purpose with or without fee is hereby granted, provided that the
7: * above copyright notice and this permission notice appear in all
8: * copies.
9: *
10: * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL
11: * WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED
12: * WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE
13: * AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL
14: * DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR
15: * PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER
16: * TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
17: * PERFORMANCE OF THIS SOFTWARE.
18: */
19: #include <assert.h>
20: #include <ctype.h>
21: #include <err.h>
22: #include <stdlib.h>
23: #include <stdio.h>
24: #include <string.h>
25:
26: #include "private.h"
27:
28:
/* Forward declarations of the file-local helpers defined further down. */
static	int	 lookup(int tok, const char *argv);
static	int	 parse(struct mdoc *mdoc, int line, int tok,
			struct mdoc_arg *v, int *pos, char *buf);
static	int	 parse_single(struct mdoc *mdoc, int line,
			struct mdoc_arg *v, int *pos, char *buf);
static	int	 parse_multi(struct mdoc *mdoc, int line,
			struct mdoc_arg *v, int *pos, char *buf);
static	int	 postparse(struct mdoc *mdoc, int line,
			const struct mdoc_arg *v, int pos);
1.1 kristaps 38:
39:
1.2 kristaps 40: int
1.9 kristaps 41: mdoc_args(struct mdoc *mdoc, int line, int *pos, char *buf, int fl, char **v)
1.1 kristaps 42: {
1.2 kristaps 43: int i;
1.1 kristaps 44:
45: if (0 == buf[*pos])
1.2 kristaps 46: return(ARGS_EOLN);
47:
48: if ('\"' == buf[*pos] && ! (fl & ARGS_QUOTED))
1.14 ! kristaps 49: if ( ! mdoc_pwarn(mdoc, line, *pos, WARN_SYNTAX, "unexpected quoted parameter"))
1.2 kristaps 50: return(ARGS_ERROR);
51:
52: if ('-' == buf[*pos])
1.14 ! kristaps 53: if ( ! mdoc_pwarn(mdoc, line, *pos, WARN_SYNTAX, "argument-like parameter"))
1.2 kristaps 54: return(ARGS_ERROR);
55:
56: if ((fl & ARGS_DELIM) && mdoc_iscdelim(buf[*pos])) {
1.12 kristaps 57: /*
58: * If ARGS_DELIM, return ARGS_PUNCT if only space-separated
59: * punctuation remains.
60: */
1.2 kristaps 61: for (i = *pos; buf[i]; ) {
62: if ( ! mdoc_iscdelim(buf[i]))
63: break;
64: i++;
65: if (0 == buf[i] || ! isspace(buf[i]))
66: break;
67: i++;
68: while (buf[i] && isspace(buf[i]))
69: i++;
70: }
71: if (0 == buf[i]) {
72: *v = &buf[*pos];
73: return(ARGS_PUNCT);
74: }
75: }
76:
1.12 kristaps 77: /* Parse routine for non-quoted string. */
1.1 kristaps 78:
79: if ('\"' != buf[*pos]) {
80: *v = &buf[*pos];
81:
1.12 kristaps 82: /* FIXME: UGLY tab-sep processing. */
83:
84: if (ARGS_TABSEP & fl)
85: while (buf[*pos]) {
86: if ('\t' == buf[*pos])
87: break;
88: if ('T' == buf[*pos]) {
89: (*pos)++;
90: if (0 == buf[*pos])
91: break;
92: if ('a' == buf[*pos]) {
93: buf[*pos - 1] = 0;
94: break;
95: }
96: }
97: (*pos)++;
98: }
99: else
100: while (buf[*pos] && ! isspace(buf[*pos]))
101: (*pos)++;
1.1 kristaps 102:
103: if (0 == buf[*pos])
1.2 kristaps 104: return(ARGS_WORD);
1.1 kristaps 105:
106: buf[(*pos)++] = 0;
1.12 kristaps 107:
1.1 kristaps 108: if (0 == buf[*pos])
1.2 kristaps 109: return(ARGS_WORD);
1.1 kristaps 110:
1.12 kristaps 111: if ( ! (ARGS_TABSEP & fl))
112: while (buf[*pos] && isspace(buf[*pos]))
113: (*pos)++;
1.1 kristaps 114:
115: if (buf[*pos])
1.2 kristaps 116: return(ARGS_WORD);
1.1 kristaps 117:
1.14 ! kristaps 118: if ( ! mdoc_pwarn(mdoc, line, *pos, WARN_COMPAT, "whitespace at end-of-line"))
1.2 kristaps 119: return(ARGS_ERROR);
1.1 kristaps 120:
1.2 kristaps 121: return(ARGS_WORD);
122: }
123:
124: /*
125: * If we're a quoted string (and quoted strings are allowed),
126: * then parse ahead to the next quote. If none's found, it's an
1.4 kristaps 127: * error. After, parse to the next word.
1.2 kristaps 128: */
1.1 kristaps 129:
130: *v = &buf[++(*pos)];
131:
132: while (buf[*pos] && '\"' != buf[*pos])
133: (*pos)++;
134:
135: if (0 == buf[*pos]) {
1.14 ! kristaps 136: (void)mdoc_perr(mdoc, line, *pos, "unterminated quoted parameter");
1.2 kristaps 137: return(ARGS_ERROR);
1.1 kristaps 138: }
139:
140: buf[(*pos)++] = 0;
141: if (0 == buf[*pos])
1.2 kristaps 142: return(ARGS_WORD);
1.1 kristaps 143:
144: while (buf[*pos] && isspace(buf[*pos]))
145: (*pos)++;
146:
147: if (buf[*pos])
1.2 kristaps 148: return(ARGS_WORD);
1.1 kristaps 149:
1.14 ! kristaps 150: if ( ! mdoc_pwarn(mdoc, line, *pos, WARN_COMPAT, "whitespace at end-of-line"))
1.2 kristaps 151: return(ARGS_ERROR);
152:
153: return(ARGS_WORD);
1.1 kristaps 154: }
155:
156:
1.2 kristaps 157: static int
158: lookup(int tok, const char *argv)
1.1 kristaps 159: {
160:
161: switch (tok) {
1.6 kristaps 162: case (MDOC_An):
163: if (xstrcmp(argv, "split"))
164: return(MDOC_Split);
165: else if (xstrcmp(argv, "nosplit"))
166: return(MDOC_Nosplit);
167: break;
168:
1.2 kristaps 169: case (MDOC_Bd):
1.1 kristaps 170: if (xstrcmp(argv, "ragged"))
171: return(MDOC_Ragged);
172: else if (xstrcmp(argv, "unfilled"))
173: return(MDOC_Unfilled);
1.13 kristaps 174: else if (xstrcmp(argv, "filled"))
175: return(MDOC_Filled);
1.1 kristaps 176: else if (xstrcmp(argv, "literal"))
177: return(MDOC_Literal);
178: else if (xstrcmp(argv, "file"))
179: return(MDOC_File);
180: else if (xstrcmp(argv, "offset"))
181: return(MDOC_Offset);
1.2 kristaps 182: break;
183:
1.8 kristaps 184: case (MDOC_Bf):
185: if (xstrcmp(argv, "emphasis"))
186: return(MDOC_Emphasis);
187: else if (xstrcmp(argv, "literal"))
188: return(MDOC_Literal);
189: else if (xstrcmp(argv, "symbolic"))
190: return(MDOC_Symbolic);
191: break;
192:
1.7 kristaps 193: case (MDOC_Bk):
194: if (xstrcmp(argv, "words"))
195: return(MDOC_Words);
196: break;
197:
1.2 kristaps 198: case (MDOC_Bl):
199: if (xstrcmp(argv, "bullet"))
1.1 kristaps 200: return(MDOC_Bullet);
201: else if (xstrcmp(argv, "dash"))
202: return(MDOC_Dash);
203: else if (xstrcmp(argv, "hyphen"))
204: return(MDOC_Hyphen);
205: else if (xstrcmp(argv, "item"))
206: return(MDOC_Item);
207: else if (xstrcmp(argv, "enum"))
208: return(MDOC_Enum);
209: else if (xstrcmp(argv, "tag"))
210: return(MDOC_Tag);
211: else if (xstrcmp(argv, "diag"))
212: return(MDOC_Diag);
213: else if (xstrcmp(argv, "hang"))
214: return(MDOC_Hang);
215: else if (xstrcmp(argv, "ohang"))
216: return(MDOC_Ohang);
217: else if (xstrcmp(argv, "inset"))
218: return(MDOC_Inset);
219: else if (xstrcmp(argv, "column"))
220: return(MDOC_Column);
221: else if (xstrcmp(argv, "width"))
222: return(MDOC_Width);
1.2 kristaps 223: else if (xstrcmp(argv, "offset"))
224: return(MDOC_Offset);
1.1 kristaps 225: else if (xstrcmp(argv, "compact"))
226: return(MDOC_Compact);
1.2 kristaps 227: break;
1.3 kristaps 228:
229: case (MDOC_Rv):
230: /* FALLTHROUGH */
231: case (MDOC_Ex):
232: if (xstrcmp(argv, "std"))
233: return(MDOC_Std);
234: break;
1.5 kristaps 235:
236: case (MDOC_St):
237: if (xstrcmp(argv, "p1003.1-88"))
238: return(MDOC_p1003_1_88);
239: else if (xstrcmp(argv, "p1003.1-90"))
240: return(MDOC_p1003_1_90);
241: else if (xstrcmp(argv, "p1003.1-96"))
242: return(MDOC_p1003_1_96);
243: else if (xstrcmp(argv, "p1003.1-2001"))
244: return(MDOC_p1003_1_2001);
245: else if (xstrcmp(argv, "p1003.1-2004"))
246: return(MDOC_p1003_1_2004);
247: else if (xstrcmp(argv, "p1003.1"))
248: return(MDOC_p1003_1);
249: else if (xstrcmp(argv, "p1003.1b"))
250: return(MDOC_p1003_1b);
251: else if (xstrcmp(argv, "p1003.1b-93"))
252: return(MDOC_p1003_1b_93);
253: else if (xstrcmp(argv, "p1003.1c-95"))
254: return(MDOC_p1003_1c_95);
255: else if (xstrcmp(argv, "p1003.1g-2000"))
256: return(MDOC_p1003_1g_2000);
257: else if (xstrcmp(argv, "p1003.2-92"))
258: return(MDOC_p1003_2_92);
259: else if (xstrcmp(argv, "p1003.2-95"))
260: return(MDOC_p1387_2_95);
261: else if (xstrcmp(argv, "p1003.2"))
262: return(MDOC_p1003_2);
263: else if (xstrcmp(argv, "p1387.2-95"))
264: return(MDOC_p1387_2);
265: else if (xstrcmp(argv, "isoC-90"))
266: return(MDOC_isoC_90);
267: else if (xstrcmp(argv, "isoC-amd1"))
268: return(MDOC_isoC_amd1);
269: else if (xstrcmp(argv, "isoC-tcor1"))
270: return(MDOC_isoC_tcor1);
271: else if (xstrcmp(argv, "isoC-tcor2"))
272: return(MDOC_isoC_tcor2);
273: else if (xstrcmp(argv, "isoC-99"))
274: return(MDOC_isoC_99);
275: else if (xstrcmp(argv, "ansiC"))
276: return(MDOC_ansiC);
277: else if (xstrcmp(argv, "ansiC-89"))
278: return(MDOC_ansiC_89);
279: else if (xstrcmp(argv, "ansiC-99"))
280: return(MDOC_ansiC_99);
281: else if (xstrcmp(argv, "ieee754"))
282: return(MDOC_ieee754);
283: else if (xstrcmp(argv, "iso8802-3"))
284: return(MDOC_iso8802_3);
285: else if (xstrcmp(argv, "xpg3"))
286: return(MDOC_xpg3);
287: else if (xstrcmp(argv, "xpg4"))
288: return(MDOC_xpg4);
289: else if (xstrcmp(argv, "xpg4.2"))
290: return(MDOC_xpg4_2);
291: else if (xstrcmp(argv, "xpg4.3"))
292: return(MDOC_xpg4_3);
293: else if (xstrcmp(argv, "xbd5"))
294: return(MDOC_xbd5);
295: else if (xstrcmp(argv, "xcu5"))
296: return(MDOC_xcu5);
297: else if (xstrcmp(argv, "xsh5"))
298: return(MDOC_xsh5);
299: else if (xstrcmp(argv, "xns5"))
300: return(MDOC_xns5);
301: else if (xstrcmp(argv, "xns5.2d2.0"))
302: return(MDOC_xns5_2d2_0);
303: else if (xstrcmp(argv, "xcurses4.2"))
304: return(MDOC_xcurses4_2);
305: else if (xstrcmp(argv, "susv2"))
306: return(MDOC_susv2);
307: else if (xstrcmp(argv, "susv3"))
308: return(MDOC_susv3);
309: else if (xstrcmp(argv, "svid4"))
310: return(MDOC_svid4);
311: break;
1.1 kristaps 312:
313: default:
1.8 kristaps 314: break;
1.1 kristaps 315: }
316:
317: return(MDOC_ARG_MAX);
318: }
319:
320:
1.2 kristaps 321: static int
1.9 kristaps 322: postparse(struct mdoc *mdoc, int line, const struct mdoc_arg *v, int pos)
1.2 kristaps 323: {
324:
325: switch (v->arg) {
326: case (MDOC_Offset):
327: assert(v->value);
328: assert(v->value[0]);
329: if (xstrcmp(v->value[0], "left"))
330: break;
331: if (xstrcmp(v->value[0], "right"))
332: break;
333: if (xstrcmp(v->value[0], "center"))
334: break;
335: if (xstrcmp(v->value[0], "indent"))
336: break;
337: if (xstrcmp(v->value[0], "indent-two"))
338: break;
1.14 ! kristaps 339: return(mdoc_perr(mdoc, line, pos, "invalid offset value"));
1.2 kristaps 340: default:
341: break;
342: }
343:
344: return(1);
345: }
346:
347:
348: static int
1.12 kristaps 349: parse_multi(struct mdoc *mdoc, int line,
350: struct mdoc_arg *v, int *pos, char *buf)
351: {
352: int c, ppos;
353: char *p;
354:
355: v->sz = 0;
356: v->value = xcalloc(MDOC_LINEARG_MAX, sizeof(char *));
357:
358: ppos = *pos;
359:
360: for (v->sz = 0; v->sz < MDOC_LINEARG_MAX; v->sz++) {
361: if ('-' == buf[*pos])
362: break;
363: c = mdoc_args(mdoc, line, pos, buf, ARGS_QUOTED, &p);
364: if (ARGS_ERROR == c) {
365: free(v->value);
366: return(0);
367: } else if (ARGS_EOLN == c)
368: break;
369: v->value[v->sz] = p;
370: }
371:
372: if (0 < v->sz && v->sz < MDOC_LINEARG_MAX)
373: return(1);
374:
375: free(v->value);
1.14 ! kristaps 376: return(mdoc_perr(mdoc, line, ppos, 0 == v->sz ?
! 377: "argument requires a value" :
! 378: "too many values to argument"));
1.12 kristaps 379: }
380:
381:
382: static int
383: parse_single(struct mdoc *mdoc, int line,
1.1 kristaps 384: struct mdoc_arg *v, int *pos, char *buf)
385: {
1.12 kristaps 386: int c, ppos;
1.1 kristaps 387: char *p;
388:
389: ppos = *pos;
390:
1.12 kristaps 391: c = mdoc_args(mdoc, line, pos, buf, ARGS_QUOTED, &p);
392: if (ARGS_ERROR == c)
393: return(0);
394: if (ARGS_EOLN == c)
1.14 ! kristaps 395: return(mdoc_perr(mdoc, line, ppos, "argument requires a value"));
1.12 kristaps 396:
397: v->sz = 1;
398: v->value = xcalloc(1, sizeof(char *));
399: v->value[0] = p;
400: return(1);
401: }
402:
403:
404: static int
405: parse(struct mdoc *mdoc, int line, int tok,
406: struct mdoc_arg *v, int *pos, char *buf)
407: {
408:
409: v->sz = 0;
410: v->value = NULL;
411:
1.2 kristaps 412: switch (v->arg) {
1.3 kristaps 413: case(MDOC_Std):
414: /* FALLTHROUGH */
1.1 kristaps 415: case(MDOC_Width):
416: /* FALLTHROUGH */
417: case(MDOC_Offset):
1.12 kristaps 418: return(parse_single(mdoc, line, v, pos, buf));
1.1 kristaps 419: case(MDOC_Column):
1.12 kristaps 420: return(parse_multi(mdoc, line, v, pos, buf));
1.1 kristaps 421: default:
1.6 kristaps 422: break;
1.1 kristaps 423: }
424:
425: return(1);
426: }
427:
428:
1.2 kristaps 429: int
1.9 kristaps 430: mdoc_argv(struct mdoc *mdoc, int line, int tok,
1.2 kristaps 431: struct mdoc_arg *v, int *pos, char *buf)
432: {
433: int i, ppos;
434: char *argv;
435:
436: (void)memset(v, 0, sizeof(struct mdoc_arg));
437:
438: if (0 == buf[*pos])
1.5 kristaps 439: return(ARGV_EOLN);
1.2 kristaps 440:
441: assert( ! isspace(buf[*pos]));
442:
1.5 kristaps 443: if ('-' != buf[*pos])
444: return(ARGV_WORD);
1.2 kristaps 445:
446: i = *pos;
447: argv = &buf[++(*pos)];
448:
1.11 kristaps 449: v->line = line;
450: v->pos = *pos;
451:
1.2 kristaps 452: while (buf[*pos] && ! isspace(buf[*pos]))
453: (*pos)++;
454:
455: if (buf[*pos])
456: buf[(*pos)++] = 0;
457:
458: if (MDOC_ARG_MAX == (v->arg = lookup(tok, argv))) {
1.14 ! kristaps 459: if ( ! mdoc_pwarn(mdoc, line, i, WARN_SYNTAX, "argument-like parameter"))
! 460: return(ARGV_ERROR);
1.10 kristaps 461: return(ARGV_WORD);
1.2 kristaps 462: }
463:
464: while (buf[*pos] && isspace(buf[*pos]))
465: (*pos)++;
466:
467: /* FIXME: whitespace if no value. */
468:
469: ppos = *pos;
1.9 kristaps 470: if ( ! parse(mdoc, line, tok, v, pos, buf))
1.5 kristaps 471: return(ARGV_ERROR);
1.9 kristaps 472: if ( ! postparse(mdoc, line, v, ppos))
1.5 kristaps 473: return(ARGV_ERROR);
1.2 kristaps 474:
1.5 kristaps 475: return(ARGV_ARG);
1.2 kristaps 476: }
477:
478:
1.1 kristaps 479: void
480: mdoc_argv_free(int sz, struct mdoc_arg *arg)
481: {
482: int i;
483:
484: for (i = 0; i < sz; i++) {
485: if (0 == arg[i].sz) {
486: assert(NULL == arg[i].value);
487: continue;
488: }
489: assert(arg[i].value);
490: free(arg[i].value);
491: }
492: }
1.2 kristaps 493:
CVSweb