Annotation of mandoc/man_macro.c, Revision 1.137
1.137 ! schwarze 1: /* $Id: man_macro.c,v 1.136 2018/12/14 06:33:14 schwarze Exp $ */
1.1 kristaps 2: /*
1.65 schwarze 3: * Copyright (c) 2008, 2009, 2010, 2011 Kristaps Dzonsons <kristaps@bsd.lv>
1.124 schwarze 4: * Copyright (c) 2012-2015, 2017, 2018 Ingo Schwarze <schwarze@openbsd.org>
1.79 schwarze 5: * Copyright (c) 2013 Franco Fichtner <franco@lastsummer.de>
1.1 kristaps 6: *
7: * Permission to use, copy, modify, and distribute this software for any
1.14 kristaps 8: * purpose with or without fee is hereby granted, provided that the above
9: * copyright notice and this permission notice appear in all copies.
1.1 kristaps 10: *
1.101 schwarze 11: * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHORS DISCLAIM ALL WARRANTIES
1.14 kristaps 12: * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
1.101 schwarze 13: * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR
1.14 kristaps 14: * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
15: * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
16: * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
17: * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
1.1 kristaps 18: */
1.30 kristaps 19: #include "config.h"
1.88 schwarze 20:
21: #include <sys/types.h>
1.30 kristaps 22:
1.1 kristaps 23: #include <assert.h>
24: #include <ctype.h>
1.134 schwarze 25: #include <stdio.h>
1.1 kristaps 26: #include <stdlib.h>
27: #include <string.h>
28:
1.101 schwarze 29: #include "mandoc.h"
30: #include "roff.h"
1.58 kristaps 31: #include "man.h"
1.57 kristaps 32: #include "libmandoc.h"
1.106 schwarze 33: #include "roff_int.h"
1.1 kristaps 34: #include "libman.h"
35:
/*
 * Forward declarations.
 * The first four are the macro handlers referenced from man_macros[];
 * the last two are helpers shared by those handlers.
 */
static void	 blk_close(MACRO_PROT_ARGS);
static void	 blk_exp(MACRO_PROT_ARGS);
static void	 blk_imp(MACRO_PROT_ARGS);
static void	 in_line_eoln(MACRO_PROT_ARGS);

static int	 man_args(struct roff_man *man, int line,
			int *pos, char *buf, char **v);
static void	 rew_scope(struct roff_man *man, enum roff_tok tok);
1.19 kristaps 43:
1.127 schwarze 44: static const struct man_macro man_macros[MAN_MAX - MAN_TH] = {
1.133 schwarze 45: { in_line_eoln, MAN_XSCOPE }, /* TH */
46: { blk_imp, MAN_XSCOPE | MAN_BSCOPED }, /* SH */
47: { blk_imp, MAN_XSCOPE | MAN_BSCOPED }, /* SS */
48: { blk_imp, MAN_XSCOPE | MAN_BSCOPED }, /* TP */
49: { blk_imp, MAN_XSCOPE | MAN_BSCOPED }, /* TQ */
50: { blk_imp, MAN_XSCOPE }, /* LP */
51: { blk_imp, MAN_XSCOPE }, /* PP */
52: { blk_imp, MAN_XSCOPE }, /* P */
53: { blk_imp, MAN_XSCOPE }, /* IP */
54: { blk_imp, MAN_XSCOPE }, /* HP */
55: { in_line_eoln, MAN_NSCOPED | MAN_ESCOPED | MAN_JOIN }, /* SM */
56: { in_line_eoln, MAN_NSCOPED | MAN_ESCOPED | MAN_JOIN }, /* SB */
1.19 kristaps 57: { in_line_eoln, 0 }, /* BI */
58: { in_line_eoln, 0 }, /* IB */
59: { in_line_eoln, 0 }, /* BR */
60: { in_line_eoln, 0 }, /* RB */
1.133 schwarze 61: { in_line_eoln, MAN_NSCOPED | MAN_ESCOPED | MAN_JOIN }, /* R */
62: { in_line_eoln, MAN_NSCOPED | MAN_ESCOPED | MAN_JOIN }, /* B */
63: { in_line_eoln, MAN_NSCOPED | MAN_ESCOPED | MAN_JOIN }, /* I */
1.19 kristaps 64: { in_line_eoln, 0 }, /* IR */
65: { in_line_eoln, 0 }, /* RI */
1.110 schwarze 66: { in_line_eoln, MAN_NSCOPED }, /* nf */
67: { in_line_eoln, MAN_NSCOPED }, /* fi */
1.133 schwarze 68: { blk_close, MAN_XSCOPE }, /* RE */
69: { blk_exp, MAN_XSCOPE }, /* RS */
1.23 kristaps 70: { in_line_eoln, 0 }, /* DT */
1.28 kristaps 71: { in_line_eoln, 0 }, /* UC */
1.100 schwarze 72: { in_line_eoln, MAN_NSCOPED }, /* PD */
1.45 joerg 73: { in_line_eoln, 0 }, /* AT */
1.122 schwarze 74: { in_line_eoln, MAN_NSCOPED }, /* in */
1.133 schwarze 75: { blk_imp, MAN_XSCOPE }, /* SY */
76: { blk_close, MAN_XSCOPE }, /* YS */
1.71 kristaps 77: { in_line_eoln, 0 }, /* OP */
1.133 schwarze 78: { in_line_eoln, MAN_XSCOPE }, /* EX */
79: { in_line_eoln, MAN_XSCOPE }, /* EE */
80: { blk_exp, MAN_XSCOPE }, /* UR */
81: { blk_close, MAN_XSCOPE }, /* UE */
82: { blk_exp, MAN_XSCOPE }, /* MT */
83: { blk_close, MAN_XSCOPE }, /* ME */
1.19 kristaps 84: };
1.1 kristaps 85:
86:
1.127 schwarze 87: const struct man_macro *
88: man_macro(enum roff_tok tok)
89: {
90: assert(tok >= MAN_TH && tok <= MAN_MAX);
91: return man_macros + (tok - MAN_TH);
92: }
93:
1.91 schwarze 94: void
1.105 schwarze 95: man_unscope(struct roff_man *man, const struct roff_node *to)
1.1 kristaps 96: {
1.102 schwarze 97: struct roff_node *n;
1.1 kristaps 98:
1.83 schwarze 99: to = to->parent;
100: n = man->last;
101: while (n != to) {
1.87 schwarze 102:
103: /* Reached the end of the document? */
104:
1.115 schwarze 105: if (to == NULL && ! (n->flags & NODE_VALID)) {
1.87 schwarze 106: if (man->flags & (MAN_BLINE | MAN_ELINE) &&
1.133 schwarze 107: man_macro(n->tok)->flags &
108: (MAN_BSCOPED | MAN_NSCOPED)) {
1.135 schwarze 109: mandoc_msg(MANDOCERR_BLK_LINE,
110: n->line, n->pos,
1.116 schwarze 111: "EOF breaks %s", roff_name[n->tok]);
1.87 schwarze 112: if (man->flags & MAN_ELINE)
113: man->flags &= ~MAN_ELINE;
114: else {
1.101 schwarze 115: assert(n->type == ROFFT_HEAD);
1.87 schwarze 116: n = n->parent;
117: man->flags &= ~MAN_BLINE;
118: }
119: man->last = n;
120: n = n->parent;
1.106 schwarze 121: roff_node_delete(man, man->last);
1.87 schwarze 122: continue;
123: }
1.101 schwarze 124: if (n->type == ROFFT_BLOCK &&
1.127 schwarze 125: man_macro(n->tok)->fp == blk_exp)
1.87 schwarze 126: mandoc_msg(MANDOCERR_BLK_NOEND,
1.135 schwarze 127: n->line, n->pos, "%s",
1.116 schwarze 128: roff_name[n->tok]);
1.87 schwarze 129: }
130:
1.55 kristaps 131: /*
1.83 schwarze 132: * We might delete the man->last node
133: * in the post-validation phase.
134: * Save a pointer to the parent such that
135: * we know where to continue the iteration.
1.55 kristaps 136: */
1.89 schwarze 137:
1.83 schwarze 138: man->last = n;
139: n = n->parent;
1.115 schwarze 140: man->last->flags |= NODE_VALID;
1.19 kristaps 141: }
1.89 schwarze 142:
143: /*
144: * If we ended up at the parent of the node we were
145: * supposed to rewind to, that means the target node
146: * got deleted, so add the next node we parse as a child
147: * of the parent instead of as a sibling of the target.
148: */
149:
150: man->next = (man->last == to) ?
1.105 schwarze 151: ROFF_NEXT_CHILD : ROFF_NEXT_SIBLING;
1.19 kristaps 152: }
1.1 kristaps 153:
1.19 kristaps 154: /*
155: * Rewinding entails ascending the parse tree until a coherent point,
156: * for example, the `SH' macro will close out any intervening `SS'
157: * scopes. When a scope is closed, it must be validated and actioned.
158: */
1.91 schwarze 159: static void
1.116 schwarze 160: rew_scope(struct roff_man *man, enum roff_tok tok)
1.19 kristaps 161: {
1.102 schwarze 162: struct roff_node *n;
1.7 kristaps 163:
1.104 schwarze 164: /* Preserve empty paragraphs before RS. */
165:
166: n = man->last;
1.114 schwarze 167: if (tok == MAN_RS && n->child == NULL &&
1.104 schwarze 168: (n->tok == MAN_P || n->tok == MAN_PP || n->tok == MAN_LP))
169: return;
170:
171: for (;;) {
172: if (n->type == ROFFT_ROOT)
173: return;
1.115 schwarze 174: if (n->flags & NODE_VALID) {
1.104 schwarze 175: n = n->parent;
176: continue;
177: }
178: if (n->type != ROFFT_BLOCK) {
179: if (n->parent->type == ROFFT_ROOT) {
180: man_unscope(man, n);
181: return;
182: } else {
183: n = n->parent;
184: continue;
185: }
186: }
187: if (tok != MAN_SH && (n->tok == MAN_SH ||
188: (tok != MAN_SS && (n->tok == MAN_SS ||
1.127 schwarze 189: man_macro(n->tok)->fp == blk_exp))))
1.91 schwarze 190: return;
1.104 schwarze 191: man_unscope(man, n);
192: n = man->last;
1.6 kristaps 193: }
1.19 kristaps 194: }
195:
1.6 kristaps 196:
1.36 kristaps 197: /*
198: * Close out a generic explicit macro.
199: */
1.91 schwarze 200: void
1.21 kristaps 201: blk_close(MACRO_PROT_ARGS)
202: {
1.124 schwarze 203: enum roff_tok ctok, ntok;
1.102 schwarze 204: const struct roff_node *nn;
1.137 ! schwarze 205: char *p, *ep;
! 206: int cline, cpos, la, nrew, target;
1.21 kristaps 207:
1.93 schwarze 208: nrew = 1;
1.21 kristaps 209: switch (tok) {
1.82 schwarze 210: case MAN_RE:
1.21 kristaps 211: ntok = MAN_RS;
1.137 ! schwarze 212: la = *pos;
1.93 schwarze 213: if ( ! man_args(man, line, pos, buf, &p))
214: break;
215: for (nn = man->last->parent; nn; nn = nn->parent)
1.101 schwarze 216: if (nn->tok == ntok && nn->type == ROFFT_BLOCK)
1.93 schwarze 217: nrew++;
1.137 ! schwarze 218: target = strtol(p, &ep, 10);
! 219: if (*ep != '\0')
1.135 schwarze 220: mandoc_msg(MANDOCERR_ARG_EXCESS, line,
1.137 ! schwarze 221: la + (buf[la] == '"') + (int)(ep - p),
! 222: "RE ... %s", ep);
! 223: free(p);
1.93 schwarze 224: if (target == 0)
225: target = 1;
226: nrew -= target;
227: if (nrew < 1) {
1.135 schwarze 228: mandoc_msg(MANDOCERR_RE_NOTOPEN,
1.93 schwarze 229: line, ppos, "RE %d", target);
230: return;
231: }
1.128 schwarze 232: break;
233: case MAN_YS:
234: ntok = MAN_SY;
1.76 schwarze 235: break;
1.82 schwarze 236: case MAN_UE:
1.76 schwarze 237: ntok = MAN_UR;
1.123 schwarze 238: break;
239: case MAN_ME:
240: ntok = MAN_MT;
1.21 kristaps 241: break;
242: default:
243: abort();
244: }
245:
1.75 schwarze 246: for (nn = man->last->parent; nn; nn = nn->parent)
1.101 schwarze 247: if (nn->tok == ntok && nn->type == ROFFT_BLOCK && ! --nrew)
1.21 kristaps 248: break;
249:
1.91 schwarze 250: if (nn == NULL) {
1.135 schwarze 251: mandoc_msg(MANDOCERR_BLK_NOTOPEN,
252: line, ppos, "%s", roff_name[tok]);
1.104 schwarze 253: rew_scope(man, MAN_PP);
1.131 schwarze 254: if (tok == MAN_RE) {
255: roff_elem_alloc(man, line, ppos, ROFF_br);
256: man->last->flags |= NODE_LINE |
257: NODE_VALID | NODE_ENDED;
258: man->next = ROFF_NEXT_SIBLING;
259: }
1.124 schwarze 260: return;
261: }
262:
263: cline = man->last->line;
264: cpos = man->last->pos;
265: ctok = man->last->tok;
266: man_unscope(man, nn);
267:
268: if (tok == MAN_RE && nn->head->aux > 0)
269: roff_setreg(man->roff, "an-margin", nn->head->aux, '-');
270:
271: /* Trailing text. */
272:
273: if (buf[*pos] != '\0') {
274: roff_word_alloc(man, line, ppos, buf + *pos);
275: man->last->flags |= NODE_DELIMC;
1.130 schwarze 276: if (mandoc_eos(man->last->string, strlen(man->last->string)))
277: man->last->flags |= NODE_EOS;
1.124 schwarze 278: }
279:
280: /* Move a trailing paragraph behind the block. */
281:
282: if (ctok == MAN_LP || ctok == MAN_PP || ctok == MAN_P) {
283: *pos = strlen(buf);
1.125 schwarze 284: blk_imp(man, ctok, cline, cpos, pos, buf);
1.129 schwarze 285: }
286:
287: /* Synopsis blocks need an explicit end marker for spacing. */
288:
289: if (tok == MAN_YS && man->last == nn) {
290: roff_elem_alloc(man, line, ppos, tok);
291: man_unscope(man, man->last);
1.95 schwarze 292: }
1.21 kristaps 293: }
294:
1.91 schwarze 295: void
1.35 kristaps 296: blk_exp(MACRO_PROT_ARGS)
297: {
1.102 schwarze 298: struct roff_node *head;
1.98 schwarze 299: char *p;
1.59 kristaps 300: int la;
1.35 kristaps 301:
1.132 schwarze 302: if (tok == MAN_RS)
303: rew_scope(man, tok);
1.108 schwarze 304: roff_block_alloc(man, line, ppos, tok);
1.106 schwarze 305: head = roff_head_alloc(man, line, ppos, tok);
1.35 kristaps 306:
1.98 schwarze 307: la = *pos;
1.121 schwarze 308: if (man_args(man, line, pos, buf, &p)) {
1.107 schwarze 309: roff_word_alloc(man, line, la, p);
1.121 schwarze 310: if (tok == MAN_RS) {
311: if (roff_getreg(man->roff, "an-margin") == 0)
312: roff_setreg(man->roff, "an-margin",
313: 7 * 24, '=');
314: if ((head->aux = strtod(p, NULL) * 24.0) > 0)
315: roff_setreg(man->roff, "an-margin",
316: head->aux, '+');
317: }
1.137 ! schwarze 318: free(p);
1.121 schwarze 319: }
1.35 kristaps 320:
1.98 schwarze 321: if (buf[*pos] != '\0')
1.135 schwarze 322: mandoc_msg(MANDOCERR_ARG_EXCESS, line, *pos,
323: "%s ... %s", roff_name[tok], buf + *pos);
1.73 schwarze 324:
1.98 schwarze 325: man_unscope(man, head);
1.106 schwarze 326: roff_body_alloc(man, line, ppos, tok);
1.35 kristaps 327: }
328:
1.19 kristaps 329: /*
1.101 schwarze 330: * Parse an implicit-block macro. These contain a ROFFT_HEAD and a
331: * ROFFT_BODY contained within a ROFFT_BLOCK. Rules for closing out other
1.19 kristaps 332: * scopes, such as `SH' closing out an `SS', are defined in the rew
333: * routines.
334: */
1.91 schwarze 335: void
1.19 kristaps 336: blk_imp(MACRO_PROT_ARGS)
337: {
1.59 kristaps 338: int la;
1.19 kristaps 339: char *p;
1.102 schwarze 340: struct roff_node *n;
1.19 kristaps 341:
1.104 schwarze 342: rew_scope(man, tok);
1.108 schwarze 343: n = roff_block_alloc(man, line, ppos, tok);
1.106 schwarze 344: if (n->tok == MAN_SH || n->tok == MAN_SS)
345: man->flags &= ~MAN_LITERAL;
346: n = roff_head_alloc(man, line, ppos, tok);
1.25 kristaps 347:
1.19 kristaps 348: /* Add line arguments. */
1.3 kristaps 349:
1.19 kristaps 350: for (;;) {
351: la = *pos;
1.75 schwarze 352: if ( ! man_args(man, line, pos, buf, &p))
1.19 kristaps 353: break;
1.107 schwarze 354: roff_word_alloc(man, line, la, p);
1.137 ! schwarze 355: free(p);
1.6 kristaps 356: }
357:
1.99 schwarze 358: /*
359: * For macros having optional next-line scope,
360: * keep the head open if there were no arguments.
1.133 schwarze 361: * For `TP' and `TQ', always keep the head open.
1.99 schwarze 362: */
1.19 kristaps 363:
1.133 schwarze 364: if (man_macro(tok)->flags & MAN_BSCOPED &&
1.126 schwarze 365: (tok == MAN_TP || tok == MAN_TQ || n == man->last)) {
1.99 schwarze 366: man->flags |= MAN_BLINE;
367: return;
1.27 kristaps 368: }
1.99 schwarze 369:
370: /* Close out the head and open the body. */
371:
1.103 schwarze 372: man_unscope(man, n);
1.106 schwarze 373: roff_body_alloc(man, line, ppos, tok);
1.4 kristaps 374: }
375:
1.91 schwarze 376: void
1.19 kristaps 377: in_line_eoln(MACRO_PROT_ARGS)
1.3 kristaps 378: {
1.59 kristaps 379: int la;
1.19 kristaps 380: char *p;
1.102 schwarze 381: struct roff_node *n;
1.3 kristaps 382:
1.108 schwarze 383: roff_elem_alloc(man, line, ppos, tok);
1.75 schwarze 384: n = man->last;
1.3 kristaps 385:
1.19 kristaps 386: for (;;) {
1.117 schwarze 387: if (buf[*pos] != '\0' && (tok == MAN_fi || tok == MAN_nf)) {
1.135 schwarze 388: mandoc_msg(MANDOCERR_ARG_SKIP, line, *pos,
389: "%s %s", roff_name[tok], buf + *pos);
1.97 schwarze 390: break;
391: }
1.120 schwarze 392: if (buf[*pos] != '\0' && man->last != n && tok == MAN_PD) {
1.135 schwarze 393: mandoc_msg(MANDOCERR_ARG_EXCESS, line, *pos,
394: "%s ... %s", roff_name[tok], buf + *pos);
1.96 schwarze 395: break;
396: }
1.19 kristaps 397: la = *pos;
1.75 schwarze 398: if ( ! man_args(man, line, pos, buf, &p))
1.19 kristaps 399: break;
1.127 schwarze 400: if (man_macro(tok)->flags & MAN_JOIN &&
1.101 schwarze 401: man->last->type == ROFFT_TEXT)
1.107 schwarze 402: roff_word_append(man, p);
1.91 schwarze 403: else
1.107 schwarze 404: roff_word_alloc(man, line, la, p);
1.137 ! schwarze 405: free(p);
1.19 kristaps 406: }
1.78 schwarze 407:
408: /*
1.115 schwarze 409: * Append NODE_EOS in case the last snipped argument
1.78 schwarze 410: * ends with a dot, e.g. `.IR syslog (3).'
411: */
412:
413: if (n != man->last &&
1.80 schwarze 414: mandoc_eos(man->last->string, strlen(man->last->string)))
1.115 schwarze 415: man->last->flags |= NODE_EOS;
1.3 kristaps 416:
1.31 kristaps 417: /*
1.133 schwarze 418: * If no arguments are specified and this is MAN_ESCOPED (i.e.,
1.31 kristaps 419: * next-line scoped), then set our mode to indicate that we're
420: * waiting for terms to load into our context.
421: */
422:
1.133 schwarze 423: if (n == man->last && man_macro(tok)->flags & MAN_ESCOPED) {
1.75 schwarze 424: man->flags |= MAN_ELINE;
1.91 schwarze 425: return;
1.31 kristaps 426: }
1.64 kristaps 427:
1.101 schwarze 428: assert(man->last->type != ROFFT_ROOT);
1.105 schwarze 429: man->next = ROFF_NEXT_SIBLING;
1.82 schwarze 430:
1.113 schwarze 431: /* Rewind our element scope. */
1.3 kristaps 432:
1.75 schwarze 433: for ( ; man->last; man->last = man->last->parent) {
1.113 schwarze 434: man_state(man, man->last);
1.75 schwarze 435: if (man->last == n)
1.19 kristaps 436: break;
437: }
1.133 schwarze 438:
439: /* Rewind next-line scoped ancestors, if any. */
440:
441: if (man_macro(tok)->flags & MAN_ESCOPED)
442: man_descope(man, line, ppos, NULL);
1.19 kristaps 443: }
1.3 kristaps 444:
1.91 schwarze 445: void
1.109 schwarze 446: man_endparse(struct roff_man *man)
1.19 kristaps 447: {
1.22 kristaps 448:
1.91 schwarze 449: man_unscope(man, man->first);
1.113 schwarze 450: man->flags &= ~MAN_LITERAL;
1.19 kristaps 451: }
1.3 kristaps 452:
1.60 kristaps 453: static int
1.105 schwarze 454: man_args(struct roff_man *man, int line, int *pos, char *buf, char **v)
1.60 kristaps 455: {
456: char *start;
457:
458: assert(*pos);
459: *v = start = buf + *pos;
460: assert(' ' != *start);
461:
462: if ('\0' == *start)
1.112 schwarze 463: return 0;
1.60 kristaps 464:
1.137 ! schwarze 465: *v = roff_getarg(man->roff, v, line, pos);
1.112 schwarze 466: return 1;
1.60 kristaps 467: }
CVSweb