Annotation of texi2mdoc/main.c, Revision 1.47
1.47 ! kristaps 1: /* $Id: main.c,v 1.46 2015/02/25 14:37:17 kristaps Exp $ */
1.1 kristaps 2: /*
3: * Copyright (c) 2015 Kristaps Dzonsons <kristaps@bsd.lv>
4: *
5: * Permission to use, copy, modify, and distribute this software for any
6: * purpose with or without fee is hereby granted, provided that the above
7: * copyright notice and this permission notice appear in all copies.
8: *
9: * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
10: * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
11: * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
12: * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
13: * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
14: * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
15: * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
16: */
1.37 kristaps 17: #if defined(__linux__) || defined(__MINT__)
18: # define _GNU_SOURCE /* memmem */
19: #endif
1.1 kristaps 20: #include <assert.h>
21: #include <ctype.h>
22: #include <getopt.h>
1.2 kristaps 23: #include <libgen.h>
24: #include <limits.h>
1.1 kristaps 25: #include <stdarg.h>
26: #include <stdio.h>
27: #include <stdlib.h>
28: #include <string.h>
1.10 kristaps 29: #include <time.h>
1.47 ! kristaps 30: #include <unistd.h>
1.1 kristaps 31:
1.24 kristaps 32: #include "extern.h"
1.1 kristaps 33:
/*
 * Table of SECTSZ macro names.
 * NOTE(review): presumably indexed by sectioning depth by the dosection
 * family of handlers, which is outside this view -- confirm.
 */
#define	SECTSZ 4
static	const char *const sects[SECTSZ] = { "Sh", "Ss", "Em", "No" };
41:
/*
 * Forward declarations of the per-command handlers referenced by the
 * token table.
 * Every handler has the same shape: the parse state, the command being
 * handled, and the current buffer offset (updated in place).
 */
static	void doaccent(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doblock(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dobracket(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dobye(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dodefindex(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dodefn(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dodisplay(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doend(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doenumerate(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doexample(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doignargn(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doignblock(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doignbracket(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doignline(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doinline(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doinclude(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doitem(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doitemize(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dolink(struct texi *p, enum texicmd cmd, size_t *pos);
static	void domacro(struct texi *p, enum texicmd cmd, size_t *pos);
static	void domath(struct texi *p, enum texicmd cmd, size_t *pos);
static	void domultitable(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doquotation(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dotable(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dotop(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dosecoffs(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dosection(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dosp(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dosubsection(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dosubsubsection(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dosymbol(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dotab(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dotitle(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dovalue(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doverb(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doverbatim(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doverbinclude(struct texi *p, enum texicmd cmd, size_t *pos);
1.1 kristaps 79:
1.24 kristaps 80: static const struct texitok __texitoks[TEXICMD__MAX] = {
1.20 kristaps 81: /* TEXICMD__BEGIN */
1.42 kristaps 82: { doignline, "afourpaper", 10 }, /* TEXICMD_A4PAPER */
83: { dosymbol, "AA", 2 }, /* TEXICMD_AA */
84: { dosymbol, "aa", 2 }, /* TEXICMD_AASMALL */
1.8 kristaps 85: { doignargn, "acronym", 7 }, /* TEXICMD_ACRONYM */
1.16 kristaps 86: { doaccent, "'", 1 }, /* TEXICMD_ACUTE */
1.42 kristaps 87: { dosymbol, "AE", 2 }, /* TEXICMD_AE */
88: { dosymbol, "ae", 2 }, /* TEXICMD_AESMALL */
1.1 kristaps 89: { doignbracket, "anchor", 6 }, /* TEXICMD_ANCHOR */
1.12 kristaps 90: { dosection, "appendix", 8 }, /* TEXICMD_APPENDIX */
91: { dosection, "appendixsec", 11 }, /* TEXICMD_APPENDIXSEC */
1.20 kristaps 92: { dosubsection, "appendixsubsec", 14 }, /* TEXICMD_APPENDIXSUBSEC */
1.23 kristaps 93: { dosubsubsection, "appendixsubsubsec", 17 }, /* TEXICMD_APPENDIXSUBSUBSEC */
1.25 kristaps 94: { doinline, "asis", 4 }, /* TEXICMD_ASIS */
1.3 kristaps 95: { dosymbol, "*", 1 }, /* TEXICMD_ASTERISK */
1.1 kristaps 96: { dosymbol, "@", 1 }, /* TEXICMD_AT */
1.3 kristaps 97: { doignline, "author", 6 }, /* TEXICMD_AUTHOR */
1.21 kristaps 98: { doinline, "b", 1 }, /* TEXICMD_BOLD */
1.3 kristaps 99: { dosymbol, "!", 1 }, /* TEXICMD_BANG */
1.7 kristaps 100: { dosymbol, "bullet", 6 }, /* TEXICMD_BULLET */
1.1 kristaps 101: { dobye, "bye", 3 }, /* TEXICMD_BYE */
1.34 kristaps 102: { doblock, "cartouche", 9 }, /* TEXICMD_CARTOUCHE */
103: { doaccent, ",", 1 }, /* TEXICMD_CEDILLA */
1.12 kristaps 104: { doignline, "center", 6 }, /* TEXICMD_CENTER */
105: { dosection, "chapter", 7 }, /* TEXICMD_CHAPTER */
1.1 kristaps 106: { doignline, "cindex", 6 }, /* TEXICMD_CINDEX */
1.16 kristaps 107: { doaccent, "^", 1 }, /* TEXICMD_CIRCUMFLEX */
1.24 kristaps 108: { doinline, "cite", 4 }, /* TEXICMD_CITE */
109: { dovalue, "clear", 5 }, /* TEXICMD_CLEAR */
1.21 kristaps 110: { doinline, "code", 4 }, /* TEXICMD_CODE */
1.3 kristaps 111: { dosymbol, ":", 1 }, /* TEXICMD_COLON */
1.18 kristaps 112: { NULL, "columnfractions", 15 }, /* TEXICMD_COLUMNFRACTIONS */
1.35 kristaps 113: { dosymbol, "comma", 5 }, /* TEXICMD_COMMA */
1.12 kristaps 114: { doinline, "command", 7 }, /* TEXICMD_COMMAND */
1.1 kristaps 115: { doignline, "c", 1 }, /* TEXICMD_COMMENT */
1.2 kristaps 116: { doignline, "comment", 7 }, /* TEXICMD_COMMENT_LONG */
1.1 kristaps 117: { doignline, "contents", 8 }, /* TEXICMD_CONTENTS */
118: { doignblock, "copying", 7 }, /* TEXICMD_COPYING */
119: { dosymbol, "copyright", 9 }, /* TEXICMD_COPYRIGHT */
1.27 kristaps 120: { dodefindex, "defcodeindex", 12 }, /* TEXICMD_DEFCODEINDEX */
1.15 kristaps 121: { dodefn, "deffn", 5 }, /* TEXICMD_DEFFN */
122: { dodefn, "deffnx", 6 }, /* TEXICMD_DEFFNX */
1.27 kristaps 123: { dodefindex, "defindex", 8 }, /* TEXICMD_DEFINDEX */
1.15 kristaps 124: { dodefn, "defmac", 6 }, /* TEXICMD_DEFMAC */
125: { dodefn, "defmacx", 7 }, /* TEXICMD_DEFMACX */
126: { dodefn, "deftp", 5 }, /* TEXICMD_DEFTP */
127: { dodefn, "deftpx", 6 }, /* TEXICMD_DEFTPX */
128: { dodefn, "deftypefn", 9 }, /* TEXICMD_DEFTYPEFN */
129: { dodefn, "deftypefnx", 10 }, /* TEXICMD_DEFTYPEFNX */
130: { dodefn, "deftypefun", 10 }, /* TEXICMD_DEFTYPEFUN */
131: { dodefn, "deftypefunx", 11 }, /* TEXICMD_DEFTYPEFUNX */
1.34 kristaps 132: { dodefn, "deftypemethod", 13 }, /* TEXICMD_DEFTYPEMETHOD */
133: { dodefn, "deftypemethodx", 14 }, /* TEXICMD_DEFTYPEMETHODX */
1.15 kristaps 134: { dodefn, "deftypevar", 10 }, /* TEXICMD_DEFTYPEVAR */
135: { dodefn, "deftypevarx", 11 }, /* TEXICMD_DEFTYPEVARX */
136: { dodefn, "deftypevr", 9 }, /* TEXICMD_DEFTYPEVR */
137: { dodefn, "deftypevrx", 10 }, /* TEXICMD_DEFTYPEVRX */
138: { dodefn, "defun", 5 }, /* TEXICMD_DEFUN */
139: { dodefn, "defunx", 6 }, /* TEXICMD_DEFUNX */
140: { dodefn, "defvar", 6 }, /* TEXICMD_DEFVAR */
141: { dodefn, "defvarx", 7 }, /* TEXICMD_DEFVARX */
142: { dodefn, "defvr", 5 }, /* TEXICMD_DEFVR */
143: { dodefn, "defvrx", 6 }, /* TEXICMD_DEFVRX */
1.1 kristaps 144: { doignblock, "detailmenu", 10 }, /* TEXICMD_DETAILMENU */
1.21 kristaps 145: { doinline, "dfn", 3 }, /* TEXICMD_DFN */
1.42 kristaps 146: { dosymbol, "DH", 2 }, /* TEXICMD_DH */
147: { dosymbol, "dh", 2 }, /* TEXICMD_DHSMALL */
1.1 kristaps 148: { doignline, "dircategory", 11 }, /* TEXICMD_DIRCATEGORY */
149: { doignblock, "direntry", 8 }, /* TEXICMD_DIRENTRY */
1.3 kristaps 150: { dodisplay, "display", 7 }, /* TEXICMD_DISPLAY */
1.28 kristaps 151: { doignbracket, "dmn", 3 }, /* TEXICMD_DMN */
1.40 kristaps 152: { doignblock, "documentdescription", 19 }, /* TEXICMD_DOCUMENTDESCRIPTION */
153: { doignline, "documentencoding", 16 }, /* TEXICMD_DOCUMENTENCODING */
1.44 kristaps 154: { doignline, "documentlanguage", 16 }, /* TEXICMD_DOCUMENTLANGUAGE */
1.42 kristaps 155: { doaccent, "dotaccent", 9 }, /* TEXICMD_DOTACCENT */
156: { doaccent, "dotless", 7 }, /* TEXICMD_DOTLESS */
1.2 kristaps 157: { dosymbol, "dots", 4 }, /* TEXICMD_DOTS */
1.8 kristaps 158: { dolink, "email", 5 }, /* TEXICMD_EMAIL */
1.21 kristaps 159: { doinline, "emph", 4 }, /* TEXICMD_EMPH */
1.44 kristaps 160: { doend, "end", 3 }, /* TEXICMD_END */
1.34 kristaps 161: { dosymbol, "enddots", 7 }, /* TEXICMD_ENDDOTS */
1.2 kristaps 162: { doenumerate, "enumerate", 9 }, /* TEXICMD_ENUMERATE */
1.12 kristaps 163: { doinline, "env", 3 }, /* TEXICMD_ENV */
1.28 kristaps 164: { dosymbol, "equiv", 5 }, /* TEXICMD_EQUIV */
1.15 kristaps 165: { dosymbol, "error", 5 }, /* TEXICMD_ERROR */
1.43 kristaps 166: { dosymbol, "euro", 4 }, /* TEXICMD_EURO */
1.1 kristaps 167: { doexample, "example", 7 }, /* TEXICMD_EXAMPLE */
1.42 kristaps 168: { dosymbol, "exclamdown", 10 }, /* TEXICMD_EXCLAMDOWN */
1.25 kristaps 169: { doignline, "exdent", 6 }, /* TEXICMD_EXDENT */
1.17 kristaps 170: { dosymbol, "expansion", 9 }, /* TEXICMD_EXPANSION */
1.12 kristaps 171: { doinline, "file", 4 }, /* TEXICMD_FILE */
1.17 kristaps 172: { doignline, "finalout", 8 }, /* TEXICMD_FINALOUT */
1.20 kristaps 173: { doignline, "findex", 6 }, /* TEXICMD_FINDEX */
1.44 kristaps 174: { doblock, "flushleft", 9 }, /* TEXICMD_FLUSHLEFT */
175: { doblock, "flushright", 10 }, /* TEXICMD_FLUSHRIGHT */
176: { doignline, "firstparagraphindent", 20 }, /* TEXICMD_FIRSTPARAGRAPHINDENT */
1.32 kristaps 177: { doignbracket, "footnote", 8 }, /* TEXICMD_FOOTNOTE */
1.44 kristaps 178: { doignline, "footnotestyle", 13 }, /* TEXICMD_FOOTNOTESTYLE */
1.20 kristaps 179: { dotable, "ftable", 6 }, /* TEXICMD_FTABLE */
180: { dodisplay, "format", 6 }, /* TEXICMD_FORMAT */
1.43 kristaps 181: { dosymbol, "geq", 3 }, /* TEXICMD_GEQ */
1.16 kristaps 182: { doaccent, "`", 1 }, /* TEXICMD_GRAVE */
1.3 kristaps 183: { doblock, "group", 5 }, /* TEXICMD_GROUP */
1.43 kristaps 184: { dosymbol, "guillemetleft", 13 }, /* TEXICMD_GUILLEMETLEFT */
185: { dosymbol, "guillemetright", 14 }, /* TEXICMD_GUILLEMETRIGHT */
186: { dosymbol, "guillemotleft", 13 }, /* TEXICMD_GUILLEMOTLEFT */
187: { dosymbol, "guillemotright", 14 }, /* TEXICMD_GUILLEMOTRIGHT */
188: { dosymbol, "guilsinglleft", 13 }, /* TEXICMD_GUILSINGLLEFT */
189: { dosymbol, "guilsinglright", 14 }, /* TEXICMD_GUILSINGLRIGHT */
1.42 kristaps 190: { doaccent, "H", 1 }, /* TEXICMD_H */
1.2 kristaps 191: { dosection, "heading", 7 }, /* TEXICMD_HEADING */
1.3 kristaps 192: { doignline, "headings", 8 }, /* TEXICMD_HEADINGS */
1.18 kristaps 193: { doitem, "headitem", 8 }, /* TEXICMD_HEADITEM */
1.25 kristaps 194: { doignblock, "html", 4 }, /* TEXICMD_HTML */
1.3 kristaps 195: { dosymbol, "-", 1 }, /* TEXICMD_HYPHEN */
1.21 kristaps 196: { doinline, "i", 1 }, /* TEXICMD_I */
1.24 kristaps 197: { dovalue, "ifclear", 7 }, /* TEXICMD_IFCLEAR */
1.14 kristaps 198: { doignblock, "ifdocbook", 9 }, /* TEXICMD_IFDOCBOOK */
1.1 kristaps 199: { doignblock, "ifhtml", 6 }, /* TEXICMD_IFHTML */
1.26 kristaps 200: { doblock, "ifinfo", 6 }, /* TEXICMD_IFINFO */
1.14 kristaps 201: { doblock, "ifnotdocbook", 12 }, /* TEXICMD_IFNOTDOCBOOK */
202: { doblock, "ifnothtml", 9 }, /* TEXICMD_IFNOTHTML */
203: { doblock, "ifnotinfo", 9 }, /* TEXICMD_IFNOTINFO */
204: { doignblock, "ifnotplaintext", 14 }, /* TEXICMD_IFNOTPLAINTEXT */
1.3 kristaps 205: { doblock, "ifnottex", 8 }, /* TEXICMD_IFNOTTEX */
1.14 kristaps 206: { doblock, "ifnotxml", 8 }, /* TEXICMD_IFNOTXML */
207: { doblock, "ifplaintext", 11 }, /* TEXICMD_IFPLAINTEXT */
1.1 kristaps 208: { doignblock, "iftex", 5 }, /* TEXICMD_IFTEX */
1.30 kristaps 209: { dovalue, "ifset", 5 }, /* TEXICMD_IFSET */
1.14 kristaps 210: { doignblock, "ifxml", 5 }, /* TEXICMD_IFXML */
1.17 kristaps 211: { doignblock, "ignore", 6 }, /* TEXICMD_IGNORE */
1.1 kristaps 212: { doignbracket, "image", 5 }, /* TEXICMD_IMAGE */
1.2 kristaps 213: { doinclude, "include", 7 }, /* TEXICMD_INCLUDE */
1.13 kristaps 214: { dodisplay, "indentblock", 11 }, /* TEXICMD_INDENTBLOCK */
1.44 kristaps 215: { dolink, "indicateurl", 11 }, /* TEXICMD_INDICATEURL */
216: { dolink, "inforef", 7 }, /* TEXICMD_INFOREF */
1.5 kristaps 217: { doignline, "insertcopying", 13 }, /* TEXICMD_INSERTCOPYING */
1.1 kristaps 218: { doitem, "item", 4 }, /* TEXICMD_ITEM */
219: { doitemize, "itemize", 7 }, /* TEXICMD_ITEMIZE */
1.20 kristaps 220: { doitem, "itemx", 5 }, /* TEXICMD_ITEMX */
1.21 kristaps 221: { doinline, "kbd", 3 }, /* TEXICMD_KBD */
1.18 kristaps 222: { dobracket, "key", 3 }, /* TEXICMD_KEY */
1.20 kristaps 223: { doignline, "kindex", 6 }, /* TEXICMD_KINDEX */
1.42 kristaps 224: { dosymbol, "L", 1 }, /* TEXICMD_L */
1.1 kristaps 225: { dosymbol, "LaTeX", 5 }, /* TEXICMD_LATEX */
1.43 kristaps 226: { dosymbol, "leq", 3 }, /* TEXICMD_LEQ */
1.23 kristaps 227: { dosecoffs, "lowersections", 13 }, /* TEXICMD_LOWERSECTIONS */
1.42 kristaps 228: { dosymbol, "l", 1 }, /* TEXICMD_LSMALL */
1.30 kristaps 229: { domacro, "macro", 5 }, /* TEXICMD_MACRO */
1.42 kristaps 230: { doaccent, "=", 1 }, /* TEXICMD_MACRON */
1.3 kristaps 231: { domath, "math", 4 }, /* TEXICMD_MATH */
1.1 kristaps 232: { doignblock, "menu", 4 }, /* TEXICMD_MENU */
1.25 kristaps 233: { dosymbol, "minus", 5 }, /* TEXICMD_MINUS */
1.18 kristaps 234: { domultitable, "multitable", 10 }, /* TEXICMD_MULTITABLE */
1.15 kristaps 235: { doignline, "need", 4 }, /* TEXICMD_NEED */
1.3 kristaps 236: { dosymbol, "\n", 1 }, /* TEXICMD_NEWLINE */
1.1 kristaps 237: { doignline, "node", 4 }, /* TEXICMD_NODE */
1.3 kristaps 238: { doignline, "noindent", 8 }, /* TEXICMD_NOINDENT */
1.42 kristaps 239: { dosymbol, "O", 1 }, /* TEXICMD_O */
240: { dosymbol, "OE", 2 }, /* TEXICMD_OE */
241: { dosymbol, "oe", 2 }, /* TEXICMD_OESMALL */
242: { doaccent, "ogonek", 6 }, /* TEXICMD_OGONEK */
1.16 kristaps 243: { doinline, "option", 6 }, /* TEXICMD_OPTION */
1.42 kristaps 244: { dosymbol, "ordf", 4 }, /* TEXICMD_ORDF */
245: { dosymbol, "ordm", 4 }, /* TEXICMD_ORDM */
246: { dosymbol, "o", 1 }, /* TEXICMD_OSMALL */
1.3 kristaps 247: { doignline, "page", 4 }, /* TEXICMD_PAGE */
1.25 kristaps 248: { doignline, "paragraphindent", 15 }, /* TEXICMD_PARINDENT */
249: { dosymbol, ".", 1 }, /* TEXICMD_PERIOD */
1.28 kristaps 250: { doignline, "pindex", 6 }, /* TEXICMD_PINDEX */
1.43 kristaps 251: { dosymbol, "pounds", 6 }, /* TEXICMD_POUNDS */
1.2 kristaps 252: { doignline, "printindex", 10 }, /* TEXICMD_PRINTINDEX */
1.42 kristaps 253: { dolink, "pxref", 5 }, /* TEXICMD_PXREF */
254: { dosymbol, "questiondown", 12 }, /* TEXICMD_QUESTIONDOWN */
255: { dosymbol, "?", 1 }, /* TEXICMD_QUESTIONMARK */
256: { doquotation, "quotation", 9 }, /* TEXICMD_QUOTATION */
1.43 kristaps 257: { dosymbol, "quotedblbase", 12 }, /* TEXICMD_QUOTEDBLBASE */
258: { dosymbol, "quotedblleft", 12 }, /* TEXICMD_QUOTEDBLLEFT */
259: { dosymbol, "quotedblright", 13 }, /* TEXICMD_QUOTEDBLRIGHT */
260: { dosymbol, "quotesinglbase", 14 }, /* TEXICMD_QUOTESINGLBASE */
261: { dosymbol, "quoteleft", 9 }, /* TEXICMD_QUOTELEFT */
262: { dosymbol, "quoteright", 10 }, /* TEXICMD_QUOTERIGHT */
1.21 kristaps 263: { doinline, "r", 1 }, /* TEXICMD_R */
1.23 kristaps 264: { dosecoffs, "raisesections", 13 }, /* TEXICMD_RAISESECTIONS */
1.1 kristaps 265: { dobracket, "ref", 3 }, /* TEXICMD_REF */
1.28 kristaps 266: { doignline, "refill", 6 }, /* TEXICMD_REFILL */
1.43 kristaps 267: { dosymbol, "registeredsymbol", 16 }, /* TEXICMD_REGISTEREDSYMBOL */
1.15 kristaps 268: { dosymbol, "result", 6 }, /* TEXICMD_RESULT */
1.42 kristaps 269: { doaccent, "ringaccent", 10 }, /* TEXICMD_RINGACCENT */
1.21 kristaps 270: { doinline, "samp", 4 }, /* TEXICMD_SAMP */
271: { doinline, "sansserif", 9 }, /* TEXICMD_SANSSERIF */
1.7 kristaps 272: { dobracket, "sc", 2 }, /* TEXICMD_SC */
1.1 kristaps 273: { dosection, "section", 7 }, /* TEXICMD_SECTION */
1.24 kristaps 274: { dovalue, "set", 3 }, /* TEXICMD_SET */
1.1 kristaps 275: { doignline, "setchapternewpage", 17 }, /* TEXICMD_SETCHAPNEWPAGE */
1.35 kristaps 276: { doignline, "setcontentsaftertitlepage", 25 }, /* TEXICMD_SETCONTENTSAFTER */
1.1 kristaps 277: { doignline, "setfilename", 11 }, /* TEXICMD_SETFILENAME */
1.10 kristaps 278: { dotitle, "settitle", 8 }, /* TEXICMD_SETTITLE */
1.25 kristaps 279: { doignline, "shortcontents", 13 }, /* TEXICMD_SHORTCONTENTS */
1.21 kristaps 280: { doinline, "slanted", 7 }, /* TEXICMD_SLANTED */
1.34 kristaps 281: { dosymbol, "/", 1 }, /* TEXICMD_SLASH */
1.3 kristaps 282: { dosp, "sp", 2 }, /* TEXICMD_SP */
283: { dosymbol, " ", 1 }, /* TEXICMD_SPACE */
1.17 kristaps 284: { doignline, "smallbook", 9 }, /* TEXICMD_SMALLBOOK */
1.12 kristaps 285: { dodisplay, "smalldisplay", 12 }, /* TEXICMD_SMALLDISPLAY */
1.3 kristaps 286: { doexample, "smallexample", 12 }, /* TEXICMD_SMALLEXAMPLE */
1.20 kristaps 287: { dodisplay, "smallformat", 11 }, /* TEXICMD_SMALLFORMAT */
1.13 kristaps 288: { dodisplay, "smallindentblock", 16 }, /* TEXICMD_SMALLINDENTBLOCK */
1.3 kristaps 289: { dosymbol, "{", 1 }, /* TEXICMD_SQUIGGLE_LEFT */
290: { dosymbol, "}", 1 }, /* TEXICMD_SQUIGGLE_RIGHT */
1.35 kristaps 291: { dosymbol, "ss", 2 }, /* TEXICMD_SS */
1.21 kristaps 292: { doinline, "strong", 6 }, /* TEXICMD_STRONG */
1.20 kristaps 293: { dosubsection, "subheading", 10 }, /* TEXICMD_SUBHEADING */
1.1 kristaps 294: { dosubsection, "subsection", 10 }, /* TEXICMD_SUBSECTION */
1.28 kristaps 295: { dosubsubsection, "subsubheading", 13 }, /* TEXICMD_SUBSUBHEADING */
1.23 kristaps 296: { dosubsubsection, "subsubsection", 13 }, /* TEXICMD_SUBSUBSECTION */
1.3 kristaps 297: { doignline, "subtitle", 8 }, /* TEXICMD_SUBTITLE */
1.25 kristaps 298: { doignline, "summarycontents", 15 }, /* TEXICMD_SUMMARYCONTENTS */
1.27 kristaps 299: { doignline, "synindex", 8 }, /* TEXICMD_SYNINDEX */
1.20 kristaps 300: { doignline, "syncodeindex", 12 }, /* TEXICMD_SYNCODEINDEX */
1.21 kristaps 301: { doinline, "t", 1 }, /* TEXICMD_T */
1.18 kristaps 302: { dotab, "tab", 3 }, /* TEXICMD_TAB */
303: { dosymbol, "\t", 1 }, /* TEXICMD_TABSYM */
1.1 kristaps 304: { dotable, "table", 5 }, /* TEXICMD_TABLE */
305: { doignblock, "tex", 3 }, /* TEXICMD_TEX */
306: { dosymbol, "TeX", 3 }, /* TEXICMD_TEXSYM */
1.43 kristaps 307: { dosymbol, "textdegree", 10 }, /* TEXICMD_TEXTDEGREE */
1.42 kristaps 308: { dosymbol, "TH", 2 }, /* TEXICMD_TH */
309: { dosymbol, "th", 2 }, /* TEXICMD_THSMALL */
1.35 kristaps 310: { dosymbol, "tie", 3 }, /* TEXICMD_TIE */
1.42 kristaps 311: { doaccent, "tieaccent", 9 }, /* TEXICMD_TIEACCENT */
1.16 kristaps 312: { doaccent, "~", 1 }, /* TEXICMD_TILDE */
1.25 kristaps 313: { doignline, "tindex", 6 }, /* TEXICMD_TINDEX */
1.3 kristaps 314: { doignline, "title", 5 }, /* TEXICMD_TITLE */
1.1 kristaps 315: { dobracket, "titlefont", 9 }, /* TEXICMD_TITLEFONT */
316: { doignblock, "titlepage", 9 }, /* TEXICMD_TITLEPAGE */
317: { dotop, "top", 3 }, /* TEXICMD_TOP */
1.42 kristaps 318: { doaccent, "u", 1 }, /* TEXICMD_U */
319: { doaccent, "ubaraccent", 10 }, /* TEXICMD_UBARACCENT */
320: { doaccent, "udotaccent", 10 }, /* TEXICMD_UDOTACCENT */
1.16 kristaps 321: { doaccent, "\"", 1 }, /* TEXICMD_UMLAUT */
1.12 kristaps 322: { dosection, "unnumbered", 10 }, /* TEXICMD_UNNUMBERED */
1.2 kristaps 323: { dosection, "unnumberedsec", 13 }, /* TEXICMD_UNNUMBEREDSEC */
1.20 kristaps 324: { dosubsection, "unnumberedsubsec", 16 }, /* TEXICMD_UNNUMBEREDSUBSEC */
1.23 kristaps 325: { dosubsubsection, "unnumberedsubsubsec", 19 }, /* TEXICMD_UNNUMBEREDSUBSUBSEC */
1.8 kristaps 326: { dolink, "uref", 4 }, /* TEXICMD_UREF */
327: { dolink, "url", 3 }, /* TEXICMD_URL */
1.34 kristaps 328: { doignline, "", 0 }, /* TEXICMD_USER_INDEX */
1.42 kristaps 329: { doaccent, "v", 1 }, /* TEXICMD_V */
1.24 kristaps 330: { dovalue, "value", 5 }, /* TEXICMD_VALUE */
1.12 kristaps 331: { doinline, "var", 3 }, /* TEXICMD_VAR */
1.33 kristaps 332: { doverb, "verb", 4 }, /* TEXICMD_VERB */
333: { doverbatim, "verbatim", 8 }, /* TEXICMD_VERBATIM */
1.16 kristaps 334: { doverbinclude, "verbatiminclude", 15 }, /* TEXICMD_VERBATIMINCLUDE */
1.18 kristaps 335: { doignline, "vindex", 6 }, /* TEXICMD_VINDEX */
1.9 kristaps 336: { dosp, "vskip", 5 }, /* TEXICMD_VSKIP */
1.20 kristaps 337: { dotable, "vtable", 6 }, /* TEXICMD_VTABLE */
1.3 kristaps 338: { dobracket, "w", 1 }, /* TEXICMD_W */
1.8 kristaps 339: { dolink, "xref", 4 }, /* TEXICMD_XREF */
1.20 kristaps 340: /* TEXICMD__END */
1.1 kristaps 341: };
342:
1.24 kristaps 343: const struct texitok *const texitoks = __texitoks;
1.18 kristaps 344:
1.2 kristaps 345: static void
1.46 kristaps 346: dodefindex(struct texi *p, enum texicmd cmd, size_t *pos)
1.27 kristaps 347: {
348: size_t start, end;
349: char *cp;
350:
1.46 kristaps 351: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
352: advance(p, pos);
1.27 kristaps 353:
354: start = end = *pos;
1.46 kristaps 355: while (end < BUFSZ(p) && ! ismspace(BUF(p)[end]))
1.27 kristaps 356: end++;
357:
358: if (start == end) {
1.46 kristaps 359: advanceeoln(p, pos, 1);
1.27 kristaps 360: return;
361: } else if (NULL == (cp = malloc(end - start + 1)))
362: texiabort(p, NULL);
363:
1.46 kristaps 364: memcpy(cp, &BUF(p)[start], end - start);
1.27 kristaps 365: cp[end - start] = '\0';
366:
367: p->indexs = realloc(p->indexs,
368: sizeof(char *) * (p->indexsz + 1));
369:
370: if (NULL == p->indexs)
371: texiabort(p, NULL);
372: p->indexs[p->indexsz++] = cp;
373: }
374:
375: static void
1.46 kristaps 376: dodefn(struct texi *p, enum texicmd cmd, size_t *pos)
1.3 kristaps 377: {
378: const char *blk;
379:
1.5 kristaps 380: blk = NULL;
1.3 kristaps 381: switch (cmd) {
1.15 kristaps 382: case (TEXICMD_DEFFN):
1.35 kristaps 383: case (TEXICMD_DEFMAC):
1.15 kristaps 384: case (TEXICMD_DEFTP):
1.3 kristaps 385: case (TEXICMD_DEFTYPEFN):
386: case (TEXICMD_DEFTYPEFUN):
1.34 kristaps 387: case (TEXICMD_DEFTYPEMETHOD):
1.15 kristaps 388: case (TEXICMD_DEFTYPEVAR):
389: case (TEXICMD_DEFTYPEVR):
390: case (TEXICMD_DEFUN):
391: case (TEXICMD_DEFVAR):
392: case (TEXICMD_DEFVR):
1.5 kristaps 393: blk = texitoks[cmd].tok;
1.3 kristaps 394: break;
1.5 kristaps 395: default:
1.3 kristaps 396: break;
397: }
398:
399: if (p->ign) {
1.15 kristaps 400: NULL != blk ?
1.46 kristaps 401: parseto(p, pos, blk) :
402: parseeoln(p, pos);
1.3 kristaps 403: return;
404: }
405:
1.15 kristaps 406: if (NULL != blk)
407: texivspace(p);
408:
1.3 kristaps 409: switch (cmd) {
1.34 kristaps 410: case (TEXICMD_DEFTYPEMETHOD):
411: case (TEXICMD_DEFTYPEMETHODX):
412: texiputchars(p, "Method");
413: break;
1.15 kristaps 414: case (TEXICMD_DEFMAC):
415: case (TEXICMD_DEFMACX):
416: texiputchars(p, "Macro");
417: break;
418: case (TEXICMD_DEFTYPEVAR):
419: case (TEXICMD_DEFTYPEVARX):
420: case (TEXICMD_DEFVAR):
421: case (TEXICMD_DEFVARX):
422: texiputchars(p, "Variable");
423: break;
1.3 kristaps 424: case (TEXICMD_DEFTYPEFUN):
1.15 kristaps 425: case (TEXICMD_DEFTYPEFUNX):
426: case (TEXICMD_DEFUN):
427: case (TEXICMD_DEFUNX):
428: texiputchars(p, "Function");
1.3 kristaps 429: break;
430: default:
1.46 kristaps 431: parselinearg(p, pos);
1.3 kristaps 432: break;
433: }
1.15 kristaps 434:
435: texiputchars(p, ":\n");
436:
437: switch (cmd) {
438: case (TEXICMD_DEFMAC):
439: case (TEXICMD_DEFMACX):
440: teximacroopen(p, "Dv");
1.46 kristaps 441: while (parselinearg(p, pos))
1.15 kristaps 442: /* Spin. */ ;
443: teximacroclose(p);
444: break;
445: case (TEXICMD_DEFFN):
446: case (TEXICMD_DEFFNX):
447: case (TEXICMD_DEFUN):
448: case (TEXICMD_DEFUNX):
449: teximacroopen(p, "Fo");
1.46 kristaps 450: parselinearg(p, pos);
1.15 kristaps 451: teximacroclose(p);
452: teximacroopen(p, "Fa");
1.46 kristaps 453: while (parselinearg(p, pos))
1.15 kristaps 454: /* Spin. */ ;
455: teximacroclose(p);
456: teximacro(p, "Fc");
457: break;
458: case (TEXICMD_DEFTYPEFUN):
459: case (TEXICMD_DEFTYPEFUNX):
460: case (TEXICMD_DEFTYPEFN):
461: case (TEXICMD_DEFTYPEFNX):
1.34 kristaps 462: case (TEXICMD_DEFTYPEMETHOD):
463: case (TEXICMD_DEFTYPEMETHODX):
1.15 kristaps 464: teximacroopen(p, "Ft");
1.46 kristaps 465: parselinearg(p, pos);
1.15 kristaps 466: teximacroclose(p);
467: teximacroopen(p, "Fo");
1.46 kristaps 468: parselinearg(p, pos);
1.15 kristaps 469: teximacroclose(p);
470: teximacroopen(p, "Fa");
1.46 kristaps 471: while (parselinearg(p, pos))
1.15 kristaps 472: /* Spin. */ ;
473: teximacroclose(p);
474: teximacro(p, "Fc");
475: break;
476: case (TEXICMD_DEFTP):
477: case (TEXICMD_DEFTPX):
478: case (TEXICMD_DEFTYPEVAR):
479: case (TEXICMD_DEFTYPEVARX):
480: case (TEXICMD_DEFTYPEVR):
481: case (TEXICMD_DEFTYPEVRX):
482: teximacroopen(p, "Vt");
1.46 kristaps 483: while (parselinearg(p, pos))
1.15 kristaps 484: /* Spin. */ ;
485: teximacroclose(p);
486: break;
487: case (TEXICMD_DEFVAR):
488: case (TEXICMD_DEFVARX):
489: case (TEXICMD_DEFVR):
490: case (TEXICMD_DEFVRX):
491: teximacroopen(p, "Va");
1.46 kristaps 492: while (parselinearg(p, pos))
1.15 kristaps 493: /* Spin. */ ;
494: teximacroclose(p);
495: break;
496: default:
497: abort();
1.3 kristaps 498: }
1.15 kristaps 499:
1.11 kristaps 500: texivspace(p);
1.3 kristaps 501: if (NULL != blk)
1.46 kristaps 502: parseto(p, pos, blk);
1.3 kristaps 503: }
504:
505: static void
1.46 kristaps 506: domacro(struct texi *p, enum texicmd cmd, size_t *pos)
1.30 kristaps 507: {
508: size_t start, end, endtoksz, len;
509: struct teximacro m;
510: const char *endtok, *blk;
511:
512: memset(&m, 0, sizeof(struct teximacro));
513:
1.46 kristaps 514: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
515: advance(p, pos);
1.30 kristaps 516:
1.46 kristaps 517: for (start = end = *pos; end < BUFSZ(p); end++)
518: if (ismspace(BUF(p)[end]) || '{' == BUF(p)[end])
1.30 kristaps 519: break;
520:
521: if (start == end)
522: texierr(p, "zero-length macro name");
523:
1.46 kristaps 524: advanceto(p, pos, end);
1.30 kristaps 525:
526: m.key = malloc(end - start + 1);
527: if (NULL == m.key)
528: texiabort(p, NULL);
1.46 kristaps 529: memcpy(m.key, &BUF(p)[start], end - start);
1.30 kristaps 530: m.key[end - start] = '\0';
531:
1.46 kristaps 532: m.args = argparse(p, pos, &m.argsz, 0);
1.30 kristaps 533:
1.46 kristaps 534: /* Note: we advance to the beginning of the macro. */
535: advanceeoln(p, pos, 1);
536:
537: /*
538: * According to the Texinfo manual, the macro ends on the
539: * newline subsequent the @end macro.
540: * That's COMPLETELY FUCKING WRONG.
541: * It ends inclusive the newline, which is why so many macros
542: * say things like @r{hello}@c, where the subsequent @c swallows
543: * the newline.
544: * However, it does swallow the leading newline, so look for the
545: * @end macro without the leading newline else we might look
546: * past empty macros.
547: */
1.30 kristaps 548: start = *pos;
1.46 kristaps 549: endtok = "@end macro\n";
1.30 kristaps 550: endtoksz = strlen(endtok);
1.46 kristaps 551: blk = memmem(&BUF(p)[start], BUFSZ(p) - start, endtok, endtoksz);
1.30 kristaps 552: if (NULL == blk)
553: texierr(p, "unterminated macro body");
1.46 kristaps 554: /* Roll us back one character. */
555: while (&BUF(p)[*pos] != blk)
556: advance(p, pos);
557: assert('@' == BUF(p)[*pos]);
558: if ('\n' != BUF(p)[*pos - 1])
559: texierr(p, "cannot handle @end macro in-line");
560:
561: len = blk - &BUF(p)[start];
1.30 kristaps 562: m.value = malloc(len + 1);
563: if (NULL == m.value)
564: texiabort(p, NULL);
1.46 kristaps 565: memcpy(m.value, &BUF(p)[start], len);
1.30 kristaps 566: m.value[len] = '\0';
567:
568: p->macros = realloc
569: (p->macros,
570: (p->macrosz + 1) *
571: sizeof(struct teximacro));
572: if (NULL == p->macros)
573: texiabort(p, NULL);
574:
575: p->macros[p->macrosz++] = m;
1.46 kristaps 576: advanceeoln(p, pos, 1);
1.30 kristaps 577: }
578:
579: static void
1.46 kristaps 580: doignblock(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 581: {
1.45 kristaps 582: char end[32], start[32];
583: const char *endt, *startt;
584: size_t esz, ssz, newpos, stack;
1.26 kristaps 585:
586: /*
1.45 kristaps 587: * FIXME: this is cheating.
588: * These tokens are supposed to begin on a newline.
589: * However, if we do that, then we would need to check within
590: * the loop for trailer (or leading, as the case may be)
591: * newline, and that's just a bit too complicated right now.
592: * This is becasue
593: * @ifset BAR
594: * @ifset FOO
595: * @end ifset
596: * @end ifset
597: * won't work right now: we'd read after the first "@end ifset"
598: * to the next line, then look for the next line after that.
1.26 kristaps 599: */
1.45 kristaps 600: ssz = snprintf(start, sizeof(start),
601: "@%s", texitoks[cmd].tok);
602: assert(ssz < sizeof(start));
603: esz = snprintf(end, sizeof(end),
604: "@end %s\n", texitoks[cmd].tok);
605: assert(esz < sizeof(end));
606: stack = 1;
607:
608: /*
609: * Here we look for the end token "end" somewhere in the file in
610: * front of us.
611: * It's not that easy, of course: if we have a nested block,
612: * then there'll be an "end" token of the same kind between us.
613: * Thus, we keep track of scopes for matching "end" blocks.
1.26 kristaps 614: */
1.46 kristaps 615: while (stack > 0 && *pos < BUFSZ(p)) {
1.45 kristaps 616: if (stack > 10)
617: abort();
1.46 kristaps 618: endt = memmem(&BUF(p)[*pos], BUFSZ(p) - *pos, end, esz);
619: startt = memmem(&BUF(p)[*pos], BUFSZ(p) - *pos, start, ssz);
1.45 kristaps 620: if (NULL == endt) {
621: texiwarn(p, "unterminated \"%s\" "
622: "block", texitoks[cmd].tok);
1.46 kristaps 623: *pos = BUFSZ(p);
1.45 kristaps 624: break;
625: }
1.26 kristaps 626:
1.45 kristaps 627: newpos = *pos;
628: if (NULL == startt || startt > endt) {
1.46 kristaps 629: newpos += esz + (size_t)(endt - &BUF(p)[*pos]);
1.45 kristaps 630: stack--;
631: } else {
1.46 kristaps 632: newpos += ssz + (size_t)(startt - &BUF(p)[*pos]);
1.45 kristaps 633: stack++;
634: }
635:
1.46 kristaps 636: assert(newpos <= BUFSZ(p));
1.45 kristaps 637: while (*pos < newpos)
1.46 kristaps 638: advance(p, pos);
1.45 kristaps 639: }
1.1 kristaps 640: }
641:
642: static void
1.46 kristaps 643: doblock(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 644: {
645:
1.46 kristaps 646: parseto(p, pos, texitoks[cmd].tok);
1.1 kristaps 647: }
648:
649: static void
1.46 kristaps 650: doinline(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 651: {
1.21 kristaps 652: const char *macro = NULL;
1.12 kristaps 653:
654: switch (cmd) {
1.21 kristaps 655: case (TEXICMD_CODE):
656: case (TEXICMD_KBD):
657: case (TEXICMD_SAMP):
658: case (TEXICMD_T):
659: macro = "Li";
660: break;
661: case (TEXICMD_CITE):
662: case (TEXICMD_DFN):
663: case (TEXICMD_EMPH):
664: case (TEXICMD_I):
665: case (TEXICMD_SLANTED):
666: macro = "Em";
667: break;
668: case (TEXICMD_B):
669: case (TEXICMD_STRONG):
670: macro = "Sy";
671: break;
1.12 kristaps 672: case (TEXICMD_COMMAND):
673: macro = "Xr";
674: break;
675: case (TEXICMD_ENV):
676: macro = "Ev";
677: break;
678: case (TEXICMD_FILE):
679: macro = "Pa";
680: break;
1.16 kristaps 681: case (TEXICMD_OPTION):
682: macro = "Op";
683: break;
1.12 kristaps 684: case (TEXICMD_VAR):
685: macro = "Va";
686: break;
687: default:
1.22 kristaps 688: break;
1.12 kristaps 689: }
690:
1.25 kristaps 691: if (NULL == macro || p->literal || TEXILIST_TABLE == p->list) {
1.46 kristaps 692: parsebracket(p, pos);
1.12 kristaps 693: return;
694: }
1.1 kristaps 695:
1.5 kristaps 696: teximacroopen(p, macro);
1.1 kristaps 697: p->seenws = 0;
1.46 kristaps 698: parsebracket(p, pos);
699: texipunctuate(p, pos);
1.5 kristaps 700: teximacroclose(p);
1.1 kristaps 701: }
702:
703: static void
1.46 kristaps 704: doverb(struct texi *p, enum texicmd cmd, size_t *pos)
1.33 kristaps 705: {
706: char delim;
1.34 kristaps 707: size_t start;
1.33 kristaps 708:
1.46 kristaps 709: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
710: advance(p, pos);
711: if (*pos == BUFSZ(p) || '{' != BUF(p)[*pos])
1.33 kristaps 712: return;
1.46 kristaps 713: advance(p, pos);
714: if (*pos == BUFSZ(p))
1.33 kristaps 715: return;
716:
1.46 kristaps 717: delim = BUF(p)[*pos];
718: advance(p, pos);
1.33 kristaps 719: /* Make sure we flush out our initial whitespace... */
720: if (p->seenws && p->outcol && 0 == p->literal)
721: texiputchar(p, ' ');
722: p->seenws = 0;
1.34 kristaps 723: start = *pos;
1.33 kristaps 724: /* Read until we see the delimiter then end-brace. */
1.46 kristaps 725: while (*pos < BUFSZ(p) - 1) {
726: if (BUF(p)[*pos] == delim && BUF(p)[*pos + 1] == '}')
1.33 kristaps 727: break;
1.46 kristaps 728: advance(p, pos);
1.33 kristaps 729: }
1.46 kristaps 730: if (*pos == BUFSZ(p) - 1)
1.33 kristaps 731: return;
1.46 kristaps 732: texiputbuf(p, start, *pos);
1.34 kristaps 733:
1.33 kristaps 734: /* Make sure we read after the end-brace. */
1.46 kristaps 735: assert(delim == BUF(p)[*pos]);
736: advance(p, pos);
737: assert('}' == BUF(p)[*pos]);
738: advance(p, pos);
1.33 kristaps 739: }
740:
741: static void
1.46 kristaps 742: doverbatim(struct texi *p, enum texicmd cmd, size_t *pos)
1.25 kristaps 743: {
744: const char *end, *term;
745: size_t endsz, endpos;
746:
1.45 kristaps 747: /* We read from the @verbatim\n newline inclusive! */
1.25 kristaps 748: end = "\n@end verbatim\n";
749: endsz = strlen(end);
1.46 kristaps 750: advanceeoln(p, pos, 0);
751: if (*pos == BUFSZ(p)) {
1.45 kristaps 752: texiwarn(p, "unexpected end of file");
753: return;
754: }
1.25 kristaps 755:
1.46 kristaps 756: term = memmem(&BUF(p)[*pos], BUFSZ(p) - *pos, end, endsz);
1.45 kristaps 757: if (NULL == term) {
758: texiwarn(p, "unterminated verbatim block");
1.46 kristaps 759: endpos = BUFSZ(p);
1.45 kristaps 760: } else
1.46 kristaps 761: endpos = *pos + (size_t)(term - &BUF(p)[*pos]);
1.25 kristaps 762:
1.46 kristaps 763: assert(endpos <= BUFSZ(p));
764: assert('\n' == BUF(p)[*pos]);
765: advance(p, pos);
1.25 kristaps 766: teximacro(p, "Bd -literal -offset indent");
1.26 kristaps 767: while (*pos < endpos) {
1.46 kristaps 768: texiputchar(p, BUF(p)[*pos]);
769: advance(p, pos);
1.25 kristaps 770: }
771: teximacro(p, "Ed");
1.46 kristaps 772: if (*pos < BUFSZ(p))
773: advanceto(p, pos, endpos + endsz);
1.25 kristaps 774: }
775:
776: static void
1.46 kristaps 777: doverbinclude(struct texi *p, enum texicmd cmd, size_t *pos)
1.16 kristaps 778: {
1.25 kristaps 779: char fname[PATH_MAX], path[PATH_MAX];
780: int rc;
781: size_t i, end;
782: const char *v;
783: enum texicmd type;
1.16 kristaps 784:
1.46 kristaps 785: while (*pos < BUFSZ(p) && ' ' == BUF(p)[*pos])
786: advance(p, pos);
1.16 kristaps 787:
1.46 kristaps 788: for (i = 0; *pos < BUFSZ(p) && '\n' != BUF(p)[*pos]; ) {
1.16 kristaps 789: if (i == sizeof(fname) - 1)
790: break;
1.46 kristaps 791: if ('@' != BUF(p)[*pos]) {
792: fname[i++] = BUF(p)[*pos];
793: advance(p, pos);
1.25 kristaps 794: continue;
795: }
1.46 kristaps 796: type = texicmd(p, *pos, &end, NULL);
797: advanceto(p, pos, end);
1.25 kristaps 798: if (TEXICMD_VALUE != type)
799: texierr(p, "unknown verbatiminclude command");
1.46 kristaps 800: v = valueblookup(p, pos);
1.25 kristaps 801: if (NULL == v)
802: continue;
803: while ('\0' != *v) {
804: if (i == sizeof(fname) - 1)
805: break;
806: fname[i++] = *v++;
807: }
808: if ('\0' != *v)
809: break;
1.16 kristaps 810: }
811:
812: if (i == 0)
813: texierr(p, "path too short");
1.46 kristaps 814: else if ('\n' != BUF(p)[*pos])
1.16 kristaps 815: texierr(p, "path too long");
816: else if ('/' == fname[0])
817: texierr(p, "no absolute paths");
818: fname[i] = '\0';
819:
820: if (strstr(fname, "../") || strstr(fname, "/.."))
821: texierr(p, "insecure path");
822:
823: rc = snprintf(path, sizeof(path),
824: "%s/%s", p->dirs[0], fname);
825: if (rc < 0)
826: texierr(p, "couldn't format path");
827: else if ((size_t)rc >= sizeof(path))
828: texierr(p, "path too long");
829:
830: parsefile(p, path, 0);
831: }
832:
833: static void
1.46 kristaps 834: doinclude(struct texi *p, enum texicmd cmd, size_t *pos)
1.2 kristaps 835: {
1.25 kristaps 836: char fname[PATH_MAX], path[PATH_MAX];
837: size_t i, end;
838: int rc;
839: const char *v;
840: enum texicmd type;
1.2 kristaps 841:
1.46 kristaps 842: while (*pos < BUFSZ(p) && ' ' == BUF(p)[*pos])
843: advance(p, pos);
1.2 kristaps 844:
845: /* Read in the filename. */
1.46 kristaps 846: for (i = 0; *pos < BUFSZ(p) && '\n' != BUF(p)[*pos]; ) {
1.2 kristaps 847: if (i == sizeof(fname) - 1)
848: break;
1.46 kristaps 849: if ('@' != BUF(p)[*pos]) {
850: fname[i++] = BUF(p)[*pos];
851: advance(p, pos);
1.25 kristaps 852: continue;
853: }
1.46 kristaps 854: type = texicmd(p, *pos, &end, NULL);
855: advanceto(p, pos, end);
1.25 kristaps 856: if (TEXICMD_VALUE != type)
857: texierr(p, "unknown include command");
1.46 kristaps 858: v = valueblookup(p, pos);
1.25 kristaps 859: if (NULL == v)
860: continue;
861: while ('\0' != *v) {
862: if (i == sizeof(fname) - 1)
863: break;
864: fname[i++] = *v++;
865: }
866: if ('\0' != *v)
867: break;
1.2 kristaps 868: }
869:
870: if (i == 0)
871: texierr(p, "path too short");
1.46 kristaps 872: else if ('\n' != BUF(p)[*pos])
1.2 kristaps 873: texierr(p, "path too long");
874: else if ('/' == fname[0])
875: texierr(p, "no absolute paths");
876: fname[i] = '\0';
877:
878: if (strstr(fname, "../") || strstr(fname, "/.."))
879: texierr(p, "insecure path");
880:
1.5 kristaps 881: for (i = 0; i < p->dirsz; i++) {
882: rc = snprintf(path, sizeof(path),
883: "%s/%s", p->dirs[i], fname);
884: if (rc < 0)
885: texierr(p, "couldn't format path");
886: else if ((size_t)rc >= sizeof(path))
887: texierr(p, "path too long");
888: else if (-1 == access(path, R_OK))
889: continue;
890:
1.16 kristaps 891: parsefile(p, path, 1);
1.5 kristaps 892: return;
893: }
1.2 kristaps 894:
1.5 kristaps 895: texierr(p, "couldn't find %s in includes", fname);
1.2 kristaps 896: }
897:
898: static void
1.46 kristaps 899: dobracket(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 900: {
901:
1.46 kristaps 902: parsebracket(p, pos);
1.1 kristaps 903: }
904:
905: static void
1.46 kristaps 906: dodisplay(struct texi *p, enum texicmd cmd, size_t *pos)
1.3 kristaps 907: {
908:
1.20 kristaps 909: switch (cmd) {
910: case (TEXICMD_FORMAT):
911: case (TEXICMD_SMALLFORMAT):
912: teximacro(p, "Bd -filled");
913: break;
914: default:
915: teximacro(p, "Bd -filled -offset indent");
916: break;
917: }
918:
1.11 kristaps 919: p->seenvs = 1;
1.12 kristaps 920: /* FIXME: ignore and parseeoln. */
1.46 kristaps 921: advanceeoln(p, pos, 1);
922: parseto(p, pos, texitoks[cmd].tok);
1.5 kristaps 923: teximacro(p, "Ed");
1.3 kristaps 924: }
925:
926: static void
1.46 kristaps 927: doexample(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 928: {
929:
1.5 kristaps 930: teximacro(p, "Bd -literal -offset indent");
1.12 kristaps 931: /* FIXME: ignore and parseeoln. */
1.46 kristaps 932: advanceeoln(p, pos, 1);
1.3 kristaps 933: p->literal++;
1.46 kristaps 934: parseto(p, pos, texitoks[cmd].tok);
1.3 kristaps 935: p->literal--;
1.5 kristaps 936: teximacro(p, "Ed");
1.1 kristaps 937: }
938:
939: static void
1.46 kristaps 940: dobye(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 941: {
942:
943: texiexit(p);
944: exit(EXIT_SUCCESS);
945: }
946:
947: static void
1.46 kristaps 948: dotitle(struct texi *p, enum texicmd cmd, size_t *pos)
1.10 kristaps 949: {
950: size_t start, end;
951:
1.46 kristaps 952: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
953: advance(p, pos);
1.10 kristaps 954: start = end = *pos;
1.46 kristaps 955: while (end < BUFSZ(p) && '\n' != BUF(p)[end])
1.10 kristaps 956: end++;
1.46 kristaps 957: advanceeoln(p, pos, 1);
1.10 kristaps 958: free(p->subtitle);
959: p->subtitle = malloc(end - start + 1);
1.27 kristaps 960: if (NULL == p->subtitle)
961: texiabort(p, NULL);
1.46 kristaps 962: memcpy(p->subtitle, &BUF(p)[start], end - start);
1.10 kristaps 963: p->subtitle[end - start] = '\0';
964: }
965:
966: static void
1.46 kristaps 967: doaccent(struct texi *p, enum texicmd cmd, size_t *pos)
1.16 kristaps 968: {
1.42 kristaps 969: int brace = 0;
1.16 kristaps 970:
1.46 kristaps 971: if (*pos == BUFSZ(p)) {
1.42 kristaps 972: texiwarn(p, "truncated: @%s", texitoks[cmd].tok);
1.16 kristaps 973: return;
1.42 kristaps 974: }
975:
976: /* Pad us with space, if necessary. */
977: if (p->seenws && p->outcol && 0 == p->literal) {
1.34 kristaps 978: texiputchar(p, ' ');
1.42 kristaps 979: p->seenws = 0;
980: }
981:
982: /*
983: * If we're braced, then that's that.
984: * Otherwise, in a special Texinfo case: if we're a non
985: * alphabetic command of one letter, then the next character is
986: * the critical one.
987: * Otherwise, space can sit between us and our argument.
988: */
1.46 kristaps 989: if ('{' == BUF(p)[*pos]) {
1.42 kristaps 990: brace = 1;
1.46 kristaps 991: advance(p, pos);
1.42 kristaps 992: } else if (isalpha(texitoks[cmd].tok[0]))
1.46 kristaps 993: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
994: advance(p, pos);
1.42 kristaps 995:
1.46 kristaps 996: if (*pos == BUFSZ(p)) {
1.42 kristaps 997: texiwarn(p, "truncated: @%s", texitoks[cmd].tok);
998: return;
999: }
1000:
1001: switch (cmd) {
1.16 kristaps 1002: case (TEXICMD_ACUTE):
1.46 kristaps 1003: switch (BUF(p)[*pos]) {
1.16 kristaps 1004: case ('a'): case ('A'):
1005: case ('e'): case ('E'):
1006: case ('i'): case ('I'):
1007: case ('o'): case ('O'):
1008: case ('u'): case ('U'):
1009: texiputchars(p, "\\(\'");
1010: break;
1011: default:
1.42 kristaps 1012: texiwarn(p, "ignoring accent");
1013: break;
1.16 kristaps 1014: }
1.46 kristaps 1015: texiputchar(p, BUF(p)[*pos]);
1016: advance(p, pos);
1.42 kristaps 1017: break;
1018: case (TEXICMD_CEDILLA):
1.46 kristaps 1019: if ('c' == BUF(p)[*pos] || 'C' == BUF(p)[*pos])
1.42 kristaps 1020: texiputchars(p, "\\(,");
1021: else
1022: texiwarn(p, "ignoring accent");
1.46 kristaps 1023: texiputchar(p, BUF(p)[*pos]);
1024: advance(p, pos);
1.16 kristaps 1025: break;
1026: case (TEXICMD_CIRCUMFLEX):
1.46 kristaps 1027: switch (BUF(p)[*pos]) {
1.16 kristaps 1028: case ('a'): case ('A'):
1029: case ('e'): case ('E'):
1030: case ('i'): case ('I'):
1031: case ('o'): case ('O'):
1032: case ('u'): case ('U'):
1033: texiputchars(p, "\\(^");
1034: break;
1035: default:
1.42 kristaps 1036: texiwarn(p, "ignoring accent");
1.34 kristaps 1037: break;
1.16 kristaps 1038: }
1.46 kristaps 1039: texiputchar(p, BUF(p)[*pos]);
1040: advance(p, pos);
1.42 kristaps 1041: break;
1042: case (TEXICMD_DOTLESS):
1.46 kristaps 1043: if ('i' == BUF(p)[*pos] || 'j' == BUF(p)[*pos])
1.42 kristaps 1044: texiputchars(p, "\\(.");
1045: else
1046: texiwarn(p, "ignoring accent");
1.46 kristaps 1047: texiputchar(p, BUF(p)[*pos]);
1048: advance(p, pos);
1.16 kristaps 1049: break;
1050: case (TEXICMD_GRAVE):
1.46 kristaps 1051: switch (BUF(p)[*pos]) {
1.16 kristaps 1052: case ('a'): case ('A'):
1053: case ('e'): case ('E'):
1054: case ('i'): case ('I'):
1055: case ('o'): case ('O'):
1056: case ('u'): case ('U'):
1057: texiputchars(p, "\\(`");
1058: break;
1059: default:
1.42 kristaps 1060: texiwarn(p, "ignoring accent");
1061: break;
1.16 kristaps 1062: }
1.46 kristaps 1063: texiputchar(p, BUF(p)[*pos]);
1064: advance(p, pos);
1.16 kristaps 1065: break;
1066: case (TEXICMD_TILDE):
1.46 kristaps 1067: switch (BUF(p)[*pos]) {
1.16 kristaps 1068: case ('a'): case ('A'):
1069: case ('n'): case ('N'):
1070: case ('o'): case ('O'):
1071: texiputchars(p, "\\(~");
1072: break;
1073: default:
1.42 kristaps 1074: texiwarn(p, "ignoring accent");
1.34 kristaps 1075: break;
1.16 kristaps 1076: }
1.46 kristaps 1077: texiputchar(p, BUF(p)[*pos]);
1078: advance(p, pos);
1.16 kristaps 1079: break;
1080: case (TEXICMD_UMLAUT):
1.46 kristaps 1081: switch (BUF(p)[*pos]) {
1.16 kristaps 1082: case ('a'): case ('A'):
1083: case ('e'): case ('E'):
1084: case ('i'): case ('I'):
1085: case ('o'): case ('O'):
1086: case ('u'): case ('U'):
1087: case ('y'):
1088: texiputchars(p, "\\(:");
1089: break;
1090: default:
1.42 kristaps 1091: texiwarn(p, "ignoring accent");
1.34 kristaps 1092: break;
1.16 kristaps 1093: }
1.46 kristaps 1094: texiputchar(p, BUF(p)[*pos]);
1095: advance(p, pos);
1.16 kristaps 1096: break;
1097: default:
1.46 kristaps 1098: texiputchar(p, BUF(p)[*pos]);
1099: advance(p, pos);
1.42 kristaps 1100: break;
1101: }
1102:
1103: if (brace) {
1.46 kristaps 1104: while (*pos < BUFSZ(p) && '}' != BUF(p)[*pos]) {
1105: texiputchar(p, BUF(p)[*pos]);
1106: advance(p, pos);
1.42 kristaps 1107: }
1.46 kristaps 1108: if (*pos < BUFSZ(p))
1109: advance(p, pos);
1.42 kristaps 1110: }
1111:
1112: switch (cmd) {
1113: case (TEXICMD_TIEACCENT):
1114: texiputchar(p, ']');
1115: break;
1116: case (TEXICMD_DOTACCENT):
1117: texiputchar(p, '*');
1118: break;
1119: default:
1120: break;
1.16 kristaps 1121: }
1122: }
1123:
1124: static void
1.46 kristaps 1125: dosymbol(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1126: {
1127:
1.42 kristaps 1128: /* Remember to pad us. */
1.43 kristaps 1129: if (p->seenws && p->outcol && 0 == p->literal)
1.3 kristaps 1130: texiputchar(p, ' ');
1.43 kristaps 1131:
1132: p->seenws = 0;
1.3 kristaps 1133:
1.1 kristaps 1134: switch (cmd) {
1.42 kristaps 1135: case (TEXICMD_AA):
1136: texiputchars(p, "\\(oA");
1137: break;
1138: case (TEXICMD_AASMALL):
1139: texiputchars(p, "\\(oa");
1140: break;
1141: case (TEXICMD_AE):
1142: texiputchars(p, "\\(AE");
1143: break;
1144: case (TEXICMD_AESMALL):
1145: texiputchars(p, "\\(ae");
1146: break;
1.3 kristaps 1147: case (TEXICMD_ASTERISK):
1148: case (TEXICMD_NEWLINE):
1149: case (TEXICMD_SPACE):
1.18 kristaps 1150: case (TEXICMD_TABSYM):
1.3 kristaps 1151: texiputchar(p, ' ');
1152: break;
1.1 kristaps 1153: case (TEXICMD_AT):
1.3 kristaps 1154: texiputchar(p, '@');
1155: break;
1156: case (TEXICMD_BANG):
1157: texiputchar(p, '!');
1.7 kristaps 1158: break;
1159: case (TEXICMD_BULLET):
1160: texiputchars(p, "\\(bu");
1.1 kristaps 1161: break;
1.35 kristaps 1162: case (TEXICMD_COMMA):
1163: texiputchar(p, ',');
1164: break;
1.1 kristaps 1165: case (TEXICMD_COPYRIGHT):
1166: texiputchars(p, "\\(co");
1167: break;
1.42 kristaps 1168: case (TEXICMD_DH):
1169: texiputchars(p, "\\(-D");
1170: break;
1171: case (TEXICMD_DHSMALL):
1172: texiputchars(p, "\\(Sd");
1173: break;
1.2 kristaps 1174: case (TEXICMD_DOTS):
1.34 kristaps 1175: case (TEXICMD_ENDDOTS):
1.2 kristaps 1176: texiputchars(p, "...");
1177: break;
1.28 kristaps 1178: case (TEXICMD_EQUIV):
1179: texiputchars(p, "\\(==");
1180: break;
1.15 kristaps 1181: case (TEXICMD_ERROR):
1182: texiputchars(p, "error\\(->");
1.17 kristaps 1183: break;
1.43 kristaps 1184: case (TEXICMD_EURO):
1185: texiputchars(p, "\\(Eu");
1186: break;
1.42 kristaps 1187: case (TEXICMD_EXCLAMDOWN):
1188: texiputchars(p, "\\(r!");
1189: break;
1.17 kristaps 1190: case (TEXICMD_EXPANSION):
1191: texiputchars(p, "\\(->");
1.15 kristaps 1192: break;
1.43 kristaps 1193: case (TEXICMD_GEQ):
1194: texiputchars(p, "\\(>=");
1195: break;
1196: case (TEXICMD_GUILLEMETLEFT):
1197: case (TEXICMD_GUILLEMOTLEFT):
1198: texiputchars(p, "\\(Fo");
1199: break;
1200: case (TEXICMD_GUILLEMETRIGHT):
1201: case (TEXICMD_GUILLEMOTRIGHT):
1202: texiputchars(p, "\\(Fc");
1203: break;
1204: case (TEXICMD_GUILSINGLLEFT):
1205: texiputchars(p, "\\(fo");
1206: break;
1207: case (TEXICMD_GUILSINGLRIGHT):
1208: texiputchars(p, "\\(fc");
1209: break;
1.42 kristaps 1210: case (TEXICMD_L):
1211: texiputchars(p, "\\(/L");
1212: break;
1.1 kristaps 1213: case (TEXICMD_LATEX):
1214: texiputchars(p, "LaTeX");
1215: break;
1.43 kristaps 1216: case (TEXICMD_LEQ):
1217: texiputchars(p, "\\(<=");
1218: break;
1.42 kristaps 1219: case (TEXICMD_LSMALL):
1220: texiputchars(p, "\\(/l");
1221: break;
1.25 kristaps 1222: case (TEXICMD_MINUS):
1223: texiputchars(p, "\\-");
1224: break;
1.42 kristaps 1225: case (TEXICMD_O):
1226: texiputchars(p, "\\(/O");
1227: break;
1228: case (TEXICMD_OE):
1229: texiputchars(p, "\\(OE");
1230: break;
1231: case (TEXICMD_OESMALL):
1232: texiputchars(p, "\\(oe");
1233: break;
1234: case (TEXICMD_ORDF):
1235: texiputchars(p, "a");
1236: break;
1237: case (TEXICMD_ORDM):
1238: texiputchars(p, "o");
1239: break;
1240: case (TEXICMD_OSMALL):
1241: texiputchars(p, "\\(/o");
1242: break;
1.25 kristaps 1243: case (TEXICMD_PERIOD):
1244: texiputchar(p, '.');
1245: break;
1.43 kristaps 1246: case (TEXICMD_POUNDS):
1247: texiputchars(p, "\\(Po");
1248: break;
1.42 kristaps 1249: case (TEXICMD_QUESTIONDOWN):
1250: texiputchars(p, "\\(r?");
1251: break;
1.3 kristaps 1252: case (TEXICMD_QUESTIONMARK):
1253: texiputchar(p, '?');
1.15 kristaps 1254: break;
1.43 kristaps 1255: case (TEXICMD_QUOTEDBLBASE):
1256: texiputchars(p, "\\(Bq");
1257: break;
1258: case (TEXICMD_QUOTEDBLLEFT):
1259: texiputchars(p, "\\(lq");
1260: break;
1261: case (TEXICMD_QUOTEDBLRIGHT):
1262: texiputchars(p, "\\(rq");
1263: break;
1264: case (TEXICMD_QUOTESINGLBASE):
1265: texiputchars(p, "\\(bq");
1266: break;
1267: case (TEXICMD_QUOTELEFT):
1268: texiputchars(p, "\\(oq");
1269: break;
1270: case (TEXICMD_QUOTERIGHT):
1271: texiputchars(p, "\\(cq");
1272: break;
1273: case (TEXICMD_REGISTEREDSYMBOL):
1274: texiputchars(p, "\\(rg");
1275: break;
1.15 kristaps 1276: case (TEXICMD_RESULT):
1277: texiputchars(p, "\\(rA");
1.3 kristaps 1278: break;
1.34 kristaps 1279: case (TEXICMD_SLASH):
1280: texiputchar(p, '/');
1281: break;
1.35 kristaps 1282: case (TEXICMD_SS):
1283: texiputchars(p, "\\(ss");
1284: break;
1.3 kristaps 1285: case (TEXICMD_SQUIGGLE_LEFT):
1286: texiputchars(p, "{");
1287: break;
1288: case (TEXICMD_SQUIGGLE_RIGHT):
1289: texiputchars(p, "}");
1290: break;
1.38 kristaps 1291: case (TEXICMD_TEXSYM):
1.35 kristaps 1292: texiputchars(p, "TeX");
1.43 kristaps 1293: break;
1294: case (TEXICMD_TEXTDEGREE):
1295: texiputchars(p, "\\(de");
1.35 kristaps 1296: break;
1.42 kristaps 1297: case (TEXICMD_TH):
1298: texiputchars(p, "\\(TP");
1299: break;
1300: case (TEXICMD_THSMALL):
1301: texiputchars(p, "\\(Tp");
1302: break;
1.38 kristaps 1303: case (TEXICMD_TIE):
1.35 kristaps 1304: texiputchars(p, "\\ ");
1.1 kristaps 1305: break;
1.3 kristaps 1306: case (TEXICMD_COLON):
1307: case (TEXICMD_HYPHEN):
1308: break;
1.1 kristaps 1309: default:
1310: abort();
1311: }
1312:
1.42 kristaps 1313: /* Alphabetic commands have braces we ignore. */
1314: if (isalpha(texitoks[cmd].tok[0]))
1.46 kristaps 1315: doignbracket(p, cmd, pos);
1.1 kristaps 1316: }
1317:
1318: static void
1.46 kristaps 1319: doquotation(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1320: {
1321:
1.5 kristaps 1322: teximacro(p, "Qo");
1.46 kristaps 1323: parseto(p, pos, "quotation");
1.5 kristaps 1324: teximacro(p, "Qc");
1.1 kristaps 1325: }
1326:
1.3 kristaps 1327: static void
1.46 kristaps 1328: domath(struct texi *p, enum texicmd cmd, size_t *pos)
1.3 kristaps 1329: {
1.34 kristaps 1330: size_t nest, start;
1.3 kristaps 1331:
1332: /*
1333: * Math handling is different from everything else.
1334: * We don't allow any subcomponents, and we ignore the rules in
1335: * terms of @-commands.
1336: * This departs from GNU's rules, but whatever.
1337: */
1.46 kristaps 1338: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1339: advance(p, pos);
1340: if (*pos == BUFSZ(p) || '{' != BUF(p)[*pos])
1.3 kristaps 1341: return;
1.46 kristaps 1342: advance(p, pos);
1.3 kristaps 1343: if (p->seenws && p->outcol && 0 == p->literal)
1344: texiputchar(p, ' ');
1345: p->seenws = 0;
1.46 kristaps 1346: for (nest = 1, start = *pos; *pos < BUFSZ(p) && nest > 0; ) {
1347: if ('{' == BUF(p)[*pos])
1.3 kristaps 1348: nest++;
1.46 kristaps 1349: else if ('}' == BUF(p)[*pos])
1.3 kristaps 1350: if (0 == --nest)
1351: continue;
1.46 kristaps 1352: advance(p, pos);
1.3 kristaps 1353: }
1.46 kristaps 1354: if (*pos == BUFSZ(p))
1.3 kristaps 1355: return;
1.46 kristaps 1356: assert('}' == BUF(p)[*pos]);
1357: texiputbuf(p, start, *pos);
1358: advance(p, pos);
1.24 kristaps 1359: }
1360:
1361: static void
1.46 kristaps 1362: dovalue(struct texi *p, enum texicmd cmd, size_t *pos)
1.24 kristaps 1363: {
1.46 kristaps 1364: size_t start, end;
1.25 kristaps 1365: char *key, *val;
1366: const char *cp;
1.24 kristaps 1367:
1368: if (TEXICMD_SET == cmd) {
1.46 kristaps 1369: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1370: advance(p, pos);
1371: for (start = end = *pos; end < BUFSZ(p); end++)
1372: if (ismspace(BUF(p)[end]))
1.24 kristaps 1373: break;
1.25 kristaps 1374: /* We don't allow empty keys. */
1.24 kristaps 1375: if (start == end)
1376: return;
1.46 kristaps 1377: advanceto(p, pos, end);
1.24 kristaps 1378:
1379: key = malloc(end - start + 1);
1.27 kristaps 1380: if (NULL == key)
1381: texiabort(p, NULL);
1.46 kristaps 1382: memcpy(key, &BUF(p)[start], end - start);
1.24 kristaps 1383: key[end - start] = '\0';
1384:
1.46 kristaps 1385: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1386: advance(p, pos);
1387: for (start = end = *pos; end < BUFSZ(p); end++)
1388: if ('\n' == BUF(p)[end])
1.24 kristaps 1389: break;
1.25 kristaps 1390: /* We do allow empty values. */
1.46 kristaps 1391: advanceeoln(p, pos, 1);
1.24 kristaps 1392:
1393: val = malloc(end - start + 1);
1.27 kristaps 1394: if (NULL == val)
1395: texiabort(p, NULL);
1.46 kristaps 1396: memcpy(val, &BUF(p)[start], end - start);
1.24 kristaps 1397: val[end - start] = '\0';
1.25 kristaps 1398: valueadd(p, key, val);
1.24 kristaps 1399: } else if (TEXICMD_VALUE == cmd) {
1400: if (p->seenws)
1401: texiputchar(p, ' ');
1402: p->seenws = 0;
1.46 kristaps 1403: if (NULL != (cp = valueblookup(p, pos)))
1404: texisplice(p, cp, strlen(cp), pos);
1405: else
1.25 kristaps 1406: texiputchars(p, "{No value}");
1.24 kristaps 1407: } else if (TEXICMD_IFCLEAR == cmd) {
1.46 kristaps 1408: if (NULL != valuellookup(p, pos))
1409: doignblock(p, cmd, pos);
1.26 kristaps 1410: else
1.46 kristaps 1411: parseto(p, pos, texitoks[cmd].tok);
1.30 kristaps 1412: } else if (TEXICMD_IFSET == cmd) {
1.46 kristaps 1413: if (NULL == valuellookup(p, pos))
1414: doignblock(p, cmd, pos);
1.30 kristaps 1415: else
1.46 kristaps 1416: parseto(p, pos, texitoks[cmd].tok);
1.25 kristaps 1417: } else if (TEXICMD_CLEAR == cmd)
1.46 kristaps 1418: valuelclear(p, pos);
1.3 kristaps 1419: }
1420:
1.1 kristaps 1421: static void
1.46 kristaps 1422: dolink(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1423: {
1.8 kristaps 1424: int c;
1.1 kristaps 1425:
1426: switch (cmd) {
1427: case (TEXICMD_EMAIL):
1.5 kristaps 1428: teximacroopen(p, "Mt");
1.1 kristaps 1429: break;
1.3 kristaps 1430: case (TEXICMD_UREF):
1.1 kristaps 1431: case (TEXICMD_URL):
1.44 kristaps 1432: case (TEXICMD_INDICATEURL):
1.5 kristaps 1433: teximacroopen(p, "Lk");
1.1 kristaps 1434: break;
1.8 kristaps 1435: case (TEXICMD_XREF):
1436: texiputchars(p, "See Section");
1.39 kristaps 1437: teximacroopen(p, "Dq");
1.8 kristaps 1438: break;
1439: case (TEXICMD_PXREF):
1440: texiputchars(p, "see Section");
1.39 kristaps 1441: teximacroopen(p, "Dq");
1.8 kristaps 1442: break;
1.34 kristaps 1443: case (TEXICMD_INFOREF):
1444: texiputchars(p, "See Info file node");
1.39 kristaps 1445: teximacroopen(p, "Dq");
1.34 kristaps 1446: break;
1.1 kristaps 1447: default:
1.8 kristaps 1448: abort();
1.1 kristaps 1449: }
1.8 kristaps 1450:
1.46 kristaps 1451: c = parsearg(p, pos, 0);
1.8 kristaps 1452: p->ign++;
1453: while (c > 0)
1.46 kristaps 1454: c = parsearg(p, pos, 1);
1.8 kristaps 1455: p->ign--;
1456:
1.46 kristaps 1457: texipunctuate(p, pos);
1.8 kristaps 1458: teximacroclose(p);
1459: }
1460:
1461: static void
1.46 kristaps 1462: doignargn(struct texi *p, enum texicmd cmd, size_t *pos)
1.8 kristaps 1463: {
1464: int c;
1465:
1.46 kristaps 1466: c = parsearg(p, pos, 0);
1.8 kristaps 1467: p->ign++;
1468: while (c > 0)
1.46 kristaps 1469: c = parsearg(p, pos, 1);
1.8 kristaps 1470: p->ign--;
1.1 kristaps 1471: }
1472:
1.23 kristaps 1473: /*
1474: * Sections can be made subsections and so on by way of the
1475: * @raiseections and @lowersections commands.
1476: * Perform this check here and return the actual section number adjusted
1477: * to the raise level.
1478: */
1479: static int
1480: sectioner(struct texi *p, int sec)
1481: {
1482:
1483: if ((sec -= p->secoffs) < 0) {
1484: texiwarn(p, "section below minimum, clamping");
1485: return(0);
1486: } else if (sec >= SECTSZ) {
1487: texiwarn(p, "section above maximum, clamping");
1488: return(SECTSZ - 1);
1489: }
1490: return(sec);
1491: }
1492:
1493: static void
1.46 kristaps 1494: dosubsubsection(struct texi *p, enum texicmd cmd, size_t *pos)
1.23 kristaps 1495: {
1496: int sec;
1497:
1498: sec = sectioner(p, 3);
1499:
1500: /* We don't have a subsubsubsection, so make one up. */
1501: texivspace(p);
1502: teximacroopen(p, sects[sec]);
1.46 kristaps 1503: parseeoln(p, pos);
1.23 kristaps 1504: teximacroclose(p);
1505: texivspace(p);
1506: }
1507:
1.1 kristaps 1508: static void
1.46 kristaps 1509: dosubsection(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1510: {
1.23 kristaps 1511: int sec;
1512:
1513: sec = sectioner(p, 2);
1.13 kristaps 1514:
1515: if (p->outmacro)
1.23 kristaps 1516: texierr(p, "\"%s\" in open line scope!?", sects[sec]);
1.13 kristaps 1517: else if (p->literal)
1.23 kristaps 1518: texierr(p, "\"%s\" in a literal scope!?", sects[sec]);
1.1 kristaps 1519:
1.21 kristaps 1520: /* We don't have a subsubsection, so make one up. */
1.34 kristaps 1521: if (sec > 1)
1522: texivspace(p);
1.23 kristaps 1523: teximacroopen(p, sects[sec]);
1.46 kristaps 1524: parseeoln(p, pos);
1.5 kristaps 1525: teximacroclose(p);
1.34 kristaps 1526: if (sec > 1)
1527: texivspace(p);
1.1 kristaps 1528: }
1529:
1530: static void
1.46 kristaps 1531: dosecoffs(struct texi *p, enum texicmd cmd, size_t *pos)
1.23 kristaps 1532: {
1533:
1534: if (TEXICMD_RAISESECTIONS == cmd)
1535: p->secoffs++;
1536: else
1537: p->secoffs--;
1538: }
1539:
1540: static void
1.46 kristaps 1541: dosection(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1542: {
1.23 kristaps 1543: int sec;
1.12 kristaps 1544:
1545: switch (cmd) {
1546: case (TEXICMD_APPENDIX):
1547: case (TEXICMD_CHAPTER):
1548: case (TEXICMD_TOP):
1549: case (TEXICMD_UNNUMBERED):
1.23 kristaps 1550: sec = sectioner(p, 0);
1.12 kristaps 1551: break;
1552: case (TEXICMD_APPENDIXSEC):
1553: case (TEXICMD_HEADING):
1554: case (TEXICMD_SECTION):
1555: case (TEXICMD_UNNUMBEREDSEC):
1.23 kristaps 1556: sec = sectioner(p, 1);
1.12 kristaps 1557: break;
1558: default:
1559: abort();
1560: }
1.1 kristaps 1561:
1.3 kristaps 1562: if (p->outmacro)
1.23 kristaps 1563: texierr(p, "\"%s\" in open line scope!?", sects[sec]);
1.3 kristaps 1564: else if (p->literal)
1.23 kristaps 1565: texierr(p, "\"%s\" in a literal scope!?", sects[sec]);
1.3 kristaps 1566:
1.23 kristaps 1567: teximacroopen(p, sects[sec]);
1.46 kristaps 1568: parseeoln(p, pos);
1.3 kristaps 1569: teximacroclose(p);
1.11 kristaps 1570: p->seenvs = 1;
1.3 kristaps 1571: }
1572:
1573: static void
1.46 kristaps 1574: dosp(struct texi *p, enum texicmd cmd, size_t *pos)
1.3 kristaps 1575: {
1576:
1.37 kristaps 1577: if (p->literal)
1578: texiputchar(p, '\n');
1579: else
1580: texivspace(p);
1.12 kristaps 1581: /* FIXME: ignore and parseeoln. */
1.46 kristaps 1582: advanceeoln(p, pos, 1);
1.1 kristaps 1583: }
1584:
1585: static void
1.46 kristaps 1586: dotop(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1587: {
1.10 kristaps 1588: const char *cp;
1589: time_t t;
1590: char date[32];
1591:
1.26 kristaps 1592: if (--p->ign)
1.46 kristaps 1593: texierr(p, "@top command while ignoring");
1.26 kristaps 1594:
1.18 kristaps 1595: /*
1596: * Here we print our standard mdoc(7) prologue.
1597: * We use the title set with @settitle for the `Nd' description
1598: * and the source document filename (the first one as invoked on
1599: * the command line) for the title.
1600: * The date is set to the current date.
1601: */
1.10 kristaps 1602: t = time(NULL);
1603: strftime(date, sizeof(date), "%F", localtime(&t));
1.1 kristaps 1604:
1.10 kristaps 1605: teximacroopen(p, "Dd");
1606: texiputchars(p, date);
1607: teximacroclose(p);
1608: teximacroopen(p, "Dt");
1609: for (cp = p->title; '\0' != *cp; cp++)
1610: texiputchar(p, toupper(*cp));
1.11 kristaps 1611: texiputchars(p, " 7");
1.10 kristaps 1612: teximacroclose(p);
1.5 kristaps 1613: teximacro(p, "Os");
1614: teximacro(p, "Sh NAME");
1.10 kristaps 1615: teximacroopen(p, "Nm");
1.41 kristaps 1616: for (cp = p->title; '\0' != *cp; cp++)
1617: texiputchar(p, *cp);
1.10 kristaps 1618: teximacroclose(p);
1619: teximacroopen(p, "Nd");
1.41 kristaps 1620: if (NULL != p->subtitle)
1621: for (cp = p->subtitle; '\0' != *cp; cp++)
1622: texiputchar(p, *cp);
1623: else
1624: texiputchars(p, "Unknown description");
1.10 kristaps 1625: teximacroclose(p);
1.11 kristaps 1626: p->seenvs = 1;
1.46 kristaps 1627: dosection(p, cmd, pos);
1.1 kristaps 1628: }
1629:
1630: static void
1.46 kristaps 1631: doitem(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1632: {
1633:
1.18 kristaps 1634: /* Multitable is using raw tbl(7). */
1635: if (TEXILIST_TABLE == p->list) {
1636: texiputchar(p, '\n');
1637: return;
1638: }
1639:
1.3 kristaps 1640: if (p->outmacro)
1641: texierr(p, "item in open line scope!?");
1642: else if (p->literal)
1643: texierr(p, "item in a literal scope!?");
1644:
1645: switch (p->list) {
1646: case (TEXILIST_ITEM):
1.5 kristaps 1647: teximacroopen(p, "It");
1.3 kristaps 1648: break;
1649: case (TEXILIST_NOITEM):
1.5 kristaps 1650: teximacro(p, "It");
1.3 kristaps 1651: break;
1652: default:
1.11 kristaps 1653: texivspace(p);
1.3 kristaps 1654: break;
1655: }
1.18 kristaps 1656:
1657: /* Trick so we don't start with Pp. */
1.11 kristaps 1658: p->seenvs = 1;
1.46 kristaps 1659: parseeoln(p, pos);
1.1 kristaps 1660:
1.3 kristaps 1661: if (TEXILIST_ITEM == p->list)
1662: teximacroclose(p);
1.9 kristaps 1663: else if (p->outcol > 0)
1.1 kristaps 1664: texiputchar(p, '\n');
1.18 kristaps 1665: }
1666:
1667: static void
1.46 kristaps 1668: dotab(struct texi *p, enum texicmd cmd, size_t *pos)
1.18 kristaps 1669: {
1670:
1671: /* This command is only useful in @multitable. */
1672: if (TEXILIST_TABLE == p->list)
1673: texiputchar(p, '\t');
1674: }
1675:
1676: static void
1.46 kristaps 1677: domultitable(struct texi *p, enum texicmd cmd, size_t *pos)
1.18 kristaps 1678: {
1679: enum texilist sv = p->list;
1.32 kristaps 1680: int svliteral = p->literal;
1.18 kristaps 1681: enum texicmd type;
1682: size_t i, end, columns;
1683:
1684: p->list = TEXILIST_TABLE;
1.32 kristaps 1685: /*
1686: * TS/TE blocks aren't "in mdoc(7)", so we can disregard the
1687: * fact that we're in literal mode right now.
1688: */
1689: p->literal = 0;
1.18 kristaps 1690: teximacro(p, "TS");
1691: columns = 0;
1692:
1693: /* Advance to the first argument... */
1.46 kristaps 1694: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1695: advance(p, pos);
1.18 kristaps 1696:
1697: /* Make sure we don't print anything when scanning. */
1698: p->ign++;
1.46 kristaps 1699: if ('@' == BUF(p)[*pos]) {
1.18 kristaps 1700: /*
1701: * Look for @columnfractions.
1702: * We ignore these, but we do use the number of
1703: * arguments to set the number of columns that we'll
1704: * have.
1705: */
1.46 kristaps 1706: type = texicmd(p, *pos, &end, NULL);
1707: advanceto(p, pos, end);
1.18 kristaps 1708: if (TEXICMD_COLUMNFRACTIONS != type)
1.25 kristaps 1709: texierr(p, "unknown multitable command");
1.46 kristaps 1710: while (*pos < BUFSZ(p) && '\n' != BUF(p)[*pos]) {
1711: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1712: advance(p, pos);
1713: while (*pos < BUFSZ(p) && ! isws(BUF(p)[*pos])) {
1714: if ('\n' == BUF(p)[*pos])
1.18 kristaps 1715: break;
1.46 kristaps 1716: advance(p, pos);
1.18 kristaps 1717: }
1718: columns++;
1719: }
1720: } else
1721: /*
1722: * We have arguments.
1723: * We could parse these, but it's easier to just let
1724: * tbl(7) figure it out.
1725: * So use this only to count arguments.
1726: */
1.46 kristaps 1727: while (parselinearg(p, pos) > 0)
1.18 kristaps 1728: columns++;
1729: p->ign--;
1730:
1731: /* Left-justify each table entry. */
1732: for (i = 0; i < columns; i++) {
1733: if (i > 0)
1734: texiputchar(p, ' ');
1735: texiputchar(p, 'l');
1736: }
1737: texiputchars(p, ".\n");
1738: p->outmacro++;
1.46 kristaps 1739: parseto(p, pos, texitoks[cmd].tok);
1.18 kristaps 1740: p->outmacro--;
1741: teximacro(p, "TE");
1.32 kristaps 1742: p->literal = svliteral;
1.18 kristaps 1743: p->list = sv;
1.1 kristaps 1744: }
1745:
1746: static void
1.46 kristaps 1747: dotable(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1748: {
1.3 kristaps 1749: enum texilist sv = p->list;
1750:
1751: p->list = TEXILIST_ITEM;
1.5 kristaps 1752: teximacro(p, "Bl -tag -width Ds");
1.12 kristaps 1753: /* FIXME: ignore and parseeoln. */
1.46 kristaps 1754: advanceeoln(p, pos, 1);
1.11 kristaps 1755: p->seenvs = 1;
1.46 kristaps 1756: parseto(p, pos, texitoks[cmd].tok);
1.5 kristaps 1757: teximacro(p, "El");
1.3 kristaps 1758: p->list = sv;
1.44 kristaps 1759: }
1760:
1761: static void
1.46 kristaps 1762: doend(struct texi *p, enum texicmd cmd, size_t *pos)
1.44 kristaps 1763: {
1764: size_t start;
1765:
1.46 kristaps 1766: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1767: advance(p, pos);
1.44 kristaps 1768: start = *pos;
1.46 kristaps 1769: while (*pos < BUFSZ(p) && '\n' != BUF(p)[*pos])
1770: advance(p, pos);
1.44 kristaps 1771:
1.46 kristaps 1772: texiwarn(p, "unexpected \"end\": %.*s", (int)(*pos - start), &BUF(p)[start]);
1773: advanceeoln(p, pos, 1);
1.1 kristaps 1774: }
1775:
1776: static void
1.46 kristaps 1777: doenumerate(struct texi *p, enum texicmd cmd, size_t *pos)
1.2 kristaps 1778: {
1.3 kristaps 1779: enum texilist sv = p->list;
1.2 kristaps 1780:
1.3 kristaps 1781: p->list = TEXILIST_NOITEM;
1.5 kristaps 1782: teximacro(p, "Bl -enum");
1.11 kristaps 1783: p->seenvs = 1;
1.12 kristaps 1784: /* FIXME: ignore and parseeoln. */
1.46 kristaps 1785: advanceeoln(p, pos, 1);
1786: parseto(p, pos, "enumerate");
1.5 kristaps 1787: teximacro(p, "El");
1.3 kristaps 1788: p->list = sv;
1.2 kristaps 1789: }
1790:
1791: static void
1.46 kristaps 1792: doitemize(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1793: {
1.3 kristaps 1794: enum texilist sv = p->list;
1.1 kristaps 1795:
1.21 kristaps 1796: p->list = TEXILIST_NOITEM;
1.5 kristaps 1797: teximacro(p, "Bl -bullet");
1.11 kristaps 1798: p->seenvs = 1;
1.12 kristaps 1799: /* FIXME: ignore and parseeoln. */
1.46 kristaps 1800: advanceeoln(p, pos, 1);
1801: parseto(p, pos, "itemize");
1.5 kristaps 1802: teximacro(p, "El");
1.3 kristaps 1803: p->list = sv;
1.1 kristaps 1804: }
1805:
1806: static void
1.46 kristaps 1807: doignbracket(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1808: {
1809:
1.3 kristaps 1810: p->ign++;
1.46 kristaps 1811: parsebracket(p, pos);
1.3 kristaps 1812: p->ign--;
1.1 kristaps 1813: }
1814:
1815: static void
1.46 kristaps 1816: doignline(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1817: {
1818:
1.12 kristaps 1819: /* FIXME: ignore and parseeoln. */
1.46 kristaps 1820: advanceeoln(p, pos, 1);
1.1 kristaps 1821: }
1822:
/*
 * Build an array of directory names from "base" and from the
 * colon-separated list "cp"; either may be NULL.
 * When present, "base" occupies the first slot and the fields of "cp"
 * follow in order.
 * The number of entries is stored in "sz"; NULL is returned when there
 * are none.
 * Each entry and the array itself are heap-allocated.
 * Allocation failure is reported through texiabort().
 * This does NOT sanitise the directories: empty fields are kept as
 * empty strings.
 */
static char **
parsedirs(struct texi *p, const char *base, const char *cp, size_t *sz)
{
	char		**dirs;
	char		 *copy, *rest, *tok;
	const char	 *colon;
	size_t		  n;

	/* One slot for "base", one per colon-delimited field of "cp". */
	*sz = (NULL != base) ? 1 : 0;
	if (NULL != cp) {
		(*sz)++;
		colon = strchr(cp, ':');
		while (NULL != colon) {
			(*sz)++;
			colon = strchr(colon + 1, ':');
		}
	}

	if (0 == *sz)
		return(NULL);

	dirs = calloc(*sz, sizeof(char *));
	if (NULL == dirs)
		texiabort(p, NULL);

	n = 0;
	if (NULL != base) {
		dirs[n] = strdup(base);
		if (NULL == dirs[n])
			texiabort(p, NULL);
		n++;
	}

	if (NULL == cp)
		return(dirs);

	/* strsep() writes into its input, so tokenise a private copy. */
	copy = strdup(cp);
	if (NULL == copy)
		texiabort(p, NULL);

	rest = copy;
	while (NULL != (tok = strsep(&rest, ":"))) {
		dirs[n] = strdup(tok);
		if (NULL == dirs[n])
			texiabort(p, NULL);
		n++;
	}

	free(copy);
	return(dirs);
}
1861:
1.1 kristaps 1862: int
1863: main(int argc, char *argv[])
1864: {
1865: struct texi texi;
1.2 kristaps 1866: int c;
1.37 kristaps 1867: char *dirpath, *dir, *ccp;
1.10 kristaps 1868: const char *progname, *Idir, *cp;
1.1 kristaps 1869:
1870: progname = strrchr(argv[0], '/');
1871: if (progname == NULL)
1872: progname = argv[0];
1873: else
1874: ++progname;
1875:
1.10 kristaps 1876: memset(&texi, 0, sizeof(struct texi));
1.40 kristaps 1877: texi.ign = 1;
1.5 kristaps 1878: Idir = NULL;
1.10 kristaps 1879:
1.5 kristaps 1880: while (-1 != (c = getopt(argc, argv, "I:")))
1.1 kristaps 1881: switch (c) {
1.5 kristaps 1882: case ('I'):
1883: Idir = optarg;
1884: break;
1.1 kristaps 1885: default:
1886: goto usage;
1887: }
1888:
1889: argv += optind;
1.40 kristaps 1890: argc -= optind;
1.1 kristaps 1891:
1.40 kristaps 1892: if (argc > 0) {
1893: if (NULL == (dirpath = strdup(argv[0])))
1894: texiabort(&texi, NULL);
1895: if (NULL == (dir = dirname(dirpath)))
1896: texiabort(&texi, NULL);
1897: if (NULL != (cp = strrchr(argv[0], '/')))
1898: texi.title = strdup(cp + 1);
1899: else
1900: texi.title = strdup(argv[0]);
1901: if (NULL == texi.title)
1902: texiabort(&texi, NULL);
1903: else if (NULL != (ccp = strchr(texi.title, '.')))
1904: *ccp = '\0';
1905: texi.dirs = parsedirs(&texi, dir, Idir, &texi.dirsz);
1906: free(dirpath);
1907: parsefile(&texi, argv[0], 1);
1908: } else {
1909: texi.title = strdup("Unknown Manual");
1910: texi.dirs = parsedirs(&texi, NULL, Idir, &texi.dirsz);
1911: parsestdin(&texi);
1912: }
1.27 kristaps 1913:
1.2 kristaps 1914: texiexit(&texi);
1915: return(EXIT_FAILURE);
1.1 kristaps 1916: usage:
1.40 kristaps 1917: fprintf(stderr, "usage: %s [-Idirs] [file]\n", progname);
1.1 kristaps 1918: return(EXIT_FAILURE);
1919: }
CVSweb