Annotation of texi2mdoc/main.c, Revision 1.58
1.58 ! kristaps 1: /* $Id: main.c,v 1.57 2015/03/01 16:57:39 kristaps Exp $ */
1.1 kristaps 2: /*
3: * Copyright (c) 2015 Kristaps Dzonsons <kristaps@bsd.lv>
4: *
5: * Permission to use, copy, modify, and distribute this software for any
6: * purpose with or without fee is hereby granted, provided that the above
7: * copyright notice and this permission notice appear in all copies.
8: *
9: * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
10: * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
11: * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
12: * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
13: * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
14: * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
15: * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
16: */
1.37 kristaps 17: #if defined(__linux__) || defined(__MINT__)
18: # define _GNU_SOURCE /* memmem */
19: #endif
1.1 kristaps 20: #include <assert.h>
21: #include <ctype.h>
22: #include <getopt.h>
1.2 kristaps 23: #include <libgen.h>
24: #include <limits.h>
1.1 kristaps 25: #include <stdarg.h>
26: #include <stdio.h>
27: #include <stdlib.h>
28: #include <string.h>
1.47 kristaps 29: #include <unistd.h>
1.1 kristaps 30:
1.24 kristaps 31: #include "extern.h"
1.1 kristaps 32:
/*
 * mdoc(7) macro names used when emitting headings.
 * NOTE(review): presumably indexed by section nesting depth, with
 * SECTSZ as the number of supported levels -- confirm against the
 * section handlers.
 */
#define	SECTSZ 4
static	const char *const sects[SECTSZ] = {
	"Sh", "Ss", "Em", "No",
};
40:
/*
 * Command handlers referenced from the command table below.
 * Every handler has the same signature: the parser state, the command
 * being handled, and the current position in the input buffer.
 */
static	void doaccent(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doblock(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dobracket(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dobye(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dodefindex(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dodefn(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dodisplay(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doend(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doenumerate(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doexample(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doignargn(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doignblock(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doignbracket(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doignline(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doinline(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doinclude(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doitem(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doitemize(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dolink(struct texi *p, enum texicmd cmd, size_t *pos);
static	void domacro(struct texi *p, enum texicmd cmd, size_t *pos);
static	void domath(struct texi *p, enum texicmd cmd, size_t *pos);
static	void domultitable(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doquotation(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dotable(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dotop(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dosecoffs(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dosection(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dosp(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dosubsection(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dosubsubsection(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dosymbol(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dotab(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dotitle(struct texi *p, enum texicmd cmd, size_t *pos);
static	void dovalue(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doverb(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doverbatim(struct texi *p, enum texicmd cmd, size_t *pos);
static	void doverbinclude(struct texi *p, enum texicmd cmd, size_t *pos);
1.1 kristaps 78:
1.24 kristaps 79: static const struct texitok __texitoks[TEXICMD__MAX] = {
1.20 kristaps 80: /* TEXICMD__BEGIN */
1.42 kristaps 81: { doignline, "afourpaper", 10 }, /* TEXICMD_A4PAPER */
82: { dosymbol, "AA", 2 }, /* TEXICMD_AA */
83: { dosymbol, "aa", 2 }, /* TEXICMD_AASMALL */
1.8 kristaps 84: { doignargn, "acronym", 7 }, /* TEXICMD_ACRONYM */
1.16 kristaps 85: { doaccent, "'", 1 }, /* TEXICMD_ACUTE */
1.42 kristaps 86: { dosymbol, "AE", 2 }, /* TEXICMD_AE */
87: { dosymbol, "ae", 2 }, /* TEXICMD_AESMALL */
1.1 kristaps 88: { doignbracket, "anchor", 6 }, /* TEXICMD_ANCHOR */
1.12 kristaps 89: { dosection, "appendix", 8 }, /* TEXICMD_APPENDIX */
90: { dosection, "appendixsec", 11 }, /* TEXICMD_APPENDIXSEC */
1.20 kristaps 91: { dosubsection, "appendixsubsec", 14 }, /* TEXICMD_APPENDIXSUBSEC */
1.23 kristaps 92: { dosubsubsection, "appendixsubsubsec", 17 }, /* TEXICMD_APPENDIXSUBSUBSEC */
1.25 kristaps 93: { doinline, "asis", 4 }, /* TEXICMD_ASIS */
1.3 kristaps 94: { dosymbol, "*", 1 }, /* TEXICMD_ASTERISK */
1.1 kristaps 95: { dosymbol, "@", 1 }, /* TEXICMD_AT */
1.3 kristaps 96: { doignline, "author", 6 }, /* TEXICMD_AUTHOR */
1.21 kristaps 97: { doinline, "b", 1 }, /* TEXICMD_BOLD */
1.3 kristaps 98: { dosymbol, "!", 1 }, /* TEXICMD_BANG */
1.7 kristaps 99: { dosymbol, "bullet", 6 }, /* TEXICMD_BULLET */
1.1 kristaps 100: { dobye, "bye", 3 }, /* TEXICMD_BYE */
1.34 kristaps 101: { doblock, "cartouche", 9 }, /* TEXICMD_CARTOUCHE */
102: { doaccent, ",", 1 }, /* TEXICMD_CEDILLA */
1.12 kristaps 103: { doignline, "center", 6 }, /* TEXICMD_CENTER */
104: { dosection, "chapter", 7 }, /* TEXICMD_CHAPTER */
1.1 kristaps 105: { doignline, "cindex", 6 }, /* TEXICMD_CINDEX */
1.16 kristaps 106: { doaccent, "^", 1 }, /* TEXICMD_CIRCUMFLEX */
1.24 kristaps 107: { doinline, "cite", 4 }, /* TEXICMD_CITE */
108: { dovalue, "clear", 5 }, /* TEXICMD_CLEAR */
1.21 kristaps 109: { doinline, "code", 4 }, /* TEXICMD_CODE */
1.3 kristaps 110: { dosymbol, ":", 1 }, /* TEXICMD_COLON */
1.18 kristaps 111: { NULL, "columnfractions", 15 }, /* TEXICMD_COLUMNFRACTIONS */
1.35 kristaps 112: { dosymbol, "comma", 5 }, /* TEXICMD_COMMA */
1.12 kristaps 113: { doinline, "command", 7 }, /* TEXICMD_COMMAND */
1.1 kristaps 114: { doignline, "c", 1 }, /* TEXICMD_COMMENT */
1.2 kristaps 115: { doignline, "comment", 7 }, /* TEXICMD_COMMENT_LONG */
1.1 kristaps 116: { doignline, "contents", 8 }, /* TEXICMD_CONTENTS */
117: { doignblock, "copying", 7 }, /* TEXICMD_COPYING */
118: { dosymbol, "copyright", 9 }, /* TEXICMD_COPYRIGHT */
1.27 kristaps 119: { dodefindex, "defcodeindex", 12 }, /* TEXICMD_DEFCODEINDEX */
1.15 kristaps 120: { dodefn, "deffn", 5 }, /* TEXICMD_DEFFN */
121: { dodefn, "deffnx", 6 }, /* TEXICMD_DEFFNX */
1.27 kristaps 122: { dodefindex, "defindex", 8 }, /* TEXICMD_DEFINDEX */
1.15 kristaps 123: { dodefn, "defmac", 6 }, /* TEXICMD_DEFMAC */
124: { dodefn, "defmacx", 7 }, /* TEXICMD_DEFMACX */
125: { dodefn, "deftp", 5 }, /* TEXICMD_DEFTP */
126: { dodefn, "deftpx", 6 }, /* TEXICMD_DEFTPX */
127: { dodefn, "deftypefn", 9 }, /* TEXICMD_DEFTYPEFN */
128: { dodefn, "deftypefnx", 10 }, /* TEXICMD_DEFTYPEFNX */
129: { dodefn, "deftypefun", 10 }, /* TEXICMD_DEFTYPEFUN */
130: { dodefn, "deftypefunx", 11 }, /* TEXICMD_DEFTYPEFUNX */
1.34 kristaps 131: { dodefn, "deftypemethod", 13 }, /* TEXICMD_DEFTYPEMETHOD */
132: { dodefn, "deftypemethodx", 14 }, /* TEXICMD_DEFTYPEMETHODX */
1.15 kristaps 133: { dodefn, "deftypevar", 10 }, /* TEXICMD_DEFTYPEVAR */
134: { dodefn, "deftypevarx", 11 }, /* TEXICMD_DEFTYPEVARX */
135: { dodefn, "deftypevr", 9 }, /* TEXICMD_DEFTYPEVR */
136: { dodefn, "deftypevrx", 10 }, /* TEXICMD_DEFTYPEVRX */
137: { dodefn, "defun", 5 }, /* TEXICMD_DEFUN */
138: { dodefn, "defunx", 6 }, /* TEXICMD_DEFUNX */
139: { dodefn, "defvar", 6 }, /* TEXICMD_DEFVAR */
140: { dodefn, "defvarx", 7 }, /* TEXICMD_DEFVARX */
141: { dodefn, "defvr", 5 }, /* TEXICMD_DEFVR */
142: { dodefn, "defvrx", 6 }, /* TEXICMD_DEFVRX */
1.1 kristaps 143: { doignblock, "detailmenu", 10 }, /* TEXICMD_DETAILMENU */
1.21 kristaps 144: { doinline, "dfn", 3 }, /* TEXICMD_DFN */
1.42 kristaps 145: { dosymbol, "DH", 2 }, /* TEXICMD_DH */
146: { dosymbol, "dh", 2 }, /* TEXICMD_DHSMALL */
1.1 kristaps 147: { doignline, "dircategory", 11 }, /* TEXICMD_DIRCATEGORY */
148: { doignblock, "direntry", 8 }, /* TEXICMD_DIRENTRY */
1.3 kristaps 149: { dodisplay, "display", 7 }, /* TEXICMD_DISPLAY */
1.28 kristaps 150: { doignbracket, "dmn", 3 }, /* TEXICMD_DMN */
1.40 kristaps 151: { doignblock, "documentdescription", 19 }, /* TEXICMD_DOCUMENTDESCRIPTION */
152: { doignline, "documentencoding", 16 }, /* TEXICMD_DOCUMENTENCODING */
1.44 kristaps 153: { doignline, "documentlanguage", 16 }, /* TEXICMD_DOCUMENTLANGUAGE */
1.42 kristaps 154: { doaccent, "dotaccent", 9 }, /* TEXICMD_DOTACCENT */
155: { doaccent, "dotless", 7 }, /* TEXICMD_DOTLESS */
1.2 kristaps 156: { dosymbol, "dots", 4 }, /* TEXICMD_DOTS */
1.8 kristaps 157: { dolink, "email", 5 }, /* TEXICMD_EMAIL */
1.21 kristaps 158: { doinline, "emph", 4 }, /* TEXICMD_EMPH */
1.44 kristaps 159: { doend, "end", 3 }, /* TEXICMD_END */
1.34 kristaps 160: { dosymbol, "enddots", 7 }, /* TEXICMD_ENDDOTS */
1.2 kristaps 161: { doenumerate, "enumerate", 9 }, /* TEXICMD_ENUMERATE */
1.12 kristaps 162: { doinline, "env", 3 }, /* TEXICMD_ENV */
1.28 kristaps 163: { dosymbol, "equiv", 5 }, /* TEXICMD_EQUIV */
1.15 kristaps 164: { dosymbol, "error", 5 }, /* TEXICMD_ERROR */
1.43 kristaps 165: { dosymbol, "euro", 4 }, /* TEXICMD_EURO */
1.1 kristaps 166: { doexample, "example", 7 }, /* TEXICMD_EXAMPLE */
1.42 kristaps 167: { dosymbol, "exclamdown", 10 }, /* TEXICMD_EXCLAMDOWN */
1.25 kristaps 168: { doignline, "exdent", 6 }, /* TEXICMD_EXDENT */
1.17 kristaps 169: { dosymbol, "expansion", 9 }, /* TEXICMD_EXPANSION */
1.12 kristaps 170: { doinline, "file", 4 }, /* TEXICMD_FILE */
1.17 kristaps 171: { doignline, "finalout", 8 }, /* TEXICMD_FINALOUT */
1.20 kristaps 172: { doignline, "findex", 6 }, /* TEXICMD_FINDEX */
1.44 kristaps 173: { doblock, "flushleft", 9 }, /* TEXICMD_FLUSHLEFT */
174: { doblock, "flushright", 10 }, /* TEXICMD_FLUSHRIGHT */
175: { doignline, "firstparagraphindent", 20 }, /* TEXICMD_FIRSTPARAGRAPHINDENT */
1.32 kristaps 176: { doignbracket, "footnote", 8 }, /* TEXICMD_FOOTNOTE */
1.44 kristaps 177: { doignline, "footnotestyle", 13 }, /* TEXICMD_FOOTNOTESTYLE */
1.20 kristaps 178: { dotable, "ftable", 6 }, /* TEXICMD_FTABLE */
179: { dodisplay, "format", 6 }, /* TEXICMD_FORMAT */
1.43 kristaps 180: { dosymbol, "geq", 3 }, /* TEXICMD_GEQ */
1.16 kristaps 181: { doaccent, "`", 1 }, /* TEXICMD_GRAVE */
1.3 kristaps 182: { doblock, "group", 5 }, /* TEXICMD_GROUP */
1.43 kristaps 183: { dosymbol, "guillemetleft", 13 }, /* TEXICMD_GUILLEMETLEFT */
184: { dosymbol, "guillemetright", 14 }, /* TEXICMD_GUILLEMETRIGHT */
185: { dosymbol, "guillemotleft", 13 }, /* TEXICMD_GUILLEMOTLEFT */
186: { dosymbol, "guillemotright", 14 }, /* TEXICMD_GUILLEMOTRIGHT */
187: { dosymbol, "guilsinglleft", 13 }, /* TEXICMD_GUILSINGLLEFT */
188: { dosymbol, "guilsinglright", 14 }, /* TEXICMD_GUILSINGLRIGHT */
1.42 kristaps 189: { doaccent, "H", 1 }, /* TEXICMD_H */
1.2 kristaps 190: { dosection, "heading", 7 }, /* TEXICMD_HEADING */
1.3 kristaps 191: { doignline, "headings", 8 }, /* TEXICMD_HEADINGS */
1.18 kristaps 192: { doitem, "headitem", 8 }, /* TEXICMD_HEADITEM */
1.25 kristaps 193: { doignblock, "html", 4 }, /* TEXICMD_HTML */
1.3 kristaps 194: { dosymbol, "-", 1 }, /* TEXICMD_HYPHEN */
1.21 kristaps 195: { doinline, "i", 1 }, /* TEXICMD_I */
1.24 kristaps 196: { dovalue, "ifclear", 7 }, /* TEXICMD_IFCLEAR */
1.14 kristaps 197: { doignblock, "ifdocbook", 9 }, /* TEXICMD_IFDOCBOOK */
1.1 kristaps 198: { doignblock, "ifhtml", 6 }, /* TEXICMD_IFHTML */
1.26 kristaps 199: { doblock, "ifinfo", 6 }, /* TEXICMD_IFINFO */
1.14 kristaps 200: { doblock, "ifnotdocbook", 12 }, /* TEXICMD_IFNOTDOCBOOK */
201: { doblock, "ifnothtml", 9 }, /* TEXICMD_IFNOTHTML */
202: { doblock, "ifnotinfo", 9 }, /* TEXICMD_IFNOTINFO */
203: { doignblock, "ifnotplaintext", 14 }, /* TEXICMD_IFNOTPLAINTEXT */
1.3 kristaps 204: { doblock, "ifnottex", 8 }, /* TEXICMD_IFNOTTEX */
1.14 kristaps 205: { doblock, "ifnotxml", 8 }, /* TEXICMD_IFNOTXML */
206: { doblock, "ifplaintext", 11 }, /* TEXICMD_IFPLAINTEXT */
1.1 kristaps 207: { doignblock, "iftex", 5 }, /* TEXICMD_IFTEX */
1.30 kristaps 208: { dovalue, "ifset", 5 }, /* TEXICMD_IFSET */
1.14 kristaps 209: { doignblock, "ifxml", 5 }, /* TEXICMD_IFXML */
1.17 kristaps 210: { doignblock, "ignore", 6 }, /* TEXICMD_IGNORE */
1.1 kristaps 211: { doignbracket, "image", 5 }, /* TEXICMD_IMAGE */
1.2 kristaps 212: { doinclude, "include", 7 }, /* TEXICMD_INCLUDE */
1.13 kristaps 213: { dodisplay, "indentblock", 11 }, /* TEXICMD_INDENTBLOCK */
1.44 kristaps 214: { dolink, "indicateurl", 11 }, /* TEXICMD_INDICATEURL */
215: { dolink, "inforef", 7 }, /* TEXICMD_INFOREF */
1.5 kristaps 216: { doignline, "insertcopying", 13 }, /* TEXICMD_INSERTCOPYING */
1.1 kristaps 217: { doitem, "item", 4 }, /* TEXICMD_ITEM */
218: { doitemize, "itemize", 7 }, /* TEXICMD_ITEMIZE */
1.20 kristaps 219: { doitem, "itemx", 5 }, /* TEXICMD_ITEMX */
1.21 kristaps 220: { doinline, "kbd", 3 }, /* TEXICMD_KBD */
1.18 kristaps 221: { dobracket, "key", 3 }, /* TEXICMD_KEY */
1.20 kristaps 222: { doignline, "kindex", 6 }, /* TEXICMD_KINDEX */
1.42 kristaps 223: { dosymbol, "L", 1 }, /* TEXICMD_L */
1.1 kristaps 224: { dosymbol, "LaTeX", 5 }, /* TEXICMD_LATEX */
1.43 kristaps 225: { dosymbol, "leq", 3 }, /* TEXICMD_LEQ */
1.23 kristaps 226: { dosecoffs, "lowersections", 13 }, /* TEXICMD_LOWERSECTIONS */
1.42 kristaps 227: { dosymbol, "l", 1 }, /* TEXICMD_LSMALL */
1.30 kristaps 228: { domacro, "macro", 5 }, /* TEXICMD_MACRO */
1.42 kristaps 229: { doaccent, "=", 1 }, /* TEXICMD_MACRON */
1.3 kristaps 230: { domath, "math", 4 }, /* TEXICMD_MATH */
1.1 kristaps 231: { doignblock, "menu", 4 }, /* TEXICMD_MENU */
1.25 kristaps 232: { dosymbol, "minus", 5 }, /* TEXICMD_MINUS */
1.18 kristaps 233: { domultitable, "multitable", 10 }, /* TEXICMD_MULTITABLE */
1.15 kristaps 234: { doignline, "need", 4 }, /* TEXICMD_NEED */
1.3 kristaps 235: { dosymbol, "\n", 1 }, /* TEXICMD_NEWLINE */
1.1 kristaps 236: { doignline, "node", 4 }, /* TEXICMD_NODE */
1.3 kristaps 237: { doignline, "noindent", 8 }, /* TEXICMD_NOINDENT */
1.42 kristaps 238: { dosymbol, "O", 1 }, /* TEXICMD_O */
239: { dosymbol, "OE", 2 }, /* TEXICMD_OE */
240: { dosymbol, "oe", 2 }, /* TEXICMD_OESMALL */
241: { doaccent, "ogonek", 6 }, /* TEXICMD_OGONEK */
1.16 kristaps 242: { doinline, "option", 6 }, /* TEXICMD_OPTION */
1.42 kristaps 243: { dosymbol, "ordf", 4 }, /* TEXICMD_ORDF */
244: { dosymbol, "ordm", 4 }, /* TEXICMD_ORDM */
245: { dosymbol, "o", 1 }, /* TEXICMD_OSMALL */
1.3 kristaps 246: { doignline, "page", 4 }, /* TEXICMD_PAGE */
1.25 kristaps 247: { doignline, "paragraphindent", 15 }, /* TEXICMD_PARINDENT */
248: { dosymbol, ".", 1 }, /* TEXICMD_PERIOD */
1.28 kristaps 249: { doignline, "pindex", 6 }, /* TEXICMD_PINDEX */
1.43 kristaps 250: { dosymbol, "pounds", 6 }, /* TEXICMD_POUNDS */
1.2 kristaps 251: { doignline, "printindex", 10 }, /* TEXICMD_PRINTINDEX */
1.42 kristaps 252: { dolink, "pxref", 5 }, /* TEXICMD_PXREF */
253: { dosymbol, "questiondown", 12 }, /* TEXICMD_QUESTIONDOWN */
254: { dosymbol, "?", 1 }, /* TEXICMD_QUESTIONMARK */
255: { doquotation, "quotation", 9 }, /* TEXICMD_QUOTATION */
1.43 kristaps 256: { dosymbol, "quotedblbase", 12 }, /* TEXICMD_QUOTEDBLBASE */
257: { dosymbol, "quotedblleft", 12 }, /* TEXICMD_QUOTEDBLLEFT */
258: { dosymbol, "quotedblright", 13 }, /* TEXICMD_QUOTEDBLRIGHT */
259: { dosymbol, "quotesinglbase", 14 }, /* TEXICMD_QUOTESINGLBASE */
260: { dosymbol, "quoteleft", 9 }, /* TEXICMD_QUOTELEFT */
261: { dosymbol, "quoteright", 10 }, /* TEXICMD_QUOTERIGHT */
1.21 kristaps 262: { doinline, "r", 1 }, /* TEXICMD_R */
1.23 kristaps 263: { dosecoffs, "raisesections", 13 }, /* TEXICMD_RAISESECTIONS */
1.1 kristaps 264: { dobracket, "ref", 3 }, /* TEXICMD_REF */
1.28 kristaps 265: { doignline, "refill", 6 }, /* TEXICMD_REFILL */
1.43 kristaps 266: { dosymbol, "registeredsymbol", 16 }, /* TEXICMD_REGISTEREDSYMBOL */
1.15 kristaps 267: { dosymbol, "result", 6 }, /* TEXICMD_RESULT */
1.42 kristaps 268: { doaccent, "ringaccent", 10 }, /* TEXICMD_RINGACCENT */
1.21 kristaps 269: { doinline, "samp", 4 }, /* TEXICMD_SAMP */
270: { doinline, "sansserif", 9 }, /* TEXICMD_SANSSERIF */
1.58 ! kristaps 271: { doinline, "sc", 2 }, /* TEXICMD_SC */
1.1 kristaps 272: { dosection, "section", 7 }, /* TEXICMD_SECTION */
1.24 kristaps 273: { dovalue, "set", 3 }, /* TEXICMD_SET */
1.1 kristaps 274: { doignline, "setchapternewpage", 17 }, /* TEXICMD_SETCHAPNEWPAGE */
1.35 kristaps 275: { doignline, "setcontentsaftertitlepage", 25 }, /* TEXICMD_SETCONTENTSAFTER */
1.1 kristaps 276: { doignline, "setfilename", 11 }, /* TEXICMD_SETFILENAME */
1.10 kristaps 277: { dotitle, "settitle", 8 }, /* TEXICMD_SETTITLE */
1.25 kristaps 278: { doignline, "shortcontents", 13 }, /* TEXICMD_SHORTCONTENTS */
1.21 kristaps 279: { doinline, "slanted", 7 }, /* TEXICMD_SLANTED */
1.34 kristaps 280: { dosymbol, "/", 1 }, /* TEXICMD_SLASH */
1.3 kristaps 281: { dosp, "sp", 2 }, /* TEXICMD_SP */
282: { dosymbol, " ", 1 }, /* TEXICMD_SPACE */
1.17 kristaps 283: { doignline, "smallbook", 9 }, /* TEXICMD_SMALLBOOK */
1.12 kristaps 284: { dodisplay, "smalldisplay", 12 }, /* TEXICMD_SMALLDISPLAY */
1.3 kristaps 285: { doexample, "smallexample", 12 }, /* TEXICMD_SMALLEXAMPLE */
1.20 kristaps 286: { dodisplay, "smallformat", 11 }, /* TEXICMD_SMALLFORMAT */
1.13 kristaps 287: { dodisplay, "smallindentblock", 16 }, /* TEXICMD_SMALLINDENTBLOCK */
1.3 kristaps 288: { dosymbol, "{", 1 }, /* TEXICMD_SQUIGGLE_LEFT */
289: { dosymbol, "}", 1 }, /* TEXICMD_SQUIGGLE_RIGHT */
1.35 kristaps 290: { dosymbol, "ss", 2 }, /* TEXICMD_SS */
1.21 kristaps 291: { doinline, "strong", 6 }, /* TEXICMD_STRONG */
1.20 kristaps 292: { dosubsection, "subheading", 10 }, /* TEXICMD_SUBHEADING */
1.1 kristaps 293: { dosubsection, "subsection", 10 }, /* TEXICMD_SUBSECTION */
1.28 kristaps 294: { dosubsubsection, "subsubheading", 13 }, /* TEXICMD_SUBSUBHEADING */
1.23 kristaps 295: { dosubsubsection, "subsubsection", 13 }, /* TEXICMD_SUBSUBSECTION */
1.3 kristaps 296: { doignline, "subtitle", 8 }, /* TEXICMD_SUBTITLE */
1.25 kristaps 297: { doignline, "summarycontents", 15 }, /* TEXICMD_SUMMARYCONTENTS */
1.50 kristaps 298: { dodefindex, "synindex", 8 }, /* TEXICMD_SYNINDEX */
299: { dodefindex, "syncodeindex", 12 }, /* TEXICMD_SYNCODEINDEX */
1.21 kristaps 300: { doinline, "t", 1 }, /* TEXICMD_T */
1.18 kristaps 301: { dotab, "tab", 3 }, /* TEXICMD_TAB */
302: { dosymbol, "\t", 1 }, /* TEXICMD_TABSYM */
1.1 kristaps 303: { dotable, "table", 5 }, /* TEXICMD_TABLE */
304: { doignblock, "tex", 3 }, /* TEXICMD_TEX */
305: { dosymbol, "TeX", 3 }, /* TEXICMD_TEXSYM */
1.43 kristaps 306: { dosymbol, "textdegree", 10 }, /* TEXICMD_TEXTDEGREE */
1.42 kristaps 307: { dosymbol, "TH", 2 }, /* TEXICMD_TH */
308: { dosymbol, "th", 2 }, /* TEXICMD_THSMALL */
1.35 kristaps 309: { dosymbol, "tie", 3 }, /* TEXICMD_TIE */
1.42 kristaps 310: { doaccent, "tieaccent", 9 }, /* TEXICMD_TIEACCENT */
1.16 kristaps 311: { doaccent, "~", 1 }, /* TEXICMD_TILDE */
1.25 kristaps 312: { doignline, "tindex", 6 }, /* TEXICMD_TINDEX */
1.3 kristaps 313: { doignline, "title", 5 }, /* TEXICMD_TITLE */
1.1 kristaps 314: { dobracket, "titlefont", 9 }, /* TEXICMD_TITLEFONT */
315: { doignblock, "titlepage", 9 }, /* TEXICMD_TITLEPAGE */
316: { dotop, "top", 3 }, /* TEXICMD_TOP */
1.42 kristaps 317: { doaccent, "u", 1 }, /* TEXICMD_U */
318: { doaccent, "ubaraccent", 10 }, /* TEXICMD_UBARACCENT */
319: { doaccent, "udotaccent", 10 }, /* TEXICMD_UDOTACCENT */
1.16 kristaps 320: { doaccent, "\"", 1 }, /* TEXICMD_UMLAUT */
1.12 kristaps 321: { dosection, "unnumbered", 10 }, /* TEXICMD_UNNUMBERED */
1.2 kristaps 322: { dosection, "unnumberedsec", 13 }, /* TEXICMD_UNNUMBEREDSEC */
1.20 kristaps 323: { dosubsection, "unnumberedsubsec", 16 }, /* TEXICMD_UNNUMBEREDSUBSEC */
1.23 kristaps 324: { dosubsubsection, "unnumberedsubsubsec", 19 }, /* TEXICMD_UNNUMBEREDSUBSUBSEC */
1.8 kristaps 325: { dolink, "uref", 4 }, /* TEXICMD_UREF */
326: { dolink, "url", 3 }, /* TEXICMD_URL */
1.34 kristaps 327: { doignline, "", 0 }, /* TEXICMD_USER_INDEX */
1.42 kristaps 328: { doaccent, "v", 1 }, /* TEXICMD_V */
1.24 kristaps 329: { dovalue, "value", 5 }, /* TEXICMD_VALUE */
1.12 kristaps 330: { doinline, "var", 3 }, /* TEXICMD_VAR */
1.33 kristaps 331: { doverb, "verb", 4 }, /* TEXICMD_VERB */
332: { doverbatim, "verbatim", 8 }, /* TEXICMD_VERBATIM */
1.16 kristaps 333: { doverbinclude, "verbatiminclude", 15 }, /* TEXICMD_VERBATIMINCLUDE */
1.18 kristaps 334: { doignline, "vindex", 6 }, /* TEXICMD_VINDEX */
1.9 kristaps 335: { dosp, "vskip", 5 }, /* TEXICMD_VSKIP */
1.20 kristaps 336: { dotable, "vtable", 6 }, /* TEXICMD_VTABLE */
1.3 kristaps 337: { dobracket, "w", 1 }, /* TEXICMD_W */
1.8 kristaps 338: { dolink, "xref", 4 }, /* TEXICMD_XREF */
1.20 kristaps 339: /* TEXICMD__END */
1.1 kristaps 340: };
341:
1.24 kristaps 342: const struct texitok *const texitoks = __texitoks;
1.18 kristaps 343:
1.2 kristaps 344: static void
1.46 kristaps 345: dodefindex(struct texi *p, enum texicmd cmd, size_t *pos)
1.27 kristaps 346: {
347: size_t start, end;
348: char *cp;
349:
1.46 kristaps 350: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
351: advance(p, pos);
1.27 kristaps 352:
353: start = end = *pos;
1.46 kristaps 354: while (end < BUFSZ(p) && ! ismspace(BUF(p)[end]))
1.27 kristaps 355: end++;
356:
357: if (start == end) {
1.46 kristaps 358: advanceeoln(p, pos, 1);
1.27 kristaps 359: return;
360: } else if (NULL == (cp = malloc(end - start + 1)))
361: texiabort(p, NULL);
362:
1.46 kristaps 363: memcpy(cp, &BUF(p)[start], end - start);
1.27 kristaps 364: cp[end - start] = '\0';
365:
366: p->indexs = realloc(p->indexs,
367: sizeof(char *) * (p->indexsz + 1));
368:
369: if (NULL == p->indexs)
370: texiabort(p, NULL);
371: p->indexs[p->indexsz++] = cp;
372: }
373:
374: static void
1.46 kristaps 375: dodefn(struct texi *p, enum texicmd cmd, size_t *pos)
1.3 kristaps 376: {
377: const char *blk;
378:
1.5 kristaps 379: blk = NULL;
1.3 kristaps 380: switch (cmd) {
1.15 kristaps 381: case (TEXICMD_DEFFN):
1.35 kristaps 382: case (TEXICMD_DEFMAC):
1.15 kristaps 383: case (TEXICMD_DEFTP):
1.3 kristaps 384: case (TEXICMD_DEFTYPEFN):
385: case (TEXICMD_DEFTYPEFUN):
1.34 kristaps 386: case (TEXICMD_DEFTYPEMETHOD):
1.15 kristaps 387: case (TEXICMD_DEFTYPEVAR):
388: case (TEXICMD_DEFTYPEVR):
389: case (TEXICMD_DEFUN):
390: case (TEXICMD_DEFVAR):
391: case (TEXICMD_DEFVR):
1.5 kristaps 392: blk = texitoks[cmd].tok;
1.3 kristaps 393: break;
1.5 kristaps 394: default:
1.3 kristaps 395: break;
396: }
397:
398: if (p->ign) {
1.15 kristaps 399: NULL != blk ?
1.46 kristaps 400: parseto(p, pos, blk) :
401: parseeoln(p, pos);
1.3 kristaps 402: return;
403: }
404:
1.15 kristaps 405: if (NULL != blk)
406: texivspace(p);
407:
1.3 kristaps 408: switch (cmd) {
1.34 kristaps 409: case (TEXICMD_DEFTYPEMETHOD):
410: case (TEXICMD_DEFTYPEMETHODX):
411: texiputchars(p, "Method");
412: break;
1.15 kristaps 413: case (TEXICMD_DEFMAC):
414: case (TEXICMD_DEFMACX):
415: texiputchars(p, "Macro");
416: break;
417: case (TEXICMD_DEFTYPEVAR):
418: case (TEXICMD_DEFTYPEVARX):
419: case (TEXICMD_DEFVAR):
420: case (TEXICMD_DEFVARX):
421: texiputchars(p, "Variable");
422: break;
1.3 kristaps 423: case (TEXICMD_DEFTYPEFUN):
1.15 kristaps 424: case (TEXICMD_DEFTYPEFUNX):
425: case (TEXICMD_DEFUN):
426: case (TEXICMD_DEFUNX):
427: texiputchars(p, "Function");
1.3 kristaps 428: break;
429: default:
1.46 kristaps 430: parselinearg(p, pos);
1.3 kristaps 431: break;
432: }
1.15 kristaps 433:
1.48 kristaps 434: texiputchar(p, ':');
435: texiputchar(p, '\n');
1.15 kristaps 436:
437: switch (cmd) {
438: case (TEXICMD_DEFMAC):
439: case (TEXICMD_DEFMACX):
440: teximacroopen(p, "Dv");
1.46 kristaps 441: while (parselinearg(p, pos))
1.15 kristaps 442: /* Spin. */ ;
443: teximacroclose(p);
444: break;
445: case (TEXICMD_DEFFN):
446: case (TEXICMD_DEFFNX):
447: case (TEXICMD_DEFUN):
448: case (TEXICMD_DEFUNX):
449: teximacroopen(p, "Fo");
1.46 kristaps 450: parselinearg(p, pos);
1.15 kristaps 451: teximacroclose(p);
452: teximacroopen(p, "Fa");
1.46 kristaps 453: while (parselinearg(p, pos))
1.15 kristaps 454: /* Spin. */ ;
455: teximacroclose(p);
456: teximacro(p, "Fc");
457: break;
458: case (TEXICMD_DEFTYPEFUN):
459: case (TEXICMD_DEFTYPEFUNX):
460: case (TEXICMD_DEFTYPEFN):
461: case (TEXICMD_DEFTYPEFNX):
1.34 kristaps 462: case (TEXICMD_DEFTYPEMETHOD):
463: case (TEXICMD_DEFTYPEMETHODX):
1.15 kristaps 464: teximacroopen(p, "Ft");
1.46 kristaps 465: parselinearg(p, pos);
1.15 kristaps 466: teximacroclose(p);
467: teximacroopen(p, "Fo");
1.46 kristaps 468: parselinearg(p, pos);
1.15 kristaps 469: teximacroclose(p);
470: teximacroopen(p, "Fa");
1.46 kristaps 471: while (parselinearg(p, pos))
1.15 kristaps 472: /* Spin. */ ;
473: teximacroclose(p);
474: teximacro(p, "Fc");
475: break;
476: case (TEXICMD_DEFTP):
477: case (TEXICMD_DEFTPX):
478: case (TEXICMD_DEFTYPEVAR):
479: case (TEXICMD_DEFTYPEVARX):
480: case (TEXICMD_DEFTYPEVR):
481: case (TEXICMD_DEFTYPEVRX):
482: teximacroopen(p, "Vt");
1.46 kristaps 483: while (parselinearg(p, pos))
1.15 kristaps 484: /* Spin. */ ;
485: teximacroclose(p);
486: break;
487: case (TEXICMD_DEFVAR):
488: case (TEXICMD_DEFVARX):
489: case (TEXICMD_DEFVR):
490: case (TEXICMD_DEFVRX):
491: teximacroopen(p, "Va");
1.46 kristaps 492: while (parselinearg(p, pos))
1.15 kristaps 493: /* Spin. */ ;
494: teximacroclose(p);
495: break;
496: default:
497: abort();
1.3 kristaps 498: }
1.15 kristaps 499:
1.54 kristaps 500: if (NULL == blk)
501: return;
502:
503: /*
504: * All "block" definitions have their block bodies indented
505: * unless they have the "x" form of the command following.
506: * E.g.,
507: * @deffn some function
508: * @deffnx another
509: * An explanation.
510: * @end deffn
511: * With this loop, we delay opening the indented block until we
512: * skipped past conformant macros.
513: */
514: for (;;) {
515: switch (peekcmd(p, *pos)) {
516: case (TEXICMD_DEFFNX):
517: case (TEXICMD_DEFMACX):
518: case (TEXICMD_DEFTPX):
519: case (TEXICMD_DEFTYPEFNX):
520: case (TEXICMD_DEFTYPEFUNX):
521: case (TEXICMD_DEFTYPEMETHODX):
522: case (TEXICMD_DEFTYPEVARX):
523: case (TEXICMD_DEFTYPEVRX):
524: case (TEXICMD_DEFUNX):
525: case (TEXICMD_DEFVARX):
526: case (TEXICMD_DEFVRX):
527: texivspace(p);
528: parseeoln(p, pos);
529: continue;
530: default:
531: break;
532: }
533: break;
534: }
535: teximacro(p, "Bd -filled -offset indent");
536: p->seenvs = 1;
537: parseto(p, pos, blk);
538: teximacro(p, "Ed");
1.3 kristaps 539: }
540:
541: static void
1.46 kristaps 542: domacro(struct texi *p, enum texicmd cmd, size_t *pos)
1.30 kristaps 543: {
544: size_t start, end, endtoksz, len;
545: struct teximacro m;
546: const char *endtok, *blk;
547:
548: memset(&m, 0, sizeof(struct teximacro));
549:
1.46 kristaps 550: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
551: advance(p, pos);
1.30 kristaps 552:
1.46 kristaps 553: for (start = end = *pos; end < BUFSZ(p); end++)
554: if (ismspace(BUF(p)[end]) || '{' == BUF(p)[end])
1.30 kristaps 555: break;
556:
557: if (start == end)
558: texierr(p, "zero-length macro name");
559:
1.46 kristaps 560: advanceto(p, pos, end);
1.30 kristaps 561:
562: m.key = malloc(end - start + 1);
563: if (NULL == m.key)
564: texiabort(p, NULL);
1.46 kristaps 565: memcpy(m.key, &BUF(p)[start], end - start);
1.30 kristaps 566: m.key[end - start] = '\0';
567:
1.46 kristaps 568: m.args = argparse(p, pos, &m.argsz, 0);
1.30 kristaps 569:
1.46 kristaps 570: /* Note: we advance to the beginning of the macro. */
571: advanceeoln(p, pos, 1);
572:
573: /*
574: * According to the Texinfo manual, the macro ends on the
575: * newline subsequent the @end macro.
576: * That's COMPLETELY FUCKING WRONG.
577: * It ends inclusive the newline, which is why so many macros
578: * say things like @r{hello}@c, where the subsequent @c swallows
579: * the newline.
580: * However, it does swallow the leading newline, so look for the
581: * @end macro without the leading newline else we might look
582: * past empty macros.
583: */
1.30 kristaps 584: start = *pos;
1.46 kristaps 585: endtok = "@end macro\n";
1.30 kristaps 586: endtoksz = strlen(endtok);
1.46 kristaps 587: blk = memmem(&BUF(p)[start], BUFSZ(p) - start, endtok, endtoksz);
1.30 kristaps 588: if (NULL == blk)
589: texierr(p, "unterminated macro body");
1.46 kristaps 590: /* Roll us back one character. */
591: while (&BUF(p)[*pos] != blk)
592: advance(p, pos);
593: assert('@' == BUF(p)[*pos]);
594: if ('\n' != BUF(p)[*pos - 1])
595: texierr(p, "cannot handle @end macro in-line");
596:
597: len = blk - &BUF(p)[start];
1.30 kristaps 598: m.value = malloc(len + 1);
599: if (NULL == m.value)
600: texiabort(p, NULL);
1.46 kristaps 601: memcpy(m.value, &BUF(p)[start], len);
1.30 kristaps 602: m.value[len] = '\0';
603:
604: p->macros = realloc
605: (p->macros,
606: (p->macrosz + 1) *
607: sizeof(struct teximacro));
608: if (NULL == p->macros)
609: texiabort(p, NULL);
610:
611: p->macros[p->macrosz++] = m;
1.46 kristaps 612: advanceeoln(p, pos, 1);
1.30 kristaps 613: }
614:
615: static void
1.46 kristaps 616: doignblock(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 617: {
1.45 kristaps 618: char end[32], start[32];
619: const char *endt, *startt;
620: size_t esz, ssz, newpos, stack;
1.26 kristaps 621:
622: /*
1.45 kristaps 623: * FIXME: this is cheating.
624: * These tokens are supposed to begin on a newline.
625: * However, if we do that, then we would need to check within
626: * the loop for trailer (or leading, as the case may be)
627: * newline, and that's just a bit too complicated right now.
628: * This is becasue
629: * @ifset BAR
630: * @ifset FOO
631: * @end ifset
632: * @end ifset
633: * won't work right now: we'd read after the first "@end ifset"
634: * to the next line, then look for the next line after that.
1.26 kristaps 635: */
1.45 kristaps 636: ssz = snprintf(start, sizeof(start),
637: "@%s", texitoks[cmd].tok);
638: assert(ssz < sizeof(start));
639: esz = snprintf(end, sizeof(end),
640: "@end %s\n", texitoks[cmd].tok);
641: assert(esz < sizeof(end));
642: stack = 1;
643:
644: /*
645: * Here we look for the end token "end" somewhere in the file in
646: * front of us.
647: * It's not that easy, of course: if we have a nested block,
648: * then there'll be an "end" token of the same kind between us.
649: * Thus, we keep track of scopes for matching "end" blocks.
1.26 kristaps 650: */
1.46 kristaps 651: while (stack > 0 && *pos < BUFSZ(p)) {
1.52 kristaps 652: if (stack > 64)
653: texierr(p, "run-away nested stack?");
1.46 kristaps 654: endt = memmem(&BUF(p)[*pos], BUFSZ(p) - *pos, end, esz);
655: startt = memmem(&BUF(p)[*pos], BUFSZ(p) - *pos, start, ssz);
1.45 kristaps 656: if (NULL == endt) {
657: texiwarn(p, "unterminated \"%s\" "
658: "block", texitoks[cmd].tok);
1.46 kristaps 659: *pos = BUFSZ(p);
1.45 kristaps 660: break;
661: }
1.26 kristaps 662:
1.45 kristaps 663: newpos = *pos;
664: if (NULL == startt || startt > endt) {
1.46 kristaps 665: newpos += esz + (size_t)(endt - &BUF(p)[*pos]);
1.45 kristaps 666: stack--;
667: } else {
1.46 kristaps 668: newpos += ssz + (size_t)(startt - &BUF(p)[*pos]);
1.45 kristaps 669: stack++;
670: }
671:
1.46 kristaps 672: assert(newpos <= BUFSZ(p));
1.45 kristaps 673: while (*pos < newpos)
1.46 kristaps 674: advance(p, pos);
1.45 kristaps 675: }
1.1 kristaps 676: }
677:
678: static void
1.46 kristaps 679: doblock(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 680: {
681:
1.46 kristaps 682: parseto(p, pos, texitoks[cmd].tok);
1.1 kristaps 683: }
684:
685: static void
1.46 kristaps 686: doinline(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 687: {
1.21 kristaps 688: const char *macro = NULL;
1.12 kristaps 689:
690: switch (cmd) {
1.21 kristaps 691: case (TEXICMD_CODE):
692: case (TEXICMD_KBD):
693: case (TEXICMD_SAMP):
694: case (TEXICMD_T):
695: macro = "Li";
696: break;
697: case (TEXICMD_CITE):
698: case (TEXICMD_DFN):
699: case (TEXICMD_EMPH):
700: case (TEXICMD_I):
701: case (TEXICMD_SLANTED):
702: macro = "Em";
703: break;
704: case (TEXICMD_B):
705: case (TEXICMD_STRONG):
706: macro = "Sy";
707: break;
1.12 kristaps 708: case (TEXICMD_COMMAND):
709: macro = "Xr";
710: break;
711: case (TEXICMD_ENV):
712: macro = "Ev";
713: break;
714: case (TEXICMD_FILE):
715: macro = "Pa";
716: break;
1.16 kristaps 717: case (TEXICMD_OPTION):
718: macro = "Op";
719: break;
1.12 kristaps 720: case (TEXICMD_VAR):
721: macro = "Va";
722: break;
723: default:
1.22 kristaps 724: break;
1.12 kristaps 725: }
726:
1.25 kristaps 727: if (NULL == macro || p->literal || TEXILIST_TABLE == p->list) {
1.58 ! kristaps 728: if (TEXICMD_SC == cmd)
! 729: p->uppercase++;
1.53 kristaps 730: parsebracket(p, pos, 0);
1.58 ! kristaps 731: if (TEXICMD_SC == cmd)
! 732: p->uppercase--;
1.12 kristaps 733: return;
734: }
1.1 kristaps 735:
1.5 kristaps 736: teximacroopen(p, macro);
1.1 kristaps 737: p->seenws = 0;
1.58 ! kristaps 738: if (TEXICMD_SC == cmd)
! 739: p->uppercase++;
1.53 kristaps 740: parsebracket(p, pos, 0);
1.58 ! kristaps 741: if (TEXICMD_SC == cmd)
! 742: p->uppercase--;
1.46 kristaps 743: texipunctuate(p, pos);
1.5 kristaps 744: teximacroclose(p);
1.1 kristaps 745: }
746:
747: static void
1.46 kristaps 748: doverb(struct texi *p, enum texicmd cmd, size_t *pos)
1.33 kristaps 749: {
750: char delim;
1.34 kristaps 751: size_t start;
1.33 kristaps 752:
1.46 kristaps 753: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
754: advance(p, pos);
755: if (*pos == BUFSZ(p) || '{' != BUF(p)[*pos])
1.33 kristaps 756: return;
1.46 kristaps 757: advance(p, pos);
758: if (*pos == BUFSZ(p))
1.33 kristaps 759: return;
760:
1.46 kristaps 761: delim = BUF(p)[*pos];
762: advance(p, pos);
1.33 kristaps 763: /* Make sure we flush out our initial whitespace... */
764: if (p->seenws && p->outcol && 0 == p->literal)
765: texiputchar(p, ' ');
766: p->seenws = 0;
1.34 kristaps 767: start = *pos;
1.33 kristaps 768: /* Read until we see the delimiter then end-brace. */
1.46 kristaps 769: while (*pos < BUFSZ(p) - 1) {
770: if (BUF(p)[*pos] == delim && BUF(p)[*pos + 1] == '}')
1.33 kristaps 771: break;
1.46 kristaps 772: advance(p, pos);
1.33 kristaps 773: }
1.51 kristaps 774: if (*pos >= BUFSZ(p) - 1)
1.33 kristaps 775: return;
1.46 kristaps 776: texiputbuf(p, start, *pos);
1.34 kristaps 777:
1.33 kristaps 778: /* Make sure we read after the end-brace. */
1.46 kristaps 779: assert(delim == BUF(p)[*pos]);
780: advance(p, pos);
781: assert('}' == BUF(p)[*pos]);
782: advance(p, pos);
1.33 kristaps 783: }
784:
785: static void
1.46 kristaps 786: doverbatim(struct texi *p, enum texicmd cmd, size_t *pos)
1.25 kristaps 787: {
788: const char *end, *term;
789: size_t endsz, endpos;
790:
1.45 kristaps 791: /* We read from the @verbatim\n newline inclusive! */
1.25 kristaps 792: end = "\n@end verbatim\n";
793: endsz = strlen(end);
1.46 kristaps 794: advanceeoln(p, pos, 0);
795: if (*pos == BUFSZ(p)) {
1.45 kristaps 796: texiwarn(p, "unexpected end of file");
797: return;
798: }
1.25 kristaps 799:
1.46 kristaps 800: term = memmem(&BUF(p)[*pos], BUFSZ(p) - *pos, end, endsz);
1.45 kristaps 801: if (NULL == term) {
802: texiwarn(p, "unterminated verbatim block");
1.46 kristaps 803: endpos = BUFSZ(p);
1.45 kristaps 804: } else
1.46 kristaps 805: endpos = *pos + (size_t)(term - &BUF(p)[*pos]);
1.25 kristaps 806:
1.46 kristaps 807: assert(endpos <= BUFSZ(p));
808: assert('\n' == BUF(p)[*pos]);
809: advance(p, pos);
1.25 kristaps 810: teximacro(p, "Bd -literal -offset indent");
1.26 kristaps 811: while (*pos < endpos) {
1.46 kristaps 812: texiputchar(p, BUF(p)[*pos]);
813: advance(p, pos);
1.25 kristaps 814: }
815: teximacro(p, "Ed");
1.46 kristaps 816: if (*pos < BUFSZ(p))
817: advanceto(p, pos, endpos + endsz);
1.25 kristaps 818: }
819:
820: static void
1.46 kristaps 821: doverbinclude(struct texi *p, enum texicmd cmd, size_t *pos)
1.16 kristaps 822: {
1.25 kristaps 823: char fname[PATH_MAX], path[PATH_MAX];
824: int rc;
825: size_t i, end;
826: const char *v;
827: enum texicmd type;
1.16 kristaps 828:
1.46 kristaps 829: while (*pos < BUFSZ(p) && ' ' == BUF(p)[*pos])
830: advance(p, pos);
1.16 kristaps 831:
1.46 kristaps 832: for (i = 0; *pos < BUFSZ(p) && '\n' != BUF(p)[*pos]; ) {
1.16 kristaps 833: if (i == sizeof(fname) - 1)
834: break;
1.46 kristaps 835: if ('@' != BUF(p)[*pos]) {
836: fname[i++] = BUF(p)[*pos];
837: advance(p, pos);
1.25 kristaps 838: continue;
839: }
1.46 kristaps 840: type = texicmd(p, *pos, &end, NULL);
841: advanceto(p, pos, end);
1.25 kristaps 842: if (TEXICMD_VALUE != type)
843: texierr(p, "unknown verbatiminclude command");
1.46 kristaps 844: v = valueblookup(p, pos);
1.25 kristaps 845: if (NULL == v)
846: continue;
847: while ('\0' != *v) {
848: if (i == sizeof(fname) - 1)
849: break;
850: fname[i++] = *v++;
851: }
852: if ('\0' != *v)
853: break;
1.16 kristaps 854: }
855:
856: if (i == 0)
857: texierr(p, "path too short");
1.46 kristaps 858: else if ('\n' != BUF(p)[*pos])
1.16 kristaps 859: texierr(p, "path too long");
860: else if ('/' == fname[0])
861: texierr(p, "no absolute paths");
862: fname[i] = '\0';
863:
864: if (strstr(fname, "../") || strstr(fname, "/.."))
865: texierr(p, "insecure path");
866:
867: rc = snprintf(path, sizeof(path),
868: "%s/%s", p->dirs[0], fname);
869: if (rc < 0)
870: texierr(p, "couldn't format path");
871: else if ((size_t)rc >= sizeof(path))
872: texierr(p, "path too long");
873:
874: parsefile(p, path, 0);
875: }
876:
877: static void
1.46 kristaps 878: doinclude(struct texi *p, enum texicmd cmd, size_t *pos)
1.2 kristaps 879: {
1.25 kristaps 880: char fname[PATH_MAX], path[PATH_MAX];
881: size_t i, end;
882: int rc;
883: const char *v;
884: enum texicmd type;
1.2 kristaps 885:
1.46 kristaps 886: while (*pos < BUFSZ(p) && ' ' == BUF(p)[*pos])
887: advance(p, pos);
1.2 kristaps 888:
889: /* Read in the filename. */
1.46 kristaps 890: for (i = 0; *pos < BUFSZ(p) && '\n' != BUF(p)[*pos]; ) {
1.2 kristaps 891: if (i == sizeof(fname) - 1)
892: break;
1.46 kristaps 893: if ('@' != BUF(p)[*pos]) {
894: fname[i++] = BUF(p)[*pos];
895: advance(p, pos);
1.25 kristaps 896: continue;
897: }
1.46 kristaps 898: type = texicmd(p, *pos, &end, NULL);
899: advanceto(p, pos, end);
1.25 kristaps 900: if (TEXICMD_VALUE != type)
901: texierr(p, "unknown include command");
1.46 kristaps 902: v = valueblookup(p, pos);
1.25 kristaps 903: if (NULL == v)
904: continue;
905: while ('\0' != *v) {
906: if (i == sizeof(fname) - 1)
907: break;
908: fname[i++] = *v++;
909: }
910: if ('\0' != *v)
911: break;
1.2 kristaps 912: }
913:
914: if (i == 0)
915: texierr(p, "path too short");
1.46 kristaps 916: else if ('\n' != BUF(p)[*pos])
1.2 kristaps 917: texierr(p, "path too long");
918: else if ('/' == fname[0])
919: texierr(p, "no absolute paths");
920: fname[i] = '\0';
921:
922: if (strstr(fname, "../") || strstr(fname, "/.."))
923: texierr(p, "insecure path");
924:
1.5 kristaps 925: for (i = 0; i < p->dirsz; i++) {
926: rc = snprintf(path, sizeof(path),
927: "%s/%s", p->dirs[i], fname);
928: if (rc < 0)
929: texierr(p, "couldn't format path");
930: else if ((size_t)rc >= sizeof(path))
931: texierr(p, "path too long");
932: else if (-1 == access(path, R_OK))
933: continue;
934:
1.16 kristaps 935: parsefile(p, path, 1);
1.5 kristaps 936: return;
937: }
1.2 kristaps 938:
1.5 kristaps 939: texierr(p, "couldn't find %s in includes", fname);
1.2 kristaps 940: }
941:
942: static void
1.46 kristaps 943: dobracket(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 944: {
945:
1.53 kristaps 946: parsebracket(p, pos, 0);
1.1 kristaps 947: }
948:
949: static void
1.46 kristaps 950: dodisplay(struct texi *p, enum texicmd cmd, size_t *pos)
1.3 kristaps 951: {
952:
1.57 kristaps 953: advanceeoln(p, pos, 1);
954:
1.20 kristaps 955: switch (cmd) {
956: case (TEXICMD_FORMAT):
957: case (TEXICMD_SMALLFORMAT):
958: teximacro(p, "Bd -filled");
959: break;
960: default:
961: teximacro(p, "Bd -filled -offset indent");
962: break;
963: }
964:
1.11 kristaps 965: p->seenvs = 1;
1.46 kristaps 966: parseto(p, pos, texitoks[cmd].tok);
1.5 kristaps 967: teximacro(p, "Ed");
1.3 kristaps 968: }
969:
970: static void
1.46 kristaps 971: doexample(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 972: {
973:
1.57 kristaps 974: advanceeoln(p, pos, 1);
975:
1.5 kristaps 976: teximacro(p, "Bd -literal -offset indent");
1.3 kristaps 977: p->literal++;
1.46 kristaps 978: parseto(p, pos, texitoks[cmd].tok);
1.3 kristaps 979: p->literal--;
1.5 kristaps 980: teximacro(p, "Ed");
1.1 kristaps 981: }
982:
983: static void
1.46 kristaps 984: dobye(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 985: {
986:
987: texiexit(p);
988: exit(EXIT_SUCCESS);
989: }
990:
991: static void
1.46 kristaps 992: dotitle(struct texi *p, enum texicmd cmd, size_t *pos)
1.10 kristaps 993: {
1.57 kristaps 994: size_t start;
1.10 kristaps 995:
1.46 kristaps 996: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
997: advance(p, pos);
1.57 kristaps 998:
999: /* We want to suck down the entire line, inclusive \n. */
1000: start = *pos;
1001: while (*pos < BUFSZ(p) && '\n' != BUF(p)[*pos]) {
1002: if ('@' == BUF(p)[*pos])
1003: advance(p, pos);
1004: advance(p, pos);
1005: }
1006: if (*pos < BUFSZ(p))
1007: advance(p, pos);
1008:
1009: /* Copy this into a buffer. */
1.10 kristaps 1010: free(p->subtitle);
1.57 kristaps 1011: if (NULL == (p->subtitle = malloc(*pos - start + 1)))
1.27 kristaps 1012: texiabort(p, NULL);
1.57 kristaps 1013: memcpy(p->subtitle, &BUF(p)[start], *pos - start);
1014: p->subtitle[*pos - start] = '\0';
1.10 kristaps 1015: }
1016:
1017: static void
1.46 kristaps 1018: doaccent(struct texi *p, enum texicmd cmd, size_t *pos)
1.16 kristaps 1019: {
1.42 kristaps 1020: int brace = 0;
1.16 kristaps 1021:
1.46 kristaps 1022: if (*pos == BUFSZ(p)) {
1.42 kristaps 1023: texiwarn(p, "truncated: @%s", texitoks[cmd].tok);
1.16 kristaps 1024: return;
1.42 kristaps 1025: }
1026:
1027: /* Pad us with space, if necessary. */
1028: if (p->seenws && p->outcol && 0 == p->literal) {
1.34 kristaps 1029: texiputchar(p, ' ');
1.42 kristaps 1030: p->seenws = 0;
1031: }
1032:
1033: /*
1034: * If we're braced, then that's that.
1035: * Otherwise, in a special Texinfo case: if we're a non
1036: * alphabetic command of one letter, then the next character is
1037: * the critical one.
1038: * Otherwise, space can sit between us and our argument.
1039: */
1.46 kristaps 1040: if ('{' == BUF(p)[*pos]) {
1.42 kristaps 1041: brace = 1;
1.46 kristaps 1042: advance(p, pos);
1.49 kristaps 1043: } else if (isalpha((unsigned char)texitoks[cmd].tok[0]))
1.46 kristaps 1044: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1045: advance(p, pos);
1.42 kristaps 1046:
1.46 kristaps 1047: if (*pos == BUFSZ(p)) {
1.42 kristaps 1048: texiwarn(p, "truncated: @%s", texitoks[cmd].tok);
1049: return;
1050: }
1051:
1052: switch (cmd) {
1.16 kristaps 1053: case (TEXICMD_ACUTE):
1.46 kristaps 1054: switch (BUF(p)[*pos]) {
1.16 kristaps 1055: case ('a'): case ('A'):
1056: case ('e'): case ('E'):
1057: case ('i'): case ('I'):
1058: case ('o'): case ('O'):
1059: case ('u'): case ('U'):
1060: texiputchars(p, "\\(\'");
1061: break;
1062: default:
1.42 kristaps 1063: texiwarn(p, "ignoring accent");
1064: break;
1.16 kristaps 1065: }
1.46 kristaps 1066: texiputchar(p, BUF(p)[*pos]);
1067: advance(p, pos);
1.42 kristaps 1068: break;
1069: case (TEXICMD_CEDILLA):
1.46 kristaps 1070: if ('c' == BUF(p)[*pos] || 'C' == BUF(p)[*pos])
1.42 kristaps 1071: texiputchars(p, "\\(,");
1072: else
1073: texiwarn(p, "ignoring accent");
1.46 kristaps 1074: texiputchar(p, BUF(p)[*pos]);
1075: advance(p, pos);
1.16 kristaps 1076: break;
1077: case (TEXICMD_CIRCUMFLEX):
1.46 kristaps 1078: switch (BUF(p)[*pos]) {
1.16 kristaps 1079: case ('a'): case ('A'):
1080: case ('e'): case ('E'):
1081: case ('i'): case ('I'):
1082: case ('o'): case ('O'):
1083: case ('u'): case ('U'):
1084: texiputchars(p, "\\(^");
1085: break;
1086: default:
1.42 kristaps 1087: texiwarn(p, "ignoring accent");
1.34 kristaps 1088: break;
1.16 kristaps 1089: }
1.46 kristaps 1090: texiputchar(p, BUF(p)[*pos]);
1091: advance(p, pos);
1.42 kristaps 1092: break;
1093: case (TEXICMD_DOTLESS):
1.46 kristaps 1094: if ('i' == BUF(p)[*pos] || 'j' == BUF(p)[*pos])
1.42 kristaps 1095: texiputchars(p, "\\(.");
1096: else
1097: texiwarn(p, "ignoring accent");
1.46 kristaps 1098: texiputchar(p, BUF(p)[*pos]);
1099: advance(p, pos);
1.16 kristaps 1100: break;
1101: case (TEXICMD_GRAVE):
1.46 kristaps 1102: switch (BUF(p)[*pos]) {
1.16 kristaps 1103: case ('a'): case ('A'):
1104: case ('e'): case ('E'):
1105: case ('i'): case ('I'):
1106: case ('o'): case ('O'):
1107: case ('u'): case ('U'):
1108: texiputchars(p, "\\(`");
1109: break;
1110: default:
1.42 kristaps 1111: texiwarn(p, "ignoring accent");
1112: break;
1.16 kristaps 1113: }
1.46 kristaps 1114: texiputchar(p, BUF(p)[*pos]);
1115: advance(p, pos);
1.16 kristaps 1116: break;
1117: case (TEXICMD_TILDE):
1.46 kristaps 1118: switch (BUF(p)[*pos]) {
1.16 kristaps 1119: case ('a'): case ('A'):
1120: case ('n'): case ('N'):
1121: case ('o'): case ('O'):
1122: texiputchars(p, "\\(~");
1123: break;
1124: default:
1.42 kristaps 1125: texiwarn(p, "ignoring accent");
1.34 kristaps 1126: break;
1.16 kristaps 1127: }
1.46 kristaps 1128: texiputchar(p, BUF(p)[*pos]);
1129: advance(p, pos);
1.16 kristaps 1130: break;
1131: case (TEXICMD_UMLAUT):
1.46 kristaps 1132: switch (BUF(p)[*pos]) {
1.16 kristaps 1133: case ('a'): case ('A'):
1134: case ('e'): case ('E'):
1135: case ('i'): case ('I'):
1136: case ('o'): case ('O'):
1137: case ('u'): case ('U'):
1138: case ('y'):
1139: texiputchars(p, "\\(:");
1140: break;
1141: default:
1.42 kristaps 1142: texiwarn(p, "ignoring accent");
1.34 kristaps 1143: break;
1.16 kristaps 1144: }
1.46 kristaps 1145: texiputchar(p, BUF(p)[*pos]);
1146: advance(p, pos);
1.16 kristaps 1147: break;
1148: default:
1.46 kristaps 1149: texiputchar(p, BUF(p)[*pos]);
1150: advance(p, pos);
1.42 kristaps 1151: break;
1152: }
1153:
1154: if (brace) {
1.46 kristaps 1155: while (*pos < BUFSZ(p) && '}' != BUF(p)[*pos]) {
1156: texiputchar(p, BUF(p)[*pos]);
1157: advance(p, pos);
1.42 kristaps 1158: }
1.46 kristaps 1159: if (*pos < BUFSZ(p))
1160: advance(p, pos);
1.42 kristaps 1161: }
1162:
1163: switch (cmd) {
1164: case (TEXICMD_TIEACCENT):
1165: texiputchar(p, ']');
1166: break;
1167: case (TEXICMD_DOTACCENT):
1168: texiputchar(p, '*');
1169: break;
1170: default:
1171: break;
1.16 kristaps 1172: }
1173: }
1174:
1175: static void
1.46 kristaps 1176: dosymbol(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1177: {
1178:
1.42 kristaps 1179: /* Remember to pad us. */
1.43 kristaps 1180: if (p->seenws && p->outcol && 0 == p->literal)
1.3 kristaps 1181: texiputchar(p, ' ');
1.43 kristaps 1182:
1183: p->seenws = 0;
1.3 kristaps 1184:
1.1 kristaps 1185: switch (cmd) {
1.42 kristaps 1186: case (TEXICMD_AA):
1187: texiputchars(p, "\\(oA");
1188: break;
1189: case (TEXICMD_AASMALL):
1190: texiputchars(p, "\\(oa");
1191: break;
1192: case (TEXICMD_AE):
1193: texiputchars(p, "\\(AE");
1194: break;
1195: case (TEXICMD_AESMALL):
1196: texiputchars(p, "\\(ae");
1197: break;
1.3 kristaps 1198: case (TEXICMD_ASTERISK):
1199: case (TEXICMD_NEWLINE):
1200: case (TEXICMD_SPACE):
1.18 kristaps 1201: case (TEXICMD_TABSYM):
1.3 kristaps 1202: texiputchar(p, ' ');
1203: break;
1.1 kristaps 1204: case (TEXICMD_AT):
1.3 kristaps 1205: texiputchar(p, '@');
1206: break;
1207: case (TEXICMD_BANG):
1208: texiputchar(p, '!');
1.7 kristaps 1209: break;
1210: case (TEXICMD_BULLET):
1211: texiputchars(p, "\\(bu");
1.1 kristaps 1212: break;
1.35 kristaps 1213: case (TEXICMD_COMMA):
1214: texiputchar(p, ',');
1215: break;
1.1 kristaps 1216: case (TEXICMD_COPYRIGHT):
1217: texiputchars(p, "\\(co");
1218: break;
1.42 kristaps 1219: case (TEXICMD_DH):
1220: texiputchars(p, "\\(-D");
1221: break;
1222: case (TEXICMD_DHSMALL):
1223: texiputchars(p, "\\(Sd");
1224: break;
1.2 kristaps 1225: case (TEXICMD_DOTS):
1.34 kristaps 1226: case (TEXICMD_ENDDOTS):
1.2 kristaps 1227: texiputchars(p, "...");
1228: break;
1.28 kristaps 1229: case (TEXICMD_EQUIV):
1230: texiputchars(p, "\\(==");
1231: break;
1.15 kristaps 1232: case (TEXICMD_ERROR):
1233: texiputchars(p, "error\\(->");
1.17 kristaps 1234: break;
1.43 kristaps 1235: case (TEXICMD_EURO):
1236: texiputchars(p, "\\(Eu");
1237: break;
1.42 kristaps 1238: case (TEXICMD_EXCLAMDOWN):
1239: texiputchars(p, "\\(r!");
1240: break;
1.17 kristaps 1241: case (TEXICMD_EXPANSION):
1242: texiputchars(p, "\\(->");
1.15 kristaps 1243: break;
1.43 kristaps 1244: case (TEXICMD_GEQ):
1245: texiputchars(p, "\\(>=");
1246: break;
1247: case (TEXICMD_GUILLEMETLEFT):
1248: case (TEXICMD_GUILLEMOTLEFT):
1249: texiputchars(p, "\\(Fo");
1250: break;
1251: case (TEXICMD_GUILLEMETRIGHT):
1252: case (TEXICMD_GUILLEMOTRIGHT):
1253: texiputchars(p, "\\(Fc");
1254: break;
1255: case (TEXICMD_GUILSINGLLEFT):
1256: texiputchars(p, "\\(fo");
1257: break;
1258: case (TEXICMD_GUILSINGLRIGHT):
1259: texiputchars(p, "\\(fc");
1260: break;
1.42 kristaps 1261: case (TEXICMD_L):
1262: texiputchars(p, "\\(/L");
1263: break;
1.1 kristaps 1264: case (TEXICMD_LATEX):
1265: texiputchars(p, "LaTeX");
1266: break;
1.43 kristaps 1267: case (TEXICMD_LEQ):
1268: texiputchars(p, "\\(<=");
1269: break;
1.42 kristaps 1270: case (TEXICMD_LSMALL):
1271: texiputchars(p, "\\(/l");
1272: break;
1.25 kristaps 1273: case (TEXICMD_MINUS):
1274: texiputchars(p, "\\-");
1275: break;
1.42 kristaps 1276: case (TEXICMD_O):
1277: texiputchars(p, "\\(/O");
1278: break;
1279: case (TEXICMD_OE):
1280: texiputchars(p, "\\(OE");
1281: break;
1282: case (TEXICMD_OESMALL):
1283: texiputchars(p, "\\(oe");
1284: break;
1285: case (TEXICMD_ORDF):
1286: texiputchars(p, "a");
1287: break;
1288: case (TEXICMD_ORDM):
1289: texiputchars(p, "o");
1290: break;
1291: case (TEXICMD_OSMALL):
1292: texiputchars(p, "\\(/o");
1293: break;
1.25 kristaps 1294: case (TEXICMD_PERIOD):
1295: texiputchar(p, '.');
1296: break;
1.43 kristaps 1297: case (TEXICMD_POUNDS):
1298: texiputchars(p, "\\(Po");
1299: break;
1.42 kristaps 1300: case (TEXICMD_QUESTIONDOWN):
1301: texiputchars(p, "\\(r?");
1302: break;
1.3 kristaps 1303: case (TEXICMD_QUESTIONMARK):
1304: texiputchar(p, '?');
1.15 kristaps 1305: break;
1.43 kristaps 1306: case (TEXICMD_QUOTEDBLBASE):
1307: texiputchars(p, "\\(Bq");
1308: break;
1309: case (TEXICMD_QUOTEDBLLEFT):
1310: texiputchars(p, "\\(lq");
1311: break;
1312: case (TEXICMD_QUOTEDBLRIGHT):
1313: texiputchars(p, "\\(rq");
1314: break;
1315: case (TEXICMD_QUOTESINGLBASE):
1316: texiputchars(p, "\\(bq");
1317: break;
1318: case (TEXICMD_QUOTELEFT):
1319: texiputchars(p, "\\(oq");
1320: break;
1321: case (TEXICMD_QUOTERIGHT):
1322: texiputchars(p, "\\(cq");
1323: break;
1324: case (TEXICMD_REGISTEREDSYMBOL):
1325: texiputchars(p, "\\(rg");
1326: break;
1.15 kristaps 1327: case (TEXICMD_RESULT):
1328: texiputchars(p, "\\(rA");
1.3 kristaps 1329: break;
1.34 kristaps 1330: case (TEXICMD_SLASH):
1331: texiputchar(p, '/');
1332: break;
1.35 kristaps 1333: case (TEXICMD_SS):
1334: texiputchars(p, "\\(ss");
1335: break;
1.3 kristaps 1336: case (TEXICMD_SQUIGGLE_LEFT):
1337: texiputchars(p, "{");
1338: break;
1339: case (TEXICMD_SQUIGGLE_RIGHT):
1340: texiputchars(p, "}");
1341: break;
1.38 kristaps 1342: case (TEXICMD_TEXSYM):
1.35 kristaps 1343: texiputchars(p, "TeX");
1.43 kristaps 1344: break;
1345: case (TEXICMD_TEXTDEGREE):
1346: texiputchars(p, "\\(de");
1.35 kristaps 1347: break;
1.42 kristaps 1348: case (TEXICMD_TH):
1349: texiputchars(p, "\\(TP");
1350: break;
1351: case (TEXICMD_THSMALL):
1352: texiputchars(p, "\\(Tp");
1353: break;
1.38 kristaps 1354: case (TEXICMD_TIE):
1.35 kristaps 1355: texiputchars(p, "\\ ");
1.1 kristaps 1356: break;
1.3 kristaps 1357: case (TEXICMD_COLON):
1358: case (TEXICMD_HYPHEN):
1359: break;
1.1 kristaps 1360: default:
1361: abort();
1362: }
1363:
1.42 kristaps 1364: /* Alphabetic commands have braces we ignore. */
1.49 kristaps 1365: if (isalpha((unsigned char)texitoks[cmd].tok[0]))
1.46 kristaps 1366: doignbracket(p, cmd, pos);
1.1 kristaps 1367: }
1368:
1369: static void
1.46 kristaps 1370: doquotation(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1371: {
1372:
1.5 kristaps 1373: teximacro(p, "Qo");
1.46 kristaps 1374: parseto(p, pos, "quotation");
1.5 kristaps 1375: teximacro(p, "Qc");
1.1 kristaps 1376: }
1377:
1.3 kristaps 1378: static void
1.46 kristaps 1379: domath(struct texi *p, enum texicmd cmd, size_t *pos)
1.3 kristaps 1380: {
1381:
1.53 kristaps 1382: parsebracket(p, pos, 1);
1.24 kristaps 1383: }
1384:
1385: static void
1.46 kristaps 1386: dovalue(struct texi *p, enum texicmd cmd, size_t *pos)
1.24 kristaps 1387: {
1.46 kristaps 1388: size_t start, end;
1.25 kristaps 1389: char *key, *val;
1390: const char *cp;
1.24 kristaps 1391:
1392: if (TEXICMD_SET == cmd) {
1.46 kristaps 1393: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1394: advance(p, pos);
1395: for (start = end = *pos; end < BUFSZ(p); end++)
1396: if (ismspace(BUF(p)[end]))
1.24 kristaps 1397: break;
1.25 kristaps 1398: /* We don't allow empty keys. */
1.24 kristaps 1399: if (start == end)
1400: return;
1.46 kristaps 1401: advanceto(p, pos, end);
1.24 kristaps 1402:
1403: key = malloc(end - start + 1);
1.27 kristaps 1404: if (NULL == key)
1405: texiabort(p, NULL);
1.46 kristaps 1406: memcpy(key, &BUF(p)[start], end - start);
1.24 kristaps 1407: key[end - start] = '\0';
1408:
1.46 kristaps 1409: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1410: advance(p, pos);
1411: for (start = end = *pos; end < BUFSZ(p); end++)
1412: if ('\n' == BUF(p)[end])
1.24 kristaps 1413: break;
1.25 kristaps 1414: /* We do allow empty values. */
1.46 kristaps 1415: advanceeoln(p, pos, 1);
1.24 kristaps 1416:
1417: val = malloc(end - start + 1);
1.27 kristaps 1418: if (NULL == val)
1419: texiabort(p, NULL);
1.46 kristaps 1420: memcpy(val, &BUF(p)[start], end - start);
1.24 kristaps 1421: val[end - start] = '\0';
1.25 kristaps 1422: valueadd(p, key, val);
1.24 kristaps 1423: } else if (TEXICMD_VALUE == cmd) {
1424: if (p->seenws)
1425: texiputchar(p, ' ');
1426: p->seenws = 0;
1.46 kristaps 1427: if (NULL != (cp = valueblookup(p, pos)))
1.56 kristaps 1428: texisplice(p, cp, strlen(cp), *pos);
1.46 kristaps 1429: else
1.25 kristaps 1430: texiputchars(p, "{No value}");
1.24 kristaps 1431: } else if (TEXICMD_IFCLEAR == cmd) {
1.46 kristaps 1432: if (NULL != valuellookup(p, pos))
1433: doignblock(p, cmd, pos);
1.26 kristaps 1434: else
1.46 kristaps 1435: parseto(p, pos, texitoks[cmd].tok);
1.30 kristaps 1436: } else if (TEXICMD_IFSET == cmd) {
1.46 kristaps 1437: if (NULL == valuellookup(p, pos))
1438: doignblock(p, cmd, pos);
1.30 kristaps 1439: else
1.46 kristaps 1440: parseto(p, pos, texitoks[cmd].tok);
1.25 kristaps 1441: } else if (TEXICMD_CLEAR == cmd)
1.46 kristaps 1442: valuelclear(p, pos);
1.3 kristaps 1443: }
1444:
1.1 kristaps 1445: static void
1.46 kristaps 1446: dolink(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1447: {
1.8 kristaps 1448: int c;
1.1 kristaps 1449:
1450: switch (cmd) {
1451: case (TEXICMD_EMAIL):
1.5 kristaps 1452: teximacroopen(p, "Mt");
1.1 kristaps 1453: break;
1.3 kristaps 1454: case (TEXICMD_UREF):
1.1 kristaps 1455: case (TEXICMD_URL):
1.44 kristaps 1456: case (TEXICMD_INDICATEURL):
1.5 kristaps 1457: teximacroopen(p, "Lk");
1.1 kristaps 1458: break;
1.8 kristaps 1459: case (TEXICMD_XREF):
1460: texiputchars(p, "See Section");
1.39 kristaps 1461: teximacroopen(p, "Dq");
1.8 kristaps 1462: break;
1463: case (TEXICMD_PXREF):
1464: texiputchars(p, "see Section");
1.39 kristaps 1465: teximacroopen(p, "Dq");
1.8 kristaps 1466: break;
1.34 kristaps 1467: case (TEXICMD_INFOREF):
1468: texiputchars(p, "See Info file node");
1.39 kristaps 1469: teximacroopen(p, "Dq");
1.34 kristaps 1470: break;
1.1 kristaps 1471: default:
1.8 kristaps 1472: abort();
1.1 kristaps 1473: }
1.8 kristaps 1474:
1.46 kristaps 1475: c = parsearg(p, pos, 0);
1.8 kristaps 1476: p->ign++;
1477: while (c > 0)
1.46 kristaps 1478: c = parsearg(p, pos, 1);
1.8 kristaps 1479: p->ign--;
1480:
1.46 kristaps 1481: texipunctuate(p, pos);
1.8 kristaps 1482: teximacroclose(p);
1483: }
1484:
1485: static void
1.46 kristaps 1486: doignargn(struct texi *p, enum texicmd cmd, size_t *pos)
1.8 kristaps 1487: {
1488: int c;
1489:
1.46 kristaps 1490: c = parsearg(p, pos, 0);
1.8 kristaps 1491: p->ign++;
1492: while (c > 0)
1.46 kristaps 1493: c = parsearg(p, pos, 1);
1.8 kristaps 1494: p->ign--;
1.1 kristaps 1495: }
1496:
1.23 kristaps 1497: /*
1498: * Sections can be made subsections and so on by way of the
1499: * @raiseections and @lowersections commands.
1500: * Perform this check here and return the actual section number adjusted
1501: * to the raise level.
1502: */
1503: static int
1504: sectioner(struct texi *p, int sec)
1505: {
1506:
1507: if ((sec -= p->secoffs) < 0) {
1508: texiwarn(p, "section below minimum, clamping");
1509: return(0);
1510: } else if (sec >= SECTSZ) {
1511: texiwarn(p, "section above maximum, clamping");
1512: return(SECTSZ - 1);
1513: }
1514: return(sec);
1515: }
1516:
1517: static void
1.46 kristaps 1518: dosubsubsection(struct texi *p, enum texicmd cmd, size_t *pos)
1.23 kristaps 1519: {
1520: int sec;
1521:
1522: sec = sectioner(p, 3);
1523:
1524: /* We don't have a subsubsubsection, so make one up. */
1525: texivspace(p);
1526: teximacroopen(p, sects[sec]);
1.46 kristaps 1527: parseeoln(p, pos);
1.23 kristaps 1528: teximacroclose(p);
1529: texivspace(p);
1530: }
1531:
1.1 kristaps 1532: static void
1.46 kristaps 1533: dosubsection(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1534: {
1.23 kristaps 1535: int sec;
1536:
1537: sec = sectioner(p, 2);
1.13 kristaps 1538:
1539: if (p->outmacro)
1.23 kristaps 1540: texierr(p, "\"%s\" in open line scope!?", sects[sec]);
1.13 kristaps 1541: else if (p->literal)
1.23 kristaps 1542: texierr(p, "\"%s\" in a literal scope!?", sects[sec]);
1.1 kristaps 1543:
1.21 kristaps 1544: /* We don't have a subsubsection, so make one up. */
1.34 kristaps 1545: if (sec > 1)
1546: texivspace(p);
1.23 kristaps 1547: teximacroopen(p, sects[sec]);
1.46 kristaps 1548: parseeoln(p, pos);
1.5 kristaps 1549: teximacroclose(p);
1.34 kristaps 1550: if (sec > 1)
1551: texivspace(p);
1.1 kristaps 1552: }
1553:
1554: static void
1.46 kristaps 1555: dosecoffs(struct texi *p, enum texicmd cmd, size_t *pos)
1.23 kristaps 1556: {
1557:
1558: if (TEXICMD_RAISESECTIONS == cmd)
1559: p->secoffs++;
1560: else
1561: p->secoffs--;
1562: }
1563:
1564: static void
1.46 kristaps 1565: dosection(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1566: {
1.23 kristaps 1567: int sec;
1.12 kristaps 1568:
1569: switch (cmd) {
1.55 kristaps 1570: case (TEXICMD_TOP):
1571: sec = 0;
1572: break;
1.12 kristaps 1573: case (TEXICMD_APPENDIX):
1574: case (TEXICMD_CHAPTER):
1575: case (TEXICMD_UNNUMBERED):
1.23 kristaps 1576: sec = sectioner(p, 0);
1.12 kristaps 1577: break;
1578: case (TEXICMD_APPENDIXSEC):
1579: case (TEXICMD_HEADING):
1580: case (TEXICMD_SECTION):
1581: case (TEXICMD_UNNUMBEREDSEC):
1.23 kristaps 1582: sec = sectioner(p, 1);
1.12 kristaps 1583: break;
1584: default:
1585: abort();
1586: }
1.1 kristaps 1587:
1.3 kristaps 1588: if (p->outmacro)
1.23 kristaps 1589: texierr(p, "\"%s\" in open line scope!?", sects[sec]);
1.3 kristaps 1590: else if (p->literal)
1.23 kristaps 1591: texierr(p, "\"%s\" in a literal scope!?", sects[sec]);
1.3 kristaps 1592:
1.55 kristaps 1593: if (0 == sec && NULL != p->chapters) {
1594: teximdocclose(p, 0);
1.56 kristaps 1595: teximdocopen(p, pos);
1.55 kristaps 1596: }
1597:
1.23 kristaps 1598: teximacroopen(p, sects[sec]);
1.46 kristaps 1599: parseeoln(p, pos);
1.3 kristaps 1600: teximacroclose(p);
1.11 kristaps 1601: p->seenvs = 1;
1.3 kristaps 1602: }
1603:
1604: static void
1.55 kristaps 1605: dotop(struct texi *p, enum texicmd cmd, size_t *pos)
1606: {
1607:
1608: if (--p->ign)
1609: texierr(p, "@top command while ignoring");
1610:
1611: if (NULL == p->chapters)
1.56 kristaps 1612: teximdocopen(p, pos);
1.55 kristaps 1613: dosection(p, cmd, pos);
1614: }
1615:
1616: static void
1.46 kristaps 1617: dosp(struct texi *p, enum texicmd cmd, size_t *pos)
1.3 kristaps 1618: {
1619:
1.57 kristaps 1620: advanceeoln(p, pos, 1);
1.37 kristaps 1621: if (p->literal)
1622: texiputchar(p, '\n');
1623: else
1624: texivspace(p);
1.1 kristaps 1625: }
1626:
1627: static void
1.46 kristaps 1628: doitem(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1629: {
1630:
1.18 kristaps 1631: /* Multitable is using raw tbl(7). */
1632: if (TEXILIST_TABLE == p->list) {
1633: texiputchar(p, '\n');
1634: return;
1635: }
1636:
1.3 kristaps 1637: if (p->outmacro)
1638: texierr(p, "item in open line scope!?");
1639: else if (p->literal)
1640: texierr(p, "item in a literal scope!?");
1641:
1642: switch (p->list) {
1643: case (TEXILIST_ITEM):
1.5 kristaps 1644: teximacroopen(p, "It");
1.3 kristaps 1645: break;
1646: case (TEXILIST_NOITEM):
1.5 kristaps 1647: teximacro(p, "It");
1.3 kristaps 1648: break;
1649: default:
1.11 kristaps 1650: texivspace(p);
1.3 kristaps 1651: break;
1652: }
1.18 kristaps 1653:
1654: /* Trick so we don't start with Pp. */
1.11 kristaps 1655: p->seenvs = 1;
1.46 kristaps 1656: parseeoln(p, pos);
1.1 kristaps 1657:
1.3 kristaps 1658: if (TEXILIST_ITEM == p->list)
1659: teximacroclose(p);
1.9 kristaps 1660: else if (p->outcol > 0)
1.1 kristaps 1661: texiputchar(p, '\n');
1.18 kristaps 1662: }
1663:
1664: static void
1.46 kristaps 1665: dotab(struct texi *p, enum texicmd cmd, size_t *pos)
1.18 kristaps 1666: {
1667:
1668: /* This command is only useful in @multitable. */
1669: if (TEXILIST_TABLE == p->list)
1670: texiputchar(p, '\t');
1671: }
1672:
1673: static void
1.46 kristaps 1674: domultitable(struct texi *p, enum texicmd cmd, size_t *pos)
1.18 kristaps 1675: {
1676: enum texilist sv = p->list;
1.32 kristaps 1677: int svliteral = p->literal;
1.18 kristaps 1678: enum texicmd type;
1679: size_t i, end, columns;
1680:
1681: p->list = TEXILIST_TABLE;
1.32 kristaps 1682: /*
1683: * TS/TE blocks aren't "in mdoc(7)", so we can disregard the
1684: * fact that we're in literal mode right now.
1685: */
1686: p->literal = 0;
1.18 kristaps 1687: teximacro(p, "TS");
1688: columns = 0;
1689:
1690: /* Advance to the first argument... */
1.46 kristaps 1691: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1692: advance(p, pos);
1.18 kristaps 1693:
1694: /* Make sure we don't print anything when scanning. */
1695: p->ign++;
1.57 kristaps 1696: if (*pos < BUFSZ(p) && '@' == BUF(p)[*pos]) {
1.18 kristaps 1697: /*
1698: * Look for @columnfractions.
1699: * We ignore these, but we do use the number of
1700: * arguments to set the number of columns that we'll
1701: * have.
1702: */
1.46 kristaps 1703: type = texicmd(p, *pos, &end, NULL);
1704: advanceto(p, pos, end);
1.18 kristaps 1705: if (TEXICMD_COLUMNFRACTIONS != type)
1.25 kristaps 1706: texierr(p, "unknown multitable command");
1.46 kristaps 1707: while (*pos < BUFSZ(p) && '\n' != BUF(p)[*pos]) {
1708: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1709: advance(p, pos);
1710: while (*pos < BUFSZ(p) && ! isws(BUF(p)[*pos])) {
1711: if ('\n' == BUF(p)[*pos])
1.18 kristaps 1712: break;
1.46 kristaps 1713: advance(p, pos);
1.18 kristaps 1714: }
1715: columns++;
1716: }
1717: } else
1718: /*
1719: * We have arguments.
1720: * We could parse these, but it's easier to just let
1721: * tbl(7) figure it out.
1722: * So use this only to count arguments.
1723: */
1.46 kristaps 1724: while (parselinearg(p, pos) > 0)
1.18 kristaps 1725: columns++;
1726: p->ign--;
1727:
1728: /* Left-justify each table entry. */
1729: for (i = 0; i < columns; i++) {
1730: if (i > 0)
1731: texiputchar(p, ' ');
1732: texiputchar(p, 'l');
1733: }
1734: texiputchars(p, ".\n");
1735: p->outmacro++;
1.46 kristaps 1736: parseto(p, pos, texitoks[cmd].tok);
1.18 kristaps 1737: p->outmacro--;
1738: teximacro(p, "TE");
1.32 kristaps 1739: p->literal = svliteral;
1.18 kristaps 1740: p->list = sv;
1.1 kristaps 1741: }
1742:
1743: static void
1.46 kristaps 1744: dotable(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1745: {
1.3 kristaps 1746: enum texilist sv = p->list;
1747:
1.57 kristaps 1748: advanceeoln(p, pos, 1);
1749:
1.3 kristaps 1750: p->list = TEXILIST_ITEM;
1.5 kristaps 1751: teximacro(p, "Bl -tag -width Ds");
1.11 kristaps 1752: p->seenvs = 1;
1.46 kristaps 1753: parseto(p, pos, texitoks[cmd].tok);
1.5 kristaps 1754: teximacro(p, "El");
1.3 kristaps 1755: p->list = sv;
1.44 kristaps 1756: }
1757:
1758: static void
1.46 kristaps 1759: doend(struct texi *p, enum texicmd cmd, size_t *pos)
1.44 kristaps 1760: {
1761: size_t start;
1762:
1.46 kristaps 1763: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1764: advance(p, pos);
1.44 kristaps 1765: start = *pos;
1.46 kristaps 1766: while (*pos < BUFSZ(p) && '\n' != BUF(p)[*pos])
1767: advance(p, pos);
1.44 kristaps 1768:
1.56 kristaps 1769: texiwarn(p, "unexpected \"end\": %.*s",
1770: (int)(*pos - start), &BUF(p)[start]);
1.46 kristaps 1771: advanceeoln(p, pos, 1);
1.1 kristaps 1772: }
1773:
1774: static void
1.46 kristaps 1775: doenumerate(struct texi *p, enum texicmd cmd, size_t *pos)
1.2 kristaps 1776: {
1.3 kristaps 1777: enum texilist sv = p->list;
1.2 kristaps 1778:
1.57 kristaps 1779: advanceeoln(p, pos, 1);
1780:
1.3 kristaps 1781: p->list = TEXILIST_NOITEM;
1.5 kristaps 1782: teximacro(p, "Bl -enum");
1.11 kristaps 1783: p->seenvs = 1;
1.57 kristaps 1784: parseto(p, pos, texitoks[cmd].tok);
1.5 kristaps 1785: teximacro(p, "El");
1.3 kristaps 1786: p->list = sv;
1.2 kristaps 1787: }
1788:
1789: static void
1.46 kristaps 1790: doitemize(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1791: {
1.3 kristaps 1792: enum texilist sv = p->list;
1.1 kristaps 1793:
1.57 kristaps 1794: advanceeoln(p, pos, 1);
1795:
1.21 kristaps 1796: p->list = TEXILIST_NOITEM;
1.5 kristaps 1797: teximacro(p, "Bl -bullet");
1.11 kristaps 1798: p->seenvs = 1;
1.57 kristaps 1799: parseto(p, pos, texitoks[cmd].tok);
1.5 kristaps 1800: teximacro(p, "El");
1.3 kristaps 1801: p->list = sv;
1.1 kristaps 1802: }
1803:
1804: static void
1.46 kristaps 1805: doignbracket(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1806: {
1807:
1.3 kristaps 1808: p->ign++;
1.53 kristaps 1809: parsebracket(p, pos, 0);
1.3 kristaps 1810: p->ign--;
1.1 kristaps 1811: }
1812:
1813: static void
1.46 kristaps 1814: doignline(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1815: {
1816:
1.57 kristaps 1817: advanceeoln(p, pos, 1);
1.1 kristaps 1818: }
1819:
/*
 * Build an array of directory names.
 * If "base" is not NULL, a copy of it becomes the first entry.
 * If "cp" is not NULL, it is split on ':' and a copy of every piece
 * (empty pieces included) is appended in order.
 * The number of entries is stored in "sz"; the return value is NULL
 * when there are none.
 * Allocation failure is reported through texiabort().
 * No sanitising of the directory names is performed.
 */
static char **
parsedirs(struct texi *p, const char *base, const char *cp, size_t *sz)
{
	char		*copy, *rest, *entry;
	const char	*scan;
	char		**dirs;
	size_t		 n, filled;

	/* One slot for "base", plus one per ':'-separated piece of "cp". */
	n = (NULL != base) ? 1 : 0;
	if (NULL != cp) {
		n++;
		scan = strchr(cp, ':');
		while (NULL != scan) {
			n++;
			scan = strchr(scan + 1, ':');
		}
	}
	*sz = n;

	if (0 == n)
		return(NULL);

	dirs = calloc(n, sizeof(char *));
	if (NULL == dirs)
		texiabort(p, NULL);

	filled = 0;
	if (NULL != base) {
		dirs[filled] = strdup(base);
		if (NULL == dirs[filled])
			texiabort(p, NULL);
		filled++;
	}

	if (NULL == cp)
		return(dirs);

	/* strsep() writes into its input, so split a private copy. */
	copy = strdup(cp);
	if (NULL == copy)
		texiabort(p, NULL);

	rest = copy;
	while (NULL != (entry = strsep(&rest, ":"))) {
		dirs[filled] = strdup(entry);
		if (NULL == dirs[filled])
			texiabort(p, NULL);
		filled++;
	}

	free(copy);
	return(dirs);
}
1858:
1.1 kristaps 1859: int
1860: main(int argc, char *argv[])
1861: {
1862: struct texi texi;
1.2 kristaps 1863: int c;
1.37 kristaps 1864: char *dirpath, *dir, *ccp;
1.10 kristaps 1865: const char *progname, *Idir, *cp;
1.1 kristaps 1866:
1867: progname = strrchr(argv[0], '/');
1868: if (progname == NULL)
1869: progname = argv[0];
1870: else
1871: ++progname;
1872:
1.10 kristaps 1873: memset(&texi, 0, sizeof(struct texi));
1.40 kristaps 1874: texi.ign = 1;
1.55 kristaps 1875: texi.outfile = stdout;
1.5 kristaps 1876: Idir = NULL;
1.10 kristaps 1877:
1.55 kristaps 1878: while (-1 != (c = getopt(argc, argv, "C:I:")))
1.1 kristaps 1879: switch (c) {
1.55 kristaps 1880: case ('C'):
1881: texi.chapters = optarg;
1882: break;
1.5 kristaps 1883: case ('I'):
1884: Idir = optarg;
1885: break;
1.1 kristaps 1886: default:
1887: goto usage;
1888: }
1889:
1890: argv += optind;
1.40 kristaps 1891: argc -= optind;
1.1 kristaps 1892:
1.40 kristaps 1893: if (argc > 0) {
1894: if (NULL == (dirpath = strdup(argv[0])))
1895: texiabort(&texi, NULL);
1896: if (NULL == (dir = dirname(dirpath)))
1897: texiabort(&texi, NULL);
1898: if (NULL != (cp = strrchr(argv[0], '/')))
1899: texi.title = strdup(cp + 1);
1900: else
1901: texi.title = strdup(argv[0]);
1902: if (NULL == texi.title)
1903: texiabort(&texi, NULL);
1904: else if (NULL != (ccp = strchr(texi.title, '.')))
1905: *ccp = '\0';
1906: texi.dirs = parsedirs(&texi, dir, Idir, &texi.dirsz);
1907: free(dirpath);
1908: parsefile(&texi, argv[0], 1);
1909: } else {
1910: texi.title = strdup("Unknown Manual");
1911: texi.dirs = parsedirs(&texi, NULL, Idir, &texi.dirsz);
1912: parsestdin(&texi);
1913: }
1.27 kristaps 1914:
1.2 kristaps 1915: texiexit(&texi);
1.56 kristaps 1916: exit(EXIT_SUCCESS);
1.1 kristaps 1917: usage:
1.55 kristaps 1918: fprintf(stderr, "usage: %s [-Cdir] [-Idirs] [file]\n", progname);
1.1 kristaps 1919: return(EXIT_FAILURE);
1920: }
CVSweb