Annotation of texi2mdoc/main.c, Revision 1.57
1.57 ! kristaps 1: /* $Id: main.c,v 1.56 2015/03/01 13:39:51 kristaps Exp $ */
1.1 kristaps 2: /*
3: * Copyright (c) 2015 Kristaps Dzonsons <kristaps@bsd.lv>
4: *
5: * Permission to use, copy, modify, and distribute this software for any
6: * purpose with or without fee is hereby granted, provided that the above
7: * copyright notice and this permission notice appear in all copies.
8: *
9: * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
10: * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
11: * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
12: * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
13: * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
14: * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
15: * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
16: */
1.37 kristaps 17: #if defined(__linux__) || defined(__MINT__)
18: # define _GNU_SOURCE /* memmem */
19: #endif
1.1 kristaps 20: #include <assert.h>
21: #include <ctype.h>
22: #include <getopt.h>
1.2 kristaps 23: #include <libgen.h>
24: #include <limits.h>
1.1 kristaps 25: #include <stdarg.h>
26: #include <stdio.h>
27: #include <stdlib.h>
28: #include <string.h>
1.47 kristaps 29: #include <unistd.h>
1.1 kristaps 30:
1.24 kristaps 31: #include "extern.h"
1.1 kristaps 32:
/*
 * Table of four mdoc macro names; SECTSZ is the number of entries.
 * NOTE(review): presumably indexed by sectioning depth by the section
 * handlers (dosection, dosubsection, dosubsubsection, dosecoffs), which
 * are defined outside this excerpt -- confirm against their bodies.
 */
#define	SECTSZ 4
static	const char *const sects[SECTSZ] = {
	"Sh",
	"Ss",
	"Em",
	"No",
};
40:
/*
 * Command handlers.
 * All handlers share one signature so that they can be stored in the
 * command table below: the parser state, the command being handled, and
 * a pointer to the current offset into the input buffer, which the
 * handler moves forward as it consumes input.
 */
static	void doaccent(struct texi *, enum texicmd, size_t *);
static	void doblock(struct texi *, enum texicmd, size_t *);
static	void dobracket(struct texi *, enum texicmd, size_t *);
static	void dobye(struct texi *, enum texicmd, size_t *);
static	void dodefindex(struct texi *, enum texicmd, size_t *);
static	void dodefn(struct texi *, enum texicmd, size_t *);
static	void dodisplay(struct texi *, enum texicmd, size_t *);
static	void doend(struct texi *, enum texicmd, size_t *);
static	void doenumerate(struct texi *, enum texicmd, size_t *);
static	void doexample(struct texi *, enum texicmd, size_t *);
static	void doignargn(struct texi *, enum texicmd, size_t *);
static	void doignblock(struct texi *, enum texicmd, size_t *);
static	void doignbracket(struct texi *, enum texicmd, size_t *);
static	void doignline(struct texi *, enum texicmd, size_t *);
static	void doinline(struct texi *, enum texicmd, size_t *);
static	void doinclude(struct texi *, enum texicmd, size_t *);
static	void doitem(struct texi *, enum texicmd, size_t *);
static	void doitemize(struct texi *, enum texicmd, size_t *);
static	void dolink(struct texi *, enum texicmd, size_t *);
static	void domacro(struct texi *, enum texicmd, size_t *);
static	void domath(struct texi *, enum texicmd, size_t *);
static	void domultitable(struct texi *, enum texicmd, size_t *);
static	void doquotation(struct texi *, enum texicmd, size_t *);
static	void dotable(struct texi *, enum texicmd, size_t *);
static	void dotop(struct texi *, enum texicmd, size_t *);
static	void dosecoffs(struct texi *, enum texicmd, size_t *);
static	void dosection(struct texi *, enum texicmd, size_t *);
static	void dosp(struct texi *, enum texicmd, size_t *);
static	void dosubsection(struct texi *, enum texicmd, size_t *);
static	void dosubsubsection(struct texi *, enum texicmd, size_t *);
static	void dosymbol(struct texi *, enum texicmd, size_t *);
static	void dotab(struct texi *, enum texicmd, size_t *);
static	void dotitle(struct texi *, enum texicmd, size_t *);
static	void dovalue(struct texi *, enum texicmd, size_t *);
static	void doverb(struct texi *, enum texicmd, size_t *);
static	void doverbatim(struct texi *, enum texicmd, size_t *);
static	void doverbinclude(struct texi *, enum texicmd, size_t *);
1.1 kristaps 78:
/*
 * Command table, indexed by enum texicmd (e.g. texitoks[cmd].tok).
 * Each row holds the handler for the command, the command name as it
 * is written after the '@', and the length of that name in bytes.
 * The rows are positional: the trailing comment on each row names the
 * enum texicmd value the row is meant to line up with, so rows must be
 * kept in the same order as the enumeration (declared in extern.h,
 * not visible here).
 * NOTE(review): identifiers beginning with a double underscore are
 * reserved for the implementation; consider renaming __texitoks once
 * all users in this file have been checked.
 */
static	const struct texitok __texitoks[TEXICMD__MAX] = {
	/* TEXICMD__BEGIN */
	{ doignline, "afourpaper", 10 }, /* TEXICMD_A4PAPER */
	{ dosymbol, "AA", 2 }, /* TEXICMD_AA */
	{ dosymbol, "aa", 2 }, /* TEXICMD_AASMALL */
	{ doignargn, "acronym", 7 }, /* TEXICMD_ACRONYM */
	{ doaccent, "'", 1 }, /* TEXICMD_ACUTE */
	{ dosymbol, "AE", 2 }, /* TEXICMD_AE */
	{ dosymbol, "ae", 2 }, /* TEXICMD_AESMALL */
	{ doignbracket, "anchor", 6 }, /* TEXICMD_ANCHOR */
	{ dosection, "appendix", 8 }, /* TEXICMD_APPENDIX */
	{ dosection, "appendixsec", 11 }, /* TEXICMD_APPENDIXSEC */
	{ dosubsection, "appendixsubsec", 14 }, /* TEXICMD_APPENDIXSUBSEC */
	{ dosubsubsection, "appendixsubsubsec", 17 }, /* TEXICMD_APPENDIXSUBSUBSEC */
	{ doinline, "asis", 4 }, /* TEXICMD_ASIS */
	{ dosymbol, "*", 1 }, /* TEXICMD_ASTERISK */
	{ dosymbol, "@", 1 }, /* TEXICMD_AT */
	{ doignline, "author", 6 }, /* TEXICMD_AUTHOR */
	/* NOTE(review): doinline() tests TEXICMD_B; confirm the enum name. */
	{ doinline, "b", 1 }, /* TEXICMD_BOLD */
	{ dosymbol, "!", 1 }, /* TEXICMD_BANG */
	{ dosymbol, "bullet", 6 }, /* TEXICMD_BULLET */
	{ dobye, "bye", 3 }, /* TEXICMD_BYE */
	{ doblock, "cartouche", 9 }, /* TEXICMD_CARTOUCHE */
	{ doaccent, ",", 1 }, /* TEXICMD_CEDILLA */
	{ doignline, "center", 6 }, /* TEXICMD_CENTER */
	{ dosection, "chapter", 7 }, /* TEXICMD_CHAPTER */
	{ doignline, "cindex", 6 }, /* TEXICMD_CINDEX */
	{ doaccent, "^", 1 }, /* TEXICMD_CIRCUMFLEX */
	{ doinline, "cite", 4 }, /* TEXICMD_CITE */
	{ dovalue, "clear", 5 }, /* TEXICMD_CLEAR */
	{ doinline, "code", 4 }, /* TEXICMD_CODE */
	{ dosymbol, ":", 1 }, /* TEXICMD_COLON */
	/* No handler of its own: this row has a NULL function pointer. */
	{ NULL, "columnfractions", 15 }, /* TEXICMD_COLUMNFRACTIONS */
	{ dosymbol, "comma", 5 }, /* TEXICMD_COMMA */
	{ doinline, "command", 7 }, /* TEXICMD_COMMAND */
	{ doignline, "c", 1 }, /* TEXICMD_COMMENT */
	{ doignline, "comment", 7 }, /* TEXICMD_COMMENT_LONG */
	{ doignline, "contents", 8 }, /* TEXICMD_CONTENTS */
	{ doignblock, "copying", 7 }, /* TEXICMD_COPYING */
	{ dosymbol, "copyright", 9 }, /* TEXICMD_COPYRIGHT */
	{ dodefindex, "defcodeindex", 12 }, /* TEXICMD_DEFCODEINDEX */
	{ dodefn, "deffn", 5 }, /* TEXICMD_DEFFN */
	{ dodefn, "deffnx", 6 }, /* TEXICMD_DEFFNX */
	{ dodefindex, "defindex", 8 }, /* TEXICMD_DEFINDEX */
	{ dodefn, "defmac", 6 }, /* TEXICMD_DEFMAC */
	{ dodefn, "defmacx", 7 }, /* TEXICMD_DEFMACX */
	{ dodefn, "deftp", 5 }, /* TEXICMD_DEFTP */
	{ dodefn, "deftpx", 6 }, /* TEXICMD_DEFTPX */
	{ dodefn, "deftypefn", 9 }, /* TEXICMD_DEFTYPEFN */
	{ dodefn, "deftypefnx", 10 }, /* TEXICMD_DEFTYPEFNX */
	{ dodefn, "deftypefun", 10 }, /* TEXICMD_DEFTYPEFUN */
	{ dodefn, "deftypefunx", 11 }, /* TEXICMD_DEFTYPEFUNX */
	{ dodefn, "deftypemethod", 13 }, /* TEXICMD_DEFTYPEMETHOD */
	{ dodefn, "deftypemethodx", 14 }, /* TEXICMD_DEFTYPEMETHODX */
	{ dodefn, "deftypevar", 10 }, /* TEXICMD_DEFTYPEVAR */
	{ dodefn, "deftypevarx", 11 }, /* TEXICMD_DEFTYPEVARX */
	{ dodefn, "deftypevr", 9 }, /* TEXICMD_DEFTYPEVR */
	{ dodefn, "deftypevrx", 10 }, /* TEXICMD_DEFTYPEVRX */
	{ dodefn, "defun", 5 }, /* TEXICMD_DEFUN */
	{ dodefn, "defunx", 6 }, /* TEXICMD_DEFUNX */
	{ dodefn, "defvar", 6 }, /* TEXICMD_DEFVAR */
	{ dodefn, "defvarx", 7 }, /* TEXICMD_DEFVARX */
	{ dodefn, "defvr", 5 }, /* TEXICMD_DEFVR */
	{ dodefn, "defvrx", 6 }, /* TEXICMD_DEFVRX */
	{ doignblock, "detailmenu", 10 }, /* TEXICMD_DETAILMENU */
	{ doinline, "dfn", 3 }, /* TEXICMD_DFN */
	{ dosymbol, "DH", 2 }, /* TEXICMD_DH */
	{ dosymbol, "dh", 2 }, /* TEXICMD_DHSMALL */
	{ doignline, "dircategory", 11 }, /* TEXICMD_DIRCATEGORY */
	{ doignblock, "direntry", 8 }, /* TEXICMD_DIRENTRY */
	{ dodisplay, "display", 7 }, /* TEXICMD_DISPLAY */
	{ doignbracket, "dmn", 3 }, /* TEXICMD_DMN */
	{ doignblock, "documentdescription", 19 }, /* TEXICMD_DOCUMENTDESCRIPTION */
	{ doignline, "documentencoding", 16 }, /* TEXICMD_DOCUMENTENCODING */
	{ doignline, "documentlanguage", 16 }, /* TEXICMD_DOCUMENTLANGUAGE */
	{ doaccent, "dotaccent", 9 }, /* TEXICMD_DOTACCENT */
	{ doaccent, "dotless", 7 }, /* TEXICMD_DOTLESS */
	{ dosymbol, "dots", 4 }, /* TEXICMD_DOTS */
	{ dolink, "email", 5 }, /* TEXICMD_EMAIL */
	{ doinline, "emph", 4 }, /* TEXICMD_EMPH */
	{ doend, "end", 3 }, /* TEXICMD_END */
	{ dosymbol, "enddots", 7 }, /* TEXICMD_ENDDOTS */
	{ doenumerate, "enumerate", 9 }, /* TEXICMD_ENUMERATE */
	{ doinline, "env", 3 }, /* TEXICMD_ENV */
	{ dosymbol, "equiv", 5 }, /* TEXICMD_EQUIV */
	{ dosymbol, "error", 5 }, /* TEXICMD_ERROR */
	{ dosymbol, "euro", 4 }, /* TEXICMD_EURO */
	{ doexample, "example", 7 }, /* TEXICMD_EXAMPLE */
	{ dosymbol, "exclamdown", 10 }, /* TEXICMD_EXCLAMDOWN */
	{ doignline, "exdent", 6 }, /* TEXICMD_EXDENT */
	{ dosymbol, "expansion", 9 }, /* TEXICMD_EXPANSION */
	{ doinline, "file", 4 }, /* TEXICMD_FILE */
	{ doignline, "finalout", 8 }, /* TEXICMD_FINALOUT */
	{ doignline, "findex", 6 }, /* TEXICMD_FINDEX */
	{ doblock, "flushleft", 9 }, /* TEXICMD_FLUSHLEFT */
	{ doblock, "flushright", 10 }, /* TEXICMD_FLUSHRIGHT */
	{ doignline, "firstparagraphindent", 20 }, /* TEXICMD_FIRSTPARAGRAPHINDENT */
	{ doignbracket, "footnote", 8 }, /* TEXICMD_FOOTNOTE */
	{ doignline, "footnotestyle", 13 }, /* TEXICMD_FOOTNOTESTYLE */
	{ dotable, "ftable", 6 }, /* TEXICMD_FTABLE */
	{ dodisplay, "format", 6 }, /* TEXICMD_FORMAT */
	{ dosymbol, "geq", 3 }, /* TEXICMD_GEQ */
	{ doaccent, "`", 1 }, /* TEXICMD_GRAVE */
	{ doblock, "group", 5 }, /* TEXICMD_GROUP */
	{ dosymbol, "guillemetleft", 13 }, /* TEXICMD_GUILLEMETLEFT */
	{ dosymbol, "guillemetright", 14 }, /* TEXICMD_GUILLEMETRIGHT */
	{ dosymbol, "guillemotleft", 13 }, /* TEXICMD_GUILLEMOTLEFT */
	{ dosymbol, "guillemotright", 14 }, /* TEXICMD_GUILLEMOTRIGHT */
	{ dosymbol, "guilsinglleft", 13 }, /* TEXICMD_GUILSINGLLEFT */
	{ dosymbol, "guilsinglright", 14 }, /* TEXICMD_GUILSINGLRIGHT */
	{ doaccent, "H", 1 }, /* TEXICMD_H */
	{ dosection, "heading", 7 }, /* TEXICMD_HEADING */
	{ doignline, "headings", 8 }, /* TEXICMD_HEADINGS */
	{ doitem, "headitem", 8 }, /* TEXICMD_HEADITEM */
	{ doignblock, "html", 4 }, /* TEXICMD_HTML */
	{ dosymbol, "-", 1 }, /* TEXICMD_HYPHEN */
	{ doinline, "i", 1 }, /* TEXICMD_I */
	{ dovalue, "ifclear", 7 }, /* TEXICMD_IFCLEAR */
	{ doignblock, "ifdocbook", 9 }, /* TEXICMD_IFDOCBOOK */
	{ doignblock, "ifhtml", 6 }, /* TEXICMD_IFHTML */
	{ doblock, "ifinfo", 6 }, /* TEXICMD_IFINFO */
	{ doblock, "ifnotdocbook", 12 }, /* TEXICMD_IFNOTDOCBOOK */
	{ doblock, "ifnothtml", 9 }, /* TEXICMD_IFNOTHTML */
	{ doblock, "ifnotinfo", 9 }, /* TEXICMD_IFNOTINFO */
	{ doignblock, "ifnotplaintext", 14 }, /* TEXICMD_IFNOTPLAINTEXT */
	{ doblock, "ifnottex", 8 }, /* TEXICMD_IFNOTTEX */
	{ doblock, "ifnotxml", 8 }, /* TEXICMD_IFNOTXML */
	{ doblock, "ifplaintext", 11 }, /* TEXICMD_IFPLAINTEXT */
	{ doignblock, "iftex", 5 }, /* TEXICMD_IFTEX */
	{ dovalue, "ifset", 5 }, /* TEXICMD_IFSET */
	{ doignblock, "ifxml", 5 }, /* TEXICMD_IFXML */
	{ doignblock, "ignore", 6 }, /* TEXICMD_IGNORE */
	{ doignbracket, "image", 5 }, /* TEXICMD_IMAGE */
	{ doinclude, "include", 7 }, /* TEXICMD_INCLUDE */
	{ dodisplay, "indentblock", 11 }, /* TEXICMD_INDENTBLOCK */
	{ dolink, "indicateurl", 11 }, /* TEXICMD_INDICATEURL */
	{ dolink, "inforef", 7 }, /* TEXICMD_INFOREF */
	{ doignline, "insertcopying", 13 }, /* TEXICMD_INSERTCOPYING */
	{ doitem, "item", 4 }, /* TEXICMD_ITEM */
	{ doitemize, "itemize", 7 }, /* TEXICMD_ITEMIZE */
	{ doitem, "itemx", 5 }, /* TEXICMD_ITEMX */
	{ doinline, "kbd", 3 }, /* TEXICMD_KBD */
	{ dobracket, "key", 3 }, /* TEXICMD_KEY */
	{ doignline, "kindex", 6 }, /* TEXICMD_KINDEX */
	{ dosymbol, "L", 1 }, /* TEXICMD_L */
	{ dosymbol, "LaTeX", 5 }, /* TEXICMD_LATEX */
	{ dosymbol, "leq", 3 }, /* TEXICMD_LEQ */
	{ dosecoffs, "lowersections", 13 }, /* TEXICMD_LOWERSECTIONS */
	{ dosymbol, "l", 1 }, /* TEXICMD_LSMALL */
	{ domacro, "macro", 5 }, /* TEXICMD_MACRO */
	{ doaccent, "=", 1 }, /* TEXICMD_MACRON */
	{ domath, "math", 4 }, /* TEXICMD_MATH */
	{ doignblock, "menu", 4 }, /* TEXICMD_MENU */
	{ dosymbol, "minus", 5 }, /* TEXICMD_MINUS */
	{ domultitable, "multitable", 10 }, /* TEXICMD_MULTITABLE */
	{ doignline, "need", 4 }, /* TEXICMD_NEED */
	{ dosymbol, "\n", 1 }, /* TEXICMD_NEWLINE */
	{ doignline, "node", 4 }, /* TEXICMD_NODE */
	{ doignline, "noindent", 8 }, /* TEXICMD_NOINDENT */
	{ dosymbol, "O", 1 }, /* TEXICMD_O */
	{ dosymbol, "OE", 2 }, /* TEXICMD_OE */
	{ dosymbol, "oe", 2 }, /* TEXICMD_OESMALL */
	{ doaccent, "ogonek", 6 }, /* TEXICMD_OGONEK */
	{ doinline, "option", 6 }, /* TEXICMD_OPTION */
	{ dosymbol, "ordf", 4 }, /* TEXICMD_ORDF */
	{ dosymbol, "ordm", 4 }, /* TEXICMD_ORDM */
	{ dosymbol, "o", 1 }, /* TEXICMD_OSMALL */
	{ doignline, "page", 4 }, /* TEXICMD_PAGE */
	{ doignline, "paragraphindent", 15 }, /* TEXICMD_PARINDENT */
	{ dosymbol, ".", 1 }, /* TEXICMD_PERIOD */
	{ doignline, "pindex", 6 }, /* TEXICMD_PINDEX */
	{ dosymbol, "pounds", 6 }, /* TEXICMD_POUNDS */
	{ doignline, "printindex", 10 }, /* TEXICMD_PRINTINDEX */
	{ dolink, "pxref", 5 }, /* TEXICMD_PXREF */
	{ dosymbol, "questiondown", 12 }, /* TEXICMD_QUESTIONDOWN */
	{ dosymbol, "?", 1 }, /* TEXICMD_QUESTIONMARK */
	{ doquotation, "quotation", 9 }, /* TEXICMD_QUOTATION */
	{ dosymbol, "quotedblbase", 12 }, /* TEXICMD_QUOTEDBLBASE */
	{ dosymbol, "quotedblleft", 12 }, /* TEXICMD_QUOTEDBLLEFT */
	{ dosymbol, "quotedblright", 13 }, /* TEXICMD_QUOTEDBLRIGHT */
	{ dosymbol, "quotesinglbase", 14 }, /* TEXICMD_QUOTESINGLBASE */
	{ dosymbol, "quoteleft", 9 }, /* TEXICMD_QUOTELEFT */
	{ dosymbol, "quoteright", 10 }, /* TEXICMD_QUOTERIGHT */
	{ doinline, "r", 1 }, /* TEXICMD_R */
	{ dosecoffs, "raisesections", 13 }, /* TEXICMD_RAISESECTIONS */
	{ dobracket, "ref", 3 }, /* TEXICMD_REF */
	{ doignline, "refill", 6 }, /* TEXICMD_REFILL */
	{ dosymbol, "registeredsymbol", 16 }, /* TEXICMD_REGISTEREDSYMBOL */
	{ dosymbol, "result", 6 }, /* TEXICMD_RESULT */
	{ doaccent, "ringaccent", 10 }, /* TEXICMD_RINGACCENT */
	{ doinline, "samp", 4 }, /* TEXICMD_SAMP */
	{ doinline, "sansserif", 9 }, /* TEXICMD_SANSSERIF */
	{ dobracket, "sc", 2 }, /* TEXICMD_SC */
	{ dosection, "section", 7 }, /* TEXICMD_SECTION */
	{ dovalue, "set", 3 }, /* TEXICMD_SET */
	{ doignline, "setchapternewpage", 17 }, /* TEXICMD_SETCHAPNEWPAGE */
	{ doignline, "setcontentsaftertitlepage", 25 }, /* TEXICMD_SETCONTENTSAFTER */
	{ doignline, "setfilename", 11 }, /* TEXICMD_SETFILENAME */
	{ dotitle, "settitle", 8 }, /* TEXICMD_SETTITLE */
	{ doignline, "shortcontents", 13 }, /* TEXICMD_SHORTCONTENTS */
	{ doinline, "slanted", 7 }, /* TEXICMD_SLANTED */
	{ dosymbol, "/", 1 }, /* TEXICMD_SLASH */
	{ dosp, "sp", 2 }, /* TEXICMD_SP */
	{ dosymbol, " ", 1 }, /* TEXICMD_SPACE */
	{ doignline, "smallbook", 9 }, /* TEXICMD_SMALLBOOK */
	{ dodisplay, "smalldisplay", 12 }, /* TEXICMD_SMALLDISPLAY */
	{ doexample, "smallexample", 12 }, /* TEXICMD_SMALLEXAMPLE */
	{ dodisplay, "smallformat", 11 }, /* TEXICMD_SMALLFORMAT */
	{ dodisplay, "smallindentblock", 16 }, /* TEXICMD_SMALLINDENTBLOCK */
	{ dosymbol, "{", 1 }, /* TEXICMD_SQUIGGLE_LEFT */
	{ dosymbol, "}", 1 }, /* TEXICMD_SQUIGGLE_RIGHT */
	{ dosymbol, "ss", 2 }, /* TEXICMD_SS */
	{ doinline, "strong", 6 }, /* TEXICMD_STRONG */
	{ dosubsection, "subheading", 10 }, /* TEXICMD_SUBHEADING */
	{ dosubsection, "subsection", 10 }, /* TEXICMD_SUBSECTION */
	{ dosubsubsection, "subsubheading", 13 }, /* TEXICMD_SUBSUBHEADING */
	{ dosubsubsection, "subsubsection", 13 }, /* TEXICMD_SUBSUBSECTION */
	{ doignline, "subtitle", 8 }, /* TEXICMD_SUBTITLE */
	{ doignline, "summarycontents", 15 }, /* TEXICMD_SUMMARYCONTENTS */
	{ dodefindex, "synindex", 8 }, /* TEXICMD_SYNINDEX */
	{ dodefindex, "syncodeindex", 12 }, /* TEXICMD_SYNCODEINDEX */
	{ doinline, "t", 1 }, /* TEXICMD_T */
	{ dotab, "tab", 3 }, /* TEXICMD_TAB */
	{ dosymbol, "\t", 1 }, /* TEXICMD_TABSYM */
	{ dotable, "table", 5 }, /* TEXICMD_TABLE */
	{ doignblock, "tex", 3 }, /* TEXICMD_TEX */
	{ dosymbol, "TeX", 3 }, /* TEXICMD_TEXSYM */
	{ dosymbol, "textdegree", 10 }, /* TEXICMD_TEXTDEGREE */
	{ dosymbol, "TH", 2 }, /* TEXICMD_TH */
	{ dosymbol, "th", 2 }, /* TEXICMD_THSMALL */
	{ dosymbol, "tie", 3 }, /* TEXICMD_TIE */
	{ doaccent, "tieaccent", 9 }, /* TEXICMD_TIEACCENT */
	{ doaccent, "~", 1 }, /* TEXICMD_TILDE */
	{ doignline, "tindex", 6 }, /* TEXICMD_TINDEX */
	{ doignline, "title", 5 }, /* TEXICMD_TITLE */
	{ dobracket, "titlefont", 9 }, /* TEXICMD_TITLEFONT */
	{ doignblock, "titlepage", 9 }, /* TEXICMD_TITLEPAGE */
	{ dotop, "top", 3 }, /* TEXICMD_TOP */
	{ doaccent, "u", 1 }, /* TEXICMD_U */
	{ doaccent, "ubaraccent", 10 }, /* TEXICMD_UBARACCENT */
	{ doaccent, "udotaccent", 10 }, /* TEXICMD_UDOTACCENT */
	{ doaccent, "\"", 1 }, /* TEXICMD_UMLAUT */
	{ dosection, "unnumbered", 10 }, /* TEXICMD_UNNUMBERED */
	{ dosection, "unnumberedsec", 13 }, /* TEXICMD_UNNUMBEREDSEC */
	{ dosubsection, "unnumberedsubsec", 16 }, /* TEXICMD_UNNUMBEREDSUBSEC */
	{ dosubsubsection, "unnumberedsubsubsec", 19 }, /* TEXICMD_UNNUMBEREDSUBSUBSEC */
	{ dolink, "uref", 4 }, /* TEXICMD_UREF */
	{ dolink, "url", 3 }, /* TEXICMD_URL */
	/* Placeholder row with an empty name and zero length. */
	{ doignline, "", 0 }, /* TEXICMD_USER_INDEX */
	{ doaccent, "v", 1 }, /* TEXICMD_V */
	{ dovalue, "value", 5 }, /* TEXICMD_VALUE */
	{ doinline, "var", 3 }, /* TEXICMD_VAR */
	{ doverb, "verb", 4 }, /* TEXICMD_VERB */
	{ doverbatim, "verbatim", 8 }, /* TEXICMD_VERBATIM */
	{ doverbinclude, "verbatiminclude", 15 }, /* TEXICMD_VERBATIMINCLUDE */
	{ doignline, "vindex", 6 }, /* TEXICMD_VINDEX */
	{ dosp, "vskip", 5 }, /* TEXICMD_VSKIP */
	{ dotable, "vtable", 6 }, /* TEXICMD_VTABLE */
	{ dobracket, "w", 1 }, /* TEXICMD_W */
	{ dolink, "xref", 4 }, /* TEXICMD_XREF */
	/* TEXICMD__END */
};

/* Externally visible, read-only alias for the table above. */
const	struct texitok *const texitoks = __texitoks;
1.18 kristaps 343:
1.2 kristaps 344: static void
1.46 kristaps 345: dodefindex(struct texi *p, enum texicmd cmd, size_t *pos)
1.27 kristaps 346: {
347: size_t start, end;
348: char *cp;
349:
1.46 kristaps 350: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
351: advance(p, pos);
1.27 kristaps 352:
353: start = end = *pos;
1.46 kristaps 354: while (end < BUFSZ(p) && ! ismspace(BUF(p)[end]))
1.27 kristaps 355: end++;
356:
357: if (start == end) {
1.46 kristaps 358: advanceeoln(p, pos, 1);
1.27 kristaps 359: return;
360: } else if (NULL == (cp = malloc(end - start + 1)))
361: texiabort(p, NULL);
362:
1.46 kristaps 363: memcpy(cp, &BUF(p)[start], end - start);
1.27 kristaps 364: cp[end - start] = '\0';
365:
366: p->indexs = realloc(p->indexs,
367: sizeof(char *) * (p->indexsz + 1));
368:
369: if (NULL == p->indexs)
370: texiabort(p, NULL);
371: p->indexs[p->indexsz++] = cp;
372: }
373:
374: static void
1.46 kristaps 375: dodefn(struct texi *p, enum texicmd cmd, size_t *pos)
1.3 kristaps 376: {
377: const char *blk;
378:
1.5 kristaps 379: blk = NULL;
1.3 kristaps 380: switch (cmd) {
1.15 kristaps 381: case (TEXICMD_DEFFN):
1.35 kristaps 382: case (TEXICMD_DEFMAC):
1.15 kristaps 383: case (TEXICMD_DEFTP):
1.3 kristaps 384: case (TEXICMD_DEFTYPEFN):
385: case (TEXICMD_DEFTYPEFUN):
1.34 kristaps 386: case (TEXICMD_DEFTYPEMETHOD):
1.15 kristaps 387: case (TEXICMD_DEFTYPEVAR):
388: case (TEXICMD_DEFTYPEVR):
389: case (TEXICMD_DEFUN):
390: case (TEXICMD_DEFVAR):
391: case (TEXICMD_DEFVR):
1.5 kristaps 392: blk = texitoks[cmd].tok;
1.3 kristaps 393: break;
1.5 kristaps 394: default:
1.3 kristaps 395: break;
396: }
397:
398: if (p->ign) {
1.15 kristaps 399: NULL != blk ?
1.46 kristaps 400: parseto(p, pos, blk) :
401: parseeoln(p, pos);
1.3 kristaps 402: return;
403: }
404:
1.15 kristaps 405: if (NULL != blk)
406: texivspace(p);
407:
1.3 kristaps 408: switch (cmd) {
1.34 kristaps 409: case (TEXICMD_DEFTYPEMETHOD):
410: case (TEXICMD_DEFTYPEMETHODX):
411: texiputchars(p, "Method");
412: break;
1.15 kristaps 413: case (TEXICMD_DEFMAC):
414: case (TEXICMD_DEFMACX):
415: texiputchars(p, "Macro");
416: break;
417: case (TEXICMD_DEFTYPEVAR):
418: case (TEXICMD_DEFTYPEVARX):
419: case (TEXICMD_DEFVAR):
420: case (TEXICMD_DEFVARX):
421: texiputchars(p, "Variable");
422: break;
1.3 kristaps 423: case (TEXICMD_DEFTYPEFUN):
1.15 kristaps 424: case (TEXICMD_DEFTYPEFUNX):
425: case (TEXICMD_DEFUN):
426: case (TEXICMD_DEFUNX):
427: texiputchars(p, "Function");
1.3 kristaps 428: break;
429: default:
1.46 kristaps 430: parselinearg(p, pos);
1.3 kristaps 431: break;
432: }
1.15 kristaps 433:
1.48 kristaps 434: texiputchar(p, ':');
435: texiputchar(p, '\n');
1.15 kristaps 436:
437: switch (cmd) {
438: case (TEXICMD_DEFMAC):
439: case (TEXICMD_DEFMACX):
440: teximacroopen(p, "Dv");
1.46 kristaps 441: while (parselinearg(p, pos))
1.15 kristaps 442: /* Spin. */ ;
443: teximacroclose(p);
444: break;
445: case (TEXICMD_DEFFN):
446: case (TEXICMD_DEFFNX):
447: case (TEXICMD_DEFUN):
448: case (TEXICMD_DEFUNX):
449: teximacroopen(p, "Fo");
1.46 kristaps 450: parselinearg(p, pos);
1.15 kristaps 451: teximacroclose(p);
452: teximacroopen(p, "Fa");
1.46 kristaps 453: while (parselinearg(p, pos))
1.15 kristaps 454: /* Spin. */ ;
455: teximacroclose(p);
456: teximacro(p, "Fc");
457: break;
458: case (TEXICMD_DEFTYPEFUN):
459: case (TEXICMD_DEFTYPEFUNX):
460: case (TEXICMD_DEFTYPEFN):
461: case (TEXICMD_DEFTYPEFNX):
1.34 kristaps 462: case (TEXICMD_DEFTYPEMETHOD):
463: case (TEXICMD_DEFTYPEMETHODX):
1.15 kristaps 464: teximacroopen(p, "Ft");
1.46 kristaps 465: parselinearg(p, pos);
1.15 kristaps 466: teximacroclose(p);
467: teximacroopen(p, "Fo");
1.46 kristaps 468: parselinearg(p, pos);
1.15 kristaps 469: teximacroclose(p);
470: teximacroopen(p, "Fa");
1.46 kristaps 471: while (parselinearg(p, pos))
1.15 kristaps 472: /* Spin. */ ;
473: teximacroclose(p);
474: teximacro(p, "Fc");
475: break;
476: case (TEXICMD_DEFTP):
477: case (TEXICMD_DEFTPX):
478: case (TEXICMD_DEFTYPEVAR):
479: case (TEXICMD_DEFTYPEVARX):
480: case (TEXICMD_DEFTYPEVR):
481: case (TEXICMD_DEFTYPEVRX):
482: teximacroopen(p, "Vt");
1.46 kristaps 483: while (parselinearg(p, pos))
1.15 kristaps 484: /* Spin. */ ;
485: teximacroclose(p);
486: break;
487: case (TEXICMD_DEFVAR):
488: case (TEXICMD_DEFVARX):
489: case (TEXICMD_DEFVR):
490: case (TEXICMD_DEFVRX):
491: teximacroopen(p, "Va");
1.46 kristaps 492: while (parselinearg(p, pos))
1.15 kristaps 493: /* Spin. */ ;
494: teximacroclose(p);
495: break;
496: default:
497: abort();
1.3 kristaps 498: }
1.15 kristaps 499:
1.54 kristaps 500: if (NULL == blk)
501: return;
502:
503: /*
504: * All "block" definitions have their block bodies indented
505: * unless they have the "x" form of the command following.
506: * E.g.,
507: * @deffn some function
508: * @deffnx another
509: * An explanation.
510: * @end deffn
511: * With this loop, we delay opening the indented block until we
512: * skipped past conformant macros.
513: */
514: for (;;) {
515: switch (peekcmd(p, *pos)) {
516: case (TEXICMD_DEFFNX):
517: case (TEXICMD_DEFMACX):
518: case (TEXICMD_DEFTPX):
519: case (TEXICMD_DEFTYPEFNX):
520: case (TEXICMD_DEFTYPEFUNX):
521: case (TEXICMD_DEFTYPEMETHODX):
522: case (TEXICMD_DEFTYPEVARX):
523: case (TEXICMD_DEFTYPEVRX):
524: case (TEXICMD_DEFUNX):
525: case (TEXICMD_DEFVARX):
526: case (TEXICMD_DEFVRX):
527: texivspace(p);
528: parseeoln(p, pos);
529: continue;
530: default:
531: break;
532: }
533: break;
534: }
535: teximacro(p, "Bd -filled -offset indent");
536: p->seenvs = 1;
537: parseto(p, pos, blk);
538: teximacro(p, "Ed");
1.3 kristaps 539: }
540:
541: static void
1.46 kristaps 542: domacro(struct texi *p, enum texicmd cmd, size_t *pos)
1.30 kristaps 543: {
544: size_t start, end, endtoksz, len;
545: struct teximacro m;
546: const char *endtok, *blk;
547:
548: memset(&m, 0, sizeof(struct teximacro));
549:
1.46 kristaps 550: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
551: advance(p, pos);
1.30 kristaps 552:
1.46 kristaps 553: for (start = end = *pos; end < BUFSZ(p); end++)
554: if (ismspace(BUF(p)[end]) || '{' == BUF(p)[end])
1.30 kristaps 555: break;
556:
557: if (start == end)
558: texierr(p, "zero-length macro name");
559:
1.46 kristaps 560: advanceto(p, pos, end);
1.30 kristaps 561:
562: m.key = malloc(end - start + 1);
563: if (NULL == m.key)
564: texiabort(p, NULL);
1.46 kristaps 565: memcpy(m.key, &BUF(p)[start], end - start);
1.30 kristaps 566: m.key[end - start] = '\0';
567:
1.46 kristaps 568: m.args = argparse(p, pos, &m.argsz, 0);
1.30 kristaps 569:
1.46 kristaps 570: /* Note: we advance to the beginning of the macro. */
571: advanceeoln(p, pos, 1);
572:
573: /*
574: * According to the Texinfo manual, the macro ends on the
575: * newline subsequent the @end macro.
576: * That's COMPLETELY FUCKING WRONG.
577: * It ends inclusive the newline, which is why so many macros
578: * say things like @r{hello}@c, where the subsequent @c swallows
579: * the newline.
580: * However, it does swallow the leading newline, so look for the
581: * @end macro without the leading newline else we might look
582: * past empty macros.
583: */
1.30 kristaps 584: start = *pos;
1.46 kristaps 585: endtok = "@end macro\n";
1.30 kristaps 586: endtoksz = strlen(endtok);
1.46 kristaps 587: blk = memmem(&BUF(p)[start], BUFSZ(p) - start, endtok, endtoksz);
1.30 kristaps 588: if (NULL == blk)
589: texierr(p, "unterminated macro body");
1.46 kristaps 590: /* Roll us back one character. */
591: while (&BUF(p)[*pos] != blk)
592: advance(p, pos);
593: assert('@' == BUF(p)[*pos]);
594: if ('\n' != BUF(p)[*pos - 1])
595: texierr(p, "cannot handle @end macro in-line");
596:
597: len = blk - &BUF(p)[start];
1.30 kristaps 598: m.value = malloc(len + 1);
599: if (NULL == m.value)
600: texiabort(p, NULL);
1.46 kristaps 601: memcpy(m.value, &BUF(p)[start], len);
1.30 kristaps 602: m.value[len] = '\0';
603:
604: p->macros = realloc
605: (p->macros,
606: (p->macrosz + 1) *
607: sizeof(struct teximacro));
608: if (NULL == p->macros)
609: texiabort(p, NULL);
610:
611: p->macros[p->macrosz++] = m;
1.46 kristaps 612: advanceeoln(p, pos, 1);
1.30 kristaps 613: }
614:
615: static void
1.46 kristaps 616: doignblock(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 617: {
1.45 kristaps 618: char end[32], start[32];
619: const char *endt, *startt;
620: size_t esz, ssz, newpos, stack;
1.26 kristaps 621:
622: /*
1.45 kristaps 623: * FIXME: this is cheating.
624: * These tokens are supposed to begin on a newline.
625: * However, if we do that, then we would need to check within
626: * the loop for trailer (or leading, as the case may be)
627: * newline, and that's just a bit too complicated right now.
628: * This is becasue
629: * @ifset BAR
630: * @ifset FOO
631: * @end ifset
632: * @end ifset
633: * won't work right now: we'd read after the first "@end ifset"
634: * to the next line, then look for the next line after that.
1.26 kristaps 635: */
1.45 kristaps 636: ssz = snprintf(start, sizeof(start),
637: "@%s", texitoks[cmd].tok);
638: assert(ssz < sizeof(start));
639: esz = snprintf(end, sizeof(end),
640: "@end %s\n", texitoks[cmd].tok);
641: assert(esz < sizeof(end));
642: stack = 1;
643:
644: /*
645: * Here we look for the end token "end" somewhere in the file in
646: * front of us.
647: * It's not that easy, of course: if we have a nested block,
648: * then there'll be an "end" token of the same kind between us.
649: * Thus, we keep track of scopes for matching "end" blocks.
1.26 kristaps 650: */
1.46 kristaps 651: while (stack > 0 && *pos < BUFSZ(p)) {
1.52 kristaps 652: if (stack > 64)
653: texierr(p, "run-away nested stack?");
1.46 kristaps 654: endt = memmem(&BUF(p)[*pos], BUFSZ(p) - *pos, end, esz);
655: startt = memmem(&BUF(p)[*pos], BUFSZ(p) - *pos, start, ssz);
1.45 kristaps 656: if (NULL == endt) {
657: texiwarn(p, "unterminated \"%s\" "
658: "block", texitoks[cmd].tok);
1.46 kristaps 659: *pos = BUFSZ(p);
1.45 kristaps 660: break;
661: }
1.26 kristaps 662:
1.45 kristaps 663: newpos = *pos;
664: if (NULL == startt || startt > endt) {
1.46 kristaps 665: newpos += esz + (size_t)(endt - &BUF(p)[*pos]);
1.45 kristaps 666: stack--;
667: } else {
1.46 kristaps 668: newpos += ssz + (size_t)(startt - &BUF(p)[*pos]);
1.45 kristaps 669: stack++;
670: }
671:
1.46 kristaps 672: assert(newpos <= BUFSZ(p));
1.45 kristaps 673: while (*pos < newpos)
1.46 kristaps 674: advance(p, pos);
1.45 kristaps 675: }
1.1 kristaps 676: }
677:
678: static void
1.46 kristaps 679: doblock(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 680: {
681:
1.46 kristaps 682: parseto(p, pos, texitoks[cmd].tok);
1.1 kristaps 683: }
684:
685: static void
1.46 kristaps 686: doinline(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 687: {
1.21 kristaps 688: const char *macro = NULL;
1.12 kristaps 689:
690: switch (cmd) {
1.21 kristaps 691: case (TEXICMD_CODE):
692: case (TEXICMD_KBD):
693: case (TEXICMD_SAMP):
694: case (TEXICMD_T):
695: macro = "Li";
696: break;
697: case (TEXICMD_CITE):
698: case (TEXICMD_DFN):
699: case (TEXICMD_EMPH):
700: case (TEXICMD_I):
701: case (TEXICMD_SLANTED):
702: macro = "Em";
703: break;
704: case (TEXICMD_B):
705: case (TEXICMD_STRONG):
706: macro = "Sy";
707: break;
1.12 kristaps 708: case (TEXICMD_COMMAND):
709: macro = "Xr";
710: break;
711: case (TEXICMD_ENV):
712: macro = "Ev";
713: break;
714: case (TEXICMD_FILE):
715: macro = "Pa";
716: break;
1.16 kristaps 717: case (TEXICMD_OPTION):
718: macro = "Op";
719: break;
1.12 kristaps 720: case (TEXICMD_VAR):
721: macro = "Va";
722: break;
723: default:
1.22 kristaps 724: break;
1.12 kristaps 725: }
726:
1.25 kristaps 727: if (NULL == macro || p->literal || TEXILIST_TABLE == p->list) {
1.53 kristaps 728: parsebracket(p, pos, 0);
1.12 kristaps 729: return;
730: }
1.1 kristaps 731:
1.5 kristaps 732: teximacroopen(p, macro);
1.1 kristaps 733: p->seenws = 0;
1.53 kristaps 734: parsebracket(p, pos, 0);
1.46 kristaps 735: texipunctuate(p, pos);
1.5 kristaps 736: teximacroclose(p);
1.1 kristaps 737: }
738:
739: static void
1.46 kristaps 740: doverb(struct texi *p, enum texicmd cmd, size_t *pos)
1.33 kristaps 741: {
742: char delim;
1.34 kristaps 743: size_t start;
1.33 kristaps 744:
1.46 kristaps 745: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
746: advance(p, pos);
747: if (*pos == BUFSZ(p) || '{' != BUF(p)[*pos])
1.33 kristaps 748: return;
1.46 kristaps 749: advance(p, pos);
750: if (*pos == BUFSZ(p))
1.33 kristaps 751: return;
752:
1.46 kristaps 753: delim = BUF(p)[*pos];
754: advance(p, pos);
1.33 kristaps 755: /* Make sure we flush out our initial whitespace... */
756: if (p->seenws && p->outcol && 0 == p->literal)
757: texiputchar(p, ' ');
758: p->seenws = 0;
1.34 kristaps 759: start = *pos;
1.33 kristaps 760: /* Read until we see the delimiter then end-brace. */
1.46 kristaps 761: while (*pos < BUFSZ(p) - 1) {
762: if (BUF(p)[*pos] == delim && BUF(p)[*pos + 1] == '}')
1.33 kristaps 763: break;
1.46 kristaps 764: advance(p, pos);
1.33 kristaps 765: }
1.51 kristaps 766: if (*pos >= BUFSZ(p) - 1)
1.33 kristaps 767: return;
1.46 kristaps 768: texiputbuf(p, start, *pos);
1.34 kristaps 769:
1.33 kristaps 770: /* Make sure we read after the end-brace. */
1.46 kristaps 771: assert(delim == BUF(p)[*pos]);
772: advance(p, pos);
773: assert('}' == BUF(p)[*pos]);
774: advance(p, pos);
1.33 kristaps 775: }
776:
777: static void
1.46 kristaps 778: doverbatim(struct texi *p, enum texicmd cmd, size_t *pos)
1.25 kristaps 779: {
780: const char *end, *term;
781: size_t endsz, endpos;
782:
1.45 kristaps 783: /* We read from the @verbatim\n newline inclusive! */
1.25 kristaps 784: end = "\n@end verbatim\n";
785: endsz = strlen(end);
1.46 kristaps 786: advanceeoln(p, pos, 0);
787: if (*pos == BUFSZ(p)) {
1.45 kristaps 788: texiwarn(p, "unexpected end of file");
789: return;
790: }
1.25 kristaps 791:
1.46 kristaps 792: term = memmem(&BUF(p)[*pos], BUFSZ(p) - *pos, end, endsz);
1.45 kristaps 793: if (NULL == term) {
794: texiwarn(p, "unterminated verbatim block");
1.46 kristaps 795: endpos = BUFSZ(p);
1.45 kristaps 796: } else
1.46 kristaps 797: endpos = *pos + (size_t)(term - &BUF(p)[*pos]);
1.25 kristaps 798:
1.46 kristaps 799: assert(endpos <= BUFSZ(p));
800: assert('\n' == BUF(p)[*pos]);
801: advance(p, pos);
1.25 kristaps 802: teximacro(p, "Bd -literal -offset indent");
1.26 kristaps 803: while (*pos < endpos) {
1.46 kristaps 804: texiputchar(p, BUF(p)[*pos]);
805: advance(p, pos);
1.25 kristaps 806: }
807: teximacro(p, "Ed");
1.46 kristaps 808: if (*pos < BUFSZ(p))
809: advanceto(p, pos, endpos + endsz);
1.25 kristaps 810: }
811:
812: static void
1.46 kristaps 813: doverbinclude(struct texi *p, enum texicmd cmd, size_t *pos)
1.16 kristaps 814: {
1.25 kristaps 815: char fname[PATH_MAX], path[PATH_MAX];
816: int rc;
817: size_t i, end;
818: const char *v;
819: enum texicmd type;
1.16 kristaps 820:
1.46 kristaps 821: while (*pos < BUFSZ(p) && ' ' == BUF(p)[*pos])
822: advance(p, pos);
1.16 kristaps 823:
1.46 kristaps 824: for (i = 0; *pos < BUFSZ(p) && '\n' != BUF(p)[*pos]; ) {
1.16 kristaps 825: if (i == sizeof(fname) - 1)
826: break;
1.46 kristaps 827: if ('@' != BUF(p)[*pos]) {
828: fname[i++] = BUF(p)[*pos];
829: advance(p, pos);
1.25 kristaps 830: continue;
831: }
1.46 kristaps 832: type = texicmd(p, *pos, &end, NULL);
833: advanceto(p, pos, end);
1.25 kristaps 834: if (TEXICMD_VALUE != type)
835: texierr(p, "unknown verbatiminclude command");
1.46 kristaps 836: v = valueblookup(p, pos);
1.25 kristaps 837: if (NULL == v)
838: continue;
839: while ('\0' != *v) {
840: if (i == sizeof(fname) - 1)
841: break;
842: fname[i++] = *v++;
843: }
844: if ('\0' != *v)
845: break;
1.16 kristaps 846: }
847:
848: if (i == 0)
849: texierr(p, "path too short");
1.46 kristaps 850: else if ('\n' != BUF(p)[*pos])
1.16 kristaps 851: texierr(p, "path too long");
852: else if ('/' == fname[0])
853: texierr(p, "no absolute paths");
854: fname[i] = '\0';
855:
856: if (strstr(fname, "../") || strstr(fname, "/.."))
857: texierr(p, "insecure path");
858:
859: rc = snprintf(path, sizeof(path),
860: "%s/%s", p->dirs[0], fname);
861: if (rc < 0)
862: texierr(p, "couldn't format path");
863: else if ((size_t)rc >= sizeof(path))
864: texierr(p, "path too long");
865:
866: parsefile(p, path, 0);
867: }
868:
869: static void
1.46 kristaps 870: doinclude(struct texi *p, enum texicmd cmd, size_t *pos)
1.2 kristaps 871: {
1.25 kristaps 872: char fname[PATH_MAX], path[PATH_MAX];
873: size_t i, end;
874: int rc;
875: const char *v;
876: enum texicmd type;
1.2 kristaps 877:
1.46 kristaps 878: while (*pos < BUFSZ(p) && ' ' == BUF(p)[*pos])
879: advance(p, pos);
1.2 kristaps 880:
881: /* Read in the filename. */
1.46 kristaps 882: for (i = 0; *pos < BUFSZ(p) && '\n' != BUF(p)[*pos]; ) {
1.2 kristaps 883: if (i == sizeof(fname) - 1)
884: break;
1.46 kristaps 885: if ('@' != BUF(p)[*pos]) {
886: fname[i++] = BUF(p)[*pos];
887: advance(p, pos);
1.25 kristaps 888: continue;
889: }
1.46 kristaps 890: type = texicmd(p, *pos, &end, NULL);
891: advanceto(p, pos, end);
1.25 kristaps 892: if (TEXICMD_VALUE != type)
893: texierr(p, "unknown include command");
1.46 kristaps 894: v = valueblookup(p, pos);
1.25 kristaps 895: if (NULL == v)
896: continue;
897: while ('\0' != *v) {
898: if (i == sizeof(fname) - 1)
899: break;
900: fname[i++] = *v++;
901: }
902: if ('\0' != *v)
903: break;
1.2 kristaps 904: }
905:
906: if (i == 0)
907: texierr(p, "path too short");
1.46 kristaps 908: else if ('\n' != BUF(p)[*pos])
1.2 kristaps 909: texierr(p, "path too long");
910: else if ('/' == fname[0])
911: texierr(p, "no absolute paths");
912: fname[i] = '\0';
913:
914: if (strstr(fname, "../") || strstr(fname, "/.."))
915: texierr(p, "insecure path");
916:
1.5 kristaps 917: for (i = 0; i < p->dirsz; i++) {
918: rc = snprintf(path, sizeof(path),
919: "%s/%s", p->dirs[i], fname);
920: if (rc < 0)
921: texierr(p, "couldn't format path");
922: else if ((size_t)rc >= sizeof(path))
923: texierr(p, "path too long");
924: else if (-1 == access(path, R_OK))
925: continue;
926:
1.16 kristaps 927: parsefile(p, path, 1);
1.5 kristaps 928: return;
929: }
1.2 kristaps 930:
1.5 kristaps 931: texierr(p, "couldn't find %s in includes", fname);
1.2 kristaps 932: }
933:
934: static void
1.46 kristaps 935: dobracket(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 936: {
937:
1.53 kristaps 938: parsebracket(p, pos, 0);
1.1 kristaps 939: }
940:
941: static void
1.46 kristaps 942: dodisplay(struct texi *p, enum texicmd cmd, size_t *pos)
1.3 kristaps 943: {
944:
1.57 ! kristaps 945: advanceeoln(p, pos, 1);
! 946:
1.20 kristaps 947: switch (cmd) {
948: case (TEXICMD_FORMAT):
949: case (TEXICMD_SMALLFORMAT):
950: teximacro(p, "Bd -filled");
951: break;
952: default:
953: teximacro(p, "Bd -filled -offset indent");
954: break;
955: }
956:
1.11 kristaps 957: p->seenvs = 1;
1.46 kristaps 958: parseto(p, pos, texitoks[cmd].tok);
1.5 kristaps 959: teximacro(p, "Ed");
1.3 kristaps 960: }
961:
962: static void
1.46 kristaps 963: doexample(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 964: {
965:
1.57 ! kristaps 966: advanceeoln(p, pos, 1);
! 967:
1.5 kristaps 968: teximacro(p, "Bd -literal -offset indent");
1.3 kristaps 969: p->literal++;
1.46 kristaps 970: parseto(p, pos, texitoks[cmd].tok);
1.3 kristaps 971: p->literal--;
1.5 kristaps 972: teximacro(p, "Ed");
1.1 kristaps 973: }
974:
975: static void
1.46 kristaps 976: dobye(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 977: {
978:
979: texiexit(p);
980: exit(EXIT_SUCCESS);
981: }
982:
983: static void
1.46 kristaps 984: dotitle(struct texi *p, enum texicmd cmd, size_t *pos)
1.10 kristaps 985: {
1.57 ! kristaps 986: size_t start;
1.10 kristaps 987:
1.46 kristaps 988: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
989: advance(p, pos);
1.57 ! kristaps 990:
! 991: /* We want to suck down the entire line, inclusive \n. */
! 992: start = *pos;
! 993: while (*pos < BUFSZ(p) && '\n' != BUF(p)[*pos]) {
! 994: if ('@' == BUF(p)[*pos])
! 995: advance(p, pos);
! 996: advance(p, pos);
! 997: }
! 998: if (*pos < BUFSZ(p))
! 999: advance(p, pos);
! 1000:
! 1001: /* Copy this into a buffer. */
1.10 kristaps 1002: free(p->subtitle);
1.57 ! kristaps 1003: if (NULL == (p->subtitle = malloc(*pos - start + 1)))
1.27 kristaps 1004: texiabort(p, NULL);
1.57 ! kristaps 1005: memcpy(p->subtitle, &BUF(p)[start], *pos - start);
! 1006: p->subtitle[*pos - start] = '\0';
1.10 kristaps 1007: }
1008:
1009: static void
1.46 kristaps 1010: doaccent(struct texi *p, enum texicmd cmd, size_t *pos)
1.16 kristaps 1011: {
1.42 kristaps 1012: int brace = 0;
1.16 kristaps 1013:
1.46 kristaps 1014: if (*pos == BUFSZ(p)) {
1.42 kristaps 1015: texiwarn(p, "truncated: @%s", texitoks[cmd].tok);
1.16 kristaps 1016: return;
1.42 kristaps 1017: }
1018:
1019: /* Pad us with space, if necessary. */
1020: if (p->seenws && p->outcol && 0 == p->literal) {
1.34 kristaps 1021: texiputchar(p, ' ');
1.42 kristaps 1022: p->seenws = 0;
1023: }
1024:
1025: /*
1026: * If we're braced, then that's that.
1027: * Otherwise, in a special Texinfo case: if we're a non
1028: * alphabetic command of one letter, then the next character is
1029: * the critical one.
1030: * Otherwise, space can sit between us and our argument.
1031: */
1.46 kristaps 1032: if ('{' == BUF(p)[*pos]) {
1.42 kristaps 1033: brace = 1;
1.46 kristaps 1034: advance(p, pos);
1.49 kristaps 1035: } else if (isalpha((unsigned char)texitoks[cmd].tok[0]))
1.46 kristaps 1036: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1037: advance(p, pos);
1.42 kristaps 1038:
1.46 kristaps 1039: if (*pos == BUFSZ(p)) {
1.42 kristaps 1040: texiwarn(p, "truncated: @%s", texitoks[cmd].tok);
1041: return;
1042: }
1043:
1044: switch (cmd) {
1.16 kristaps 1045: case (TEXICMD_ACUTE):
1.46 kristaps 1046: switch (BUF(p)[*pos]) {
1.16 kristaps 1047: case ('a'): case ('A'):
1048: case ('e'): case ('E'):
1049: case ('i'): case ('I'):
1050: case ('o'): case ('O'):
1051: case ('u'): case ('U'):
1052: texiputchars(p, "\\(\'");
1053: break;
1054: default:
1.42 kristaps 1055: texiwarn(p, "ignoring accent");
1056: break;
1.16 kristaps 1057: }
1.46 kristaps 1058: texiputchar(p, BUF(p)[*pos]);
1059: advance(p, pos);
1.42 kristaps 1060: break;
1061: case (TEXICMD_CEDILLA):
1.46 kristaps 1062: if ('c' == BUF(p)[*pos] || 'C' == BUF(p)[*pos])
1.42 kristaps 1063: texiputchars(p, "\\(,");
1064: else
1065: texiwarn(p, "ignoring accent");
1.46 kristaps 1066: texiputchar(p, BUF(p)[*pos]);
1067: advance(p, pos);
1.16 kristaps 1068: break;
1069: case (TEXICMD_CIRCUMFLEX):
1.46 kristaps 1070: switch (BUF(p)[*pos]) {
1.16 kristaps 1071: case ('a'): case ('A'):
1072: case ('e'): case ('E'):
1073: case ('i'): case ('I'):
1074: case ('o'): case ('O'):
1075: case ('u'): case ('U'):
1076: texiputchars(p, "\\(^");
1077: break;
1078: default:
1.42 kristaps 1079: texiwarn(p, "ignoring accent");
1.34 kristaps 1080: break;
1.16 kristaps 1081: }
1.46 kristaps 1082: texiputchar(p, BUF(p)[*pos]);
1083: advance(p, pos);
1.42 kristaps 1084: break;
1085: case (TEXICMD_DOTLESS):
1.46 kristaps 1086: if ('i' == BUF(p)[*pos] || 'j' == BUF(p)[*pos])
1.42 kristaps 1087: texiputchars(p, "\\(.");
1088: else
1089: texiwarn(p, "ignoring accent");
1.46 kristaps 1090: texiputchar(p, BUF(p)[*pos]);
1091: advance(p, pos);
1.16 kristaps 1092: break;
1093: case (TEXICMD_GRAVE):
1.46 kristaps 1094: switch (BUF(p)[*pos]) {
1.16 kristaps 1095: case ('a'): case ('A'):
1096: case ('e'): case ('E'):
1097: case ('i'): case ('I'):
1098: case ('o'): case ('O'):
1099: case ('u'): case ('U'):
1100: texiputchars(p, "\\(`");
1101: break;
1102: default:
1.42 kristaps 1103: texiwarn(p, "ignoring accent");
1104: break;
1.16 kristaps 1105: }
1.46 kristaps 1106: texiputchar(p, BUF(p)[*pos]);
1107: advance(p, pos);
1.16 kristaps 1108: break;
1109: case (TEXICMD_TILDE):
1.46 kristaps 1110: switch (BUF(p)[*pos]) {
1.16 kristaps 1111: case ('a'): case ('A'):
1112: case ('n'): case ('N'):
1113: case ('o'): case ('O'):
1114: texiputchars(p, "\\(~");
1115: break;
1116: default:
1.42 kristaps 1117: texiwarn(p, "ignoring accent");
1.34 kristaps 1118: break;
1.16 kristaps 1119: }
1.46 kristaps 1120: texiputchar(p, BUF(p)[*pos]);
1121: advance(p, pos);
1.16 kristaps 1122: break;
1123: case (TEXICMD_UMLAUT):
1.46 kristaps 1124: switch (BUF(p)[*pos]) {
1.16 kristaps 1125: case ('a'): case ('A'):
1126: case ('e'): case ('E'):
1127: case ('i'): case ('I'):
1128: case ('o'): case ('O'):
1129: case ('u'): case ('U'):
1130: case ('y'):
1131: texiputchars(p, "\\(:");
1132: break;
1133: default:
1.42 kristaps 1134: texiwarn(p, "ignoring accent");
1.34 kristaps 1135: break;
1.16 kristaps 1136: }
1.46 kristaps 1137: texiputchar(p, BUF(p)[*pos]);
1138: advance(p, pos);
1.16 kristaps 1139: break;
1140: default:
1.46 kristaps 1141: texiputchar(p, BUF(p)[*pos]);
1142: advance(p, pos);
1.42 kristaps 1143: break;
1144: }
1145:
1146: if (brace) {
1.46 kristaps 1147: while (*pos < BUFSZ(p) && '}' != BUF(p)[*pos]) {
1148: texiputchar(p, BUF(p)[*pos]);
1149: advance(p, pos);
1.42 kristaps 1150: }
1.46 kristaps 1151: if (*pos < BUFSZ(p))
1152: advance(p, pos);
1.42 kristaps 1153: }
1154:
1155: switch (cmd) {
1156: case (TEXICMD_TIEACCENT):
1157: texiputchar(p, ']');
1158: break;
1159: case (TEXICMD_DOTACCENT):
1160: texiputchar(p, '*');
1161: break;
1162: default:
1163: break;
1.16 kristaps 1164: }
1165: }
1166:
1167: static void
1.46 kristaps 1168: dosymbol(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1169: {
1170:
1.42 kristaps 1171: /* Remember to pad us. */
1.43 kristaps 1172: if (p->seenws && p->outcol && 0 == p->literal)
1.3 kristaps 1173: texiputchar(p, ' ');
1.43 kristaps 1174:
1175: p->seenws = 0;
1.3 kristaps 1176:
1.1 kristaps 1177: switch (cmd) {
1.42 kristaps 1178: case (TEXICMD_AA):
1179: texiputchars(p, "\\(oA");
1180: break;
1181: case (TEXICMD_AASMALL):
1182: texiputchars(p, "\\(oa");
1183: break;
1184: case (TEXICMD_AE):
1185: texiputchars(p, "\\(AE");
1186: break;
1187: case (TEXICMD_AESMALL):
1188: texiputchars(p, "\\(ae");
1189: break;
1.3 kristaps 1190: case (TEXICMD_ASTERISK):
1191: case (TEXICMD_NEWLINE):
1192: case (TEXICMD_SPACE):
1.18 kristaps 1193: case (TEXICMD_TABSYM):
1.3 kristaps 1194: texiputchar(p, ' ');
1195: break;
1.1 kristaps 1196: case (TEXICMD_AT):
1.3 kristaps 1197: texiputchar(p, '@');
1198: break;
1199: case (TEXICMD_BANG):
1200: texiputchar(p, '!');
1.7 kristaps 1201: break;
1202: case (TEXICMD_BULLET):
1203: texiputchars(p, "\\(bu");
1.1 kristaps 1204: break;
1.35 kristaps 1205: case (TEXICMD_COMMA):
1206: texiputchar(p, ',');
1207: break;
1.1 kristaps 1208: case (TEXICMD_COPYRIGHT):
1209: texiputchars(p, "\\(co");
1210: break;
1.42 kristaps 1211: case (TEXICMD_DH):
1212: texiputchars(p, "\\(-D");
1213: break;
1214: case (TEXICMD_DHSMALL):
1215: texiputchars(p, "\\(Sd");
1216: break;
1.2 kristaps 1217: case (TEXICMD_DOTS):
1.34 kristaps 1218: case (TEXICMD_ENDDOTS):
1.2 kristaps 1219: texiputchars(p, "...");
1220: break;
1.28 kristaps 1221: case (TEXICMD_EQUIV):
1222: texiputchars(p, "\\(==");
1223: break;
1.15 kristaps 1224: case (TEXICMD_ERROR):
1225: texiputchars(p, "error\\(->");
1.17 kristaps 1226: break;
1.43 kristaps 1227: case (TEXICMD_EURO):
1228: texiputchars(p, "\\(Eu");
1229: break;
1.42 kristaps 1230: case (TEXICMD_EXCLAMDOWN):
1231: texiputchars(p, "\\(r!");
1232: break;
1.17 kristaps 1233: case (TEXICMD_EXPANSION):
1234: texiputchars(p, "\\(->");
1.15 kristaps 1235: break;
1.43 kristaps 1236: case (TEXICMD_GEQ):
1237: texiputchars(p, "\\(>=");
1238: break;
1239: case (TEXICMD_GUILLEMETLEFT):
1240: case (TEXICMD_GUILLEMOTLEFT):
1241: texiputchars(p, "\\(Fo");
1242: break;
1243: case (TEXICMD_GUILLEMETRIGHT):
1244: case (TEXICMD_GUILLEMOTRIGHT):
1245: texiputchars(p, "\\(Fc");
1246: break;
1247: case (TEXICMD_GUILSINGLLEFT):
1248: texiputchars(p, "\\(fo");
1249: break;
1250: case (TEXICMD_GUILSINGLRIGHT):
1251: texiputchars(p, "\\(fc");
1252: break;
1.42 kristaps 1253: case (TEXICMD_L):
1254: texiputchars(p, "\\(/L");
1255: break;
1.1 kristaps 1256: case (TEXICMD_LATEX):
1257: texiputchars(p, "LaTeX");
1258: break;
1.43 kristaps 1259: case (TEXICMD_LEQ):
1260: texiputchars(p, "\\(<=");
1261: break;
1.42 kristaps 1262: case (TEXICMD_LSMALL):
1263: texiputchars(p, "\\(/l");
1264: break;
1.25 kristaps 1265: case (TEXICMD_MINUS):
1266: texiputchars(p, "\\-");
1267: break;
1.42 kristaps 1268: case (TEXICMD_O):
1269: texiputchars(p, "\\(/O");
1270: break;
1271: case (TEXICMD_OE):
1272: texiputchars(p, "\\(OE");
1273: break;
1274: case (TEXICMD_OESMALL):
1275: texiputchars(p, "\\(oe");
1276: break;
1277: case (TEXICMD_ORDF):
1278: texiputchars(p, "a");
1279: break;
1280: case (TEXICMD_ORDM):
1281: texiputchars(p, "o");
1282: break;
1283: case (TEXICMD_OSMALL):
1284: texiputchars(p, "\\(/o");
1285: break;
1.25 kristaps 1286: case (TEXICMD_PERIOD):
1287: texiputchar(p, '.');
1288: break;
1.43 kristaps 1289: case (TEXICMD_POUNDS):
1290: texiputchars(p, "\\(Po");
1291: break;
1.42 kristaps 1292: case (TEXICMD_QUESTIONDOWN):
1293: texiputchars(p, "\\(r?");
1294: break;
1.3 kristaps 1295: case (TEXICMD_QUESTIONMARK):
1296: texiputchar(p, '?');
1.15 kristaps 1297: break;
1.43 kristaps 1298: case (TEXICMD_QUOTEDBLBASE):
1299: texiputchars(p, "\\(Bq");
1300: break;
1301: case (TEXICMD_QUOTEDBLLEFT):
1302: texiputchars(p, "\\(lq");
1303: break;
1304: case (TEXICMD_QUOTEDBLRIGHT):
1305: texiputchars(p, "\\(rq");
1306: break;
1307: case (TEXICMD_QUOTESINGLBASE):
1308: texiputchars(p, "\\(bq");
1309: break;
1310: case (TEXICMD_QUOTELEFT):
1311: texiputchars(p, "\\(oq");
1312: break;
1313: case (TEXICMD_QUOTERIGHT):
1314: texiputchars(p, "\\(cq");
1315: break;
1316: case (TEXICMD_REGISTEREDSYMBOL):
1317: texiputchars(p, "\\(rg");
1318: break;
1.15 kristaps 1319: case (TEXICMD_RESULT):
1320: texiputchars(p, "\\(rA");
1.3 kristaps 1321: break;
1.34 kristaps 1322: case (TEXICMD_SLASH):
1323: texiputchar(p, '/');
1324: break;
1.35 kristaps 1325: case (TEXICMD_SS):
1326: texiputchars(p, "\\(ss");
1327: break;
1.3 kristaps 1328: case (TEXICMD_SQUIGGLE_LEFT):
1329: texiputchars(p, "{");
1330: break;
1331: case (TEXICMD_SQUIGGLE_RIGHT):
1332: texiputchars(p, "}");
1333: break;
1.38 kristaps 1334: case (TEXICMD_TEXSYM):
1.35 kristaps 1335: texiputchars(p, "TeX");
1.43 kristaps 1336: break;
1337: case (TEXICMD_TEXTDEGREE):
1338: texiputchars(p, "\\(de");
1.35 kristaps 1339: break;
1.42 kristaps 1340: case (TEXICMD_TH):
1341: texiputchars(p, "\\(TP");
1342: break;
1343: case (TEXICMD_THSMALL):
1344: texiputchars(p, "\\(Tp");
1345: break;
1.38 kristaps 1346: case (TEXICMD_TIE):
1.35 kristaps 1347: texiputchars(p, "\\ ");
1.1 kristaps 1348: break;
1.3 kristaps 1349: case (TEXICMD_COLON):
1350: case (TEXICMD_HYPHEN):
1351: break;
1.1 kristaps 1352: default:
1353: abort();
1354: }
1355:
1.42 kristaps 1356: /* Alphabetic commands have braces we ignore. */
1.49 kristaps 1357: if (isalpha((unsigned char)texitoks[cmd].tok[0]))
1.46 kristaps 1358: doignbracket(p, cmd, pos);
1.1 kristaps 1359: }
1360:
1361: static void
1.46 kristaps 1362: doquotation(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1363: {
1364:
1.5 kristaps 1365: teximacro(p, "Qo");
1.46 kristaps 1366: parseto(p, pos, "quotation");
1.5 kristaps 1367: teximacro(p, "Qc");
1.1 kristaps 1368: }
1369:
1.3 kristaps 1370: static void
1.46 kristaps 1371: domath(struct texi *p, enum texicmd cmd, size_t *pos)
1.3 kristaps 1372: {
1373:
1.53 kristaps 1374: parsebracket(p, pos, 1);
1.24 kristaps 1375: }
1376:
1377: static void
1.46 kristaps 1378: dovalue(struct texi *p, enum texicmd cmd, size_t *pos)
1.24 kristaps 1379: {
1.46 kristaps 1380: size_t start, end;
1.25 kristaps 1381: char *key, *val;
1382: const char *cp;
1.24 kristaps 1383:
1384: if (TEXICMD_SET == cmd) {
1.46 kristaps 1385: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1386: advance(p, pos);
1387: for (start = end = *pos; end < BUFSZ(p); end++)
1388: if (ismspace(BUF(p)[end]))
1.24 kristaps 1389: break;
1.25 kristaps 1390: /* We don't allow empty keys. */
1.24 kristaps 1391: if (start == end)
1392: return;
1.46 kristaps 1393: advanceto(p, pos, end);
1.24 kristaps 1394:
1395: key = malloc(end - start + 1);
1.27 kristaps 1396: if (NULL == key)
1397: texiabort(p, NULL);
1.46 kristaps 1398: memcpy(key, &BUF(p)[start], end - start);
1.24 kristaps 1399: key[end - start] = '\0';
1400:
1.46 kristaps 1401: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1402: advance(p, pos);
1403: for (start = end = *pos; end < BUFSZ(p); end++)
1404: if ('\n' == BUF(p)[end])
1.24 kristaps 1405: break;
1.25 kristaps 1406: /* We do allow empty values. */
1.46 kristaps 1407: advanceeoln(p, pos, 1);
1.24 kristaps 1408:
1409: val = malloc(end - start + 1);
1.27 kristaps 1410: if (NULL == val)
1411: texiabort(p, NULL);
1.46 kristaps 1412: memcpy(val, &BUF(p)[start], end - start);
1.24 kristaps 1413: val[end - start] = '\0';
1.25 kristaps 1414: valueadd(p, key, val);
1.24 kristaps 1415: } else if (TEXICMD_VALUE == cmd) {
1416: if (p->seenws)
1417: texiputchar(p, ' ');
1418: p->seenws = 0;
1.46 kristaps 1419: if (NULL != (cp = valueblookup(p, pos)))
1.56 kristaps 1420: texisplice(p, cp, strlen(cp), *pos);
1.46 kristaps 1421: else
1.25 kristaps 1422: texiputchars(p, "{No value}");
1.24 kristaps 1423: } else if (TEXICMD_IFCLEAR == cmd) {
1.46 kristaps 1424: if (NULL != valuellookup(p, pos))
1425: doignblock(p, cmd, pos);
1.26 kristaps 1426: else
1.46 kristaps 1427: parseto(p, pos, texitoks[cmd].tok);
1.30 kristaps 1428: } else if (TEXICMD_IFSET == cmd) {
1.46 kristaps 1429: if (NULL == valuellookup(p, pos))
1430: doignblock(p, cmd, pos);
1.30 kristaps 1431: else
1.46 kristaps 1432: parseto(p, pos, texitoks[cmd].tok);
1.25 kristaps 1433: } else if (TEXICMD_CLEAR == cmd)
1.46 kristaps 1434: valuelclear(p, pos);
1.3 kristaps 1435: }
1436:
1.1 kristaps 1437: static void
1.46 kristaps 1438: dolink(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1439: {
1.8 kristaps 1440: int c;
1.1 kristaps 1441:
1442: switch (cmd) {
1443: case (TEXICMD_EMAIL):
1.5 kristaps 1444: teximacroopen(p, "Mt");
1.1 kristaps 1445: break;
1.3 kristaps 1446: case (TEXICMD_UREF):
1.1 kristaps 1447: case (TEXICMD_URL):
1.44 kristaps 1448: case (TEXICMD_INDICATEURL):
1.5 kristaps 1449: teximacroopen(p, "Lk");
1.1 kristaps 1450: break;
1.8 kristaps 1451: case (TEXICMD_XREF):
1452: texiputchars(p, "See Section");
1.39 kristaps 1453: teximacroopen(p, "Dq");
1.8 kristaps 1454: break;
1455: case (TEXICMD_PXREF):
1456: texiputchars(p, "see Section");
1.39 kristaps 1457: teximacroopen(p, "Dq");
1.8 kristaps 1458: break;
1.34 kristaps 1459: case (TEXICMD_INFOREF):
1460: texiputchars(p, "See Info file node");
1.39 kristaps 1461: teximacroopen(p, "Dq");
1.34 kristaps 1462: break;
1.1 kristaps 1463: default:
1.8 kristaps 1464: abort();
1.1 kristaps 1465: }
1.8 kristaps 1466:
1.46 kristaps 1467: c = parsearg(p, pos, 0);
1.8 kristaps 1468: p->ign++;
1469: while (c > 0)
1.46 kristaps 1470: c = parsearg(p, pos, 1);
1.8 kristaps 1471: p->ign--;
1472:
1.46 kristaps 1473: texipunctuate(p, pos);
1.8 kristaps 1474: teximacroclose(p);
1475: }
1476:
1477: static void
1.46 kristaps 1478: doignargn(struct texi *p, enum texicmd cmd, size_t *pos)
1.8 kristaps 1479: {
1480: int c;
1481:
1.46 kristaps 1482: c = parsearg(p, pos, 0);
1.8 kristaps 1483: p->ign++;
1484: while (c > 0)
1.46 kristaps 1485: c = parsearg(p, pos, 1);
1.8 kristaps 1486: p->ign--;
1.1 kristaps 1487: }
1488:
1.23 kristaps 1489: /*
1490: * Sections can be made subsections and so on by way of the
1491: * @raiseections and @lowersections commands.
1492: * Perform this check here and return the actual section number adjusted
1493: * to the raise level.
1494: */
1495: static int
1496: sectioner(struct texi *p, int sec)
1497: {
1498:
1499: if ((sec -= p->secoffs) < 0) {
1500: texiwarn(p, "section below minimum, clamping");
1501: return(0);
1502: } else if (sec >= SECTSZ) {
1503: texiwarn(p, "section above maximum, clamping");
1504: return(SECTSZ - 1);
1505: }
1506: return(sec);
1507: }
1508:
1509: static void
1.46 kristaps 1510: dosubsubsection(struct texi *p, enum texicmd cmd, size_t *pos)
1.23 kristaps 1511: {
1512: int sec;
1513:
1514: sec = sectioner(p, 3);
1515:
1516: /* We don't have a subsubsubsection, so make one up. */
1517: texivspace(p);
1518: teximacroopen(p, sects[sec]);
1.46 kristaps 1519: parseeoln(p, pos);
1.23 kristaps 1520: teximacroclose(p);
1521: texivspace(p);
1522: }
1523:
1.1 kristaps 1524: static void
1.46 kristaps 1525: dosubsection(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1526: {
1.23 kristaps 1527: int sec;
1528:
1529: sec = sectioner(p, 2);
1.13 kristaps 1530:
1531: if (p->outmacro)
1.23 kristaps 1532: texierr(p, "\"%s\" in open line scope!?", sects[sec]);
1.13 kristaps 1533: else if (p->literal)
1.23 kristaps 1534: texierr(p, "\"%s\" in a literal scope!?", sects[sec]);
1.1 kristaps 1535:
1.21 kristaps 1536: /* We don't have a subsubsection, so make one up. */
1.34 kristaps 1537: if (sec > 1)
1538: texivspace(p);
1.23 kristaps 1539: teximacroopen(p, sects[sec]);
1.46 kristaps 1540: parseeoln(p, pos);
1.5 kristaps 1541: teximacroclose(p);
1.34 kristaps 1542: if (sec > 1)
1543: texivspace(p);
1.1 kristaps 1544: }
1545:
1546: static void
1.46 kristaps 1547: dosecoffs(struct texi *p, enum texicmd cmd, size_t *pos)
1.23 kristaps 1548: {
1549:
1550: if (TEXICMD_RAISESECTIONS == cmd)
1551: p->secoffs++;
1552: else
1553: p->secoffs--;
1554: }
1555:
1556: static void
1.46 kristaps 1557: dosection(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1558: {
1.23 kristaps 1559: int sec;
1.12 kristaps 1560:
1561: switch (cmd) {
1.55 kristaps 1562: case (TEXICMD_TOP):
1563: sec = 0;
1564: break;
1.12 kristaps 1565: case (TEXICMD_APPENDIX):
1566: case (TEXICMD_CHAPTER):
1567: case (TEXICMD_UNNUMBERED):
1.23 kristaps 1568: sec = sectioner(p, 0);
1.12 kristaps 1569: break;
1570: case (TEXICMD_APPENDIXSEC):
1571: case (TEXICMD_HEADING):
1572: case (TEXICMD_SECTION):
1573: case (TEXICMD_UNNUMBEREDSEC):
1.23 kristaps 1574: sec = sectioner(p, 1);
1.12 kristaps 1575: break;
1576: default:
1577: abort();
1578: }
1.1 kristaps 1579:
1.3 kristaps 1580: if (p->outmacro)
1.23 kristaps 1581: texierr(p, "\"%s\" in open line scope!?", sects[sec]);
1.3 kristaps 1582: else if (p->literal)
1.23 kristaps 1583: texierr(p, "\"%s\" in a literal scope!?", sects[sec]);
1.3 kristaps 1584:
1.55 kristaps 1585: if (0 == sec && NULL != p->chapters) {
1586: teximdocclose(p, 0);
1.56 kristaps 1587: teximdocopen(p, pos);
1.55 kristaps 1588: }
1589:
1.23 kristaps 1590: teximacroopen(p, sects[sec]);
1.46 kristaps 1591: parseeoln(p, pos);
1.3 kristaps 1592: teximacroclose(p);
1.11 kristaps 1593: p->seenvs = 1;
1.3 kristaps 1594: }
1595:
1596: static void
1.55 kristaps 1597: dotop(struct texi *p, enum texicmd cmd, size_t *pos)
1598: {
1599:
1600: if (--p->ign)
1601: texierr(p, "@top command while ignoring");
1602:
1603: if (NULL == p->chapters)
1.56 kristaps 1604: teximdocopen(p, pos);
1.55 kristaps 1605: dosection(p, cmd, pos);
1606: }
1607:
1608: static void
1.46 kristaps 1609: dosp(struct texi *p, enum texicmd cmd, size_t *pos)
1.3 kristaps 1610: {
1611:
1.57 ! kristaps 1612: advanceeoln(p, pos, 1);
1.37 kristaps 1613: if (p->literal)
1614: texiputchar(p, '\n');
1615: else
1616: texivspace(p);
1.1 kristaps 1617: }
1618:
1619: static void
1.46 kristaps 1620: doitem(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1621: {
1622:
1.18 kristaps 1623: /* Multitable is using raw tbl(7). */
1624: if (TEXILIST_TABLE == p->list) {
1625: texiputchar(p, '\n');
1626: return;
1627: }
1628:
1.3 kristaps 1629: if (p->outmacro)
1630: texierr(p, "item in open line scope!?");
1631: else if (p->literal)
1632: texierr(p, "item in a literal scope!?");
1633:
1634: switch (p->list) {
1635: case (TEXILIST_ITEM):
1.5 kristaps 1636: teximacroopen(p, "It");
1.3 kristaps 1637: break;
1638: case (TEXILIST_NOITEM):
1.5 kristaps 1639: teximacro(p, "It");
1.3 kristaps 1640: break;
1641: default:
1.11 kristaps 1642: texivspace(p);
1.3 kristaps 1643: break;
1644: }
1.18 kristaps 1645:
1646: /* Trick so we don't start with Pp. */
1.11 kristaps 1647: p->seenvs = 1;
1.46 kristaps 1648: parseeoln(p, pos);
1.1 kristaps 1649:
1.3 kristaps 1650: if (TEXILIST_ITEM == p->list)
1651: teximacroclose(p);
1.9 kristaps 1652: else if (p->outcol > 0)
1.1 kristaps 1653: texiputchar(p, '\n');
1.18 kristaps 1654: }
1655:
1656: static void
1.46 kristaps 1657: dotab(struct texi *p, enum texicmd cmd, size_t *pos)
1.18 kristaps 1658: {
1659:
1660: /* This command is only useful in @multitable. */
1661: if (TEXILIST_TABLE == p->list)
1662: texiputchar(p, '\t');
1663: }
1664:
1665: static void
1.46 kristaps 1666: domultitable(struct texi *p, enum texicmd cmd, size_t *pos)
1.18 kristaps 1667: {
1668: enum texilist sv = p->list;
1.32 kristaps 1669: int svliteral = p->literal;
1.18 kristaps 1670: enum texicmd type;
1671: size_t i, end, columns;
1672:
1673: p->list = TEXILIST_TABLE;
1.32 kristaps 1674: /*
1675: * TS/TE blocks aren't "in mdoc(7)", so we can disregard the
1676: * fact that we're in literal mode right now.
1677: */
1678: p->literal = 0;
1.18 kristaps 1679: teximacro(p, "TS");
1680: columns = 0;
1681:
1682: /* Advance to the first argument... */
1.46 kristaps 1683: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1684: advance(p, pos);
1.18 kristaps 1685:
1686: /* Make sure we don't print anything when scanning. */
1687: p->ign++;
1.57 ! kristaps 1688: if (*pos < BUFSZ(p) && '@' == BUF(p)[*pos]) {
1.18 kristaps 1689: /*
1690: * Look for @columnfractions.
1691: * We ignore these, but we do use the number of
1692: * arguments to set the number of columns that we'll
1693: * have.
1694: */
1.46 kristaps 1695: type = texicmd(p, *pos, &end, NULL);
1696: advanceto(p, pos, end);
1.18 kristaps 1697: if (TEXICMD_COLUMNFRACTIONS != type)
1.25 kristaps 1698: texierr(p, "unknown multitable command");
1.46 kristaps 1699: while (*pos < BUFSZ(p) && '\n' != BUF(p)[*pos]) {
1700: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1701: advance(p, pos);
1702: while (*pos < BUFSZ(p) && ! isws(BUF(p)[*pos])) {
1703: if ('\n' == BUF(p)[*pos])
1.18 kristaps 1704: break;
1.46 kristaps 1705: advance(p, pos);
1.18 kristaps 1706: }
1707: columns++;
1708: }
1709: } else
1710: /*
1711: * We have arguments.
1712: * We could parse these, but it's easier to just let
1713: * tbl(7) figure it out.
1714: * So use this only to count arguments.
1715: */
1.46 kristaps 1716: while (parselinearg(p, pos) > 0)
1.18 kristaps 1717: columns++;
1718: p->ign--;
1719:
1720: /* Left-justify each table entry. */
1721: for (i = 0; i < columns; i++) {
1722: if (i > 0)
1723: texiputchar(p, ' ');
1724: texiputchar(p, 'l');
1725: }
1726: texiputchars(p, ".\n");
1727: p->outmacro++;
1.46 kristaps 1728: parseto(p, pos, texitoks[cmd].tok);
1.18 kristaps 1729: p->outmacro--;
1730: teximacro(p, "TE");
1.32 kristaps 1731: p->literal = svliteral;
1.18 kristaps 1732: p->list = sv;
1.1 kristaps 1733: }
1734:
1735: static void
1.46 kristaps 1736: dotable(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1737: {
1.3 kristaps 1738: enum texilist sv = p->list;
1739:
1.57 ! kristaps 1740: advanceeoln(p, pos, 1);
! 1741:
1.3 kristaps 1742: p->list = TEXILIST_ITEM;
1.5 kristaps 1743: teximacro(p, "Bl -tag -width Ds");
1.11 kristaps 1744: p->seenvs = 1;
1.46 kristaps 1745: parseto(p, pos, texitoks[cmd].tok);
1.5 kristaps 1746: teximacro(p, "El");
1.3 kristaps 1747: p->list = sv;
1.44 kristaps 1748: }
1749:
1750: static void
1.46 kristaps 1751: doend(struct texi *p, enum texicmd cmd, size_t *pos)
1.44 kristaps 1752: {
1753: size_t start;
1754:
1.46 kristaps 1755: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1756: advance(p, pos);
1.44 kristaps 1757: start = *pos;
1.46 kristaps 1758: while (*pos < BUFSZ(p) && '\n' != BUF(p)[*pos])
1759: advance(p, pos);
1.44 kristaps 1760:
1.56 kristaps 1761: texiwarn(p, "unexpected \"end\": %.*s",
1762: (int)(*pos - start), &BUF(p)[start]);
1.46 kristaps 1763: advanceeoln(p, pos, 1);
1.1 kristaps 1764: }
1765:
1766: static void
1.46 kristaps 1767: doenumerate(struct texi *p, enum texicmd cmd, size_t *pos)
1.2 kristaps 1768: {
1.3 kristaps 1769: enum texilist sv = p->list;
1.2 kristaps 1770:
1.57 ! kristaps 1771: advanceeoln(p, pos, 1);
! 1772:
1.3 kristaps 1773: p->list = TEXILIST_NOITEM;
1.5 kristaps 1774: teximacro(p, "Bl -enum");
1.11 kristaps 1775: p->seenvs = 1;
1.57 ! kristaps 1776: parseto(p, pos, texitoks[cmd].tok);
1.5 kristaps 1777: teximacro(p, "El");
1.3 kristaps 1778: p->list = sv;
1.2 kristaps 1779: }
1780:
1781: static void
1.46 kristaps 1782: doitemize(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1783: {
1.3 kristaps 1784: enum texilist sv = p->list;
1.1 kristaps 1785:
1.57 ! kristaps 1786: advanceeoln(p, pos, 1);
! 1787:
1.21 kristaps 1788: p->list = TEXILIST_NOITEM;
1.5 kristaps 1789: teximacro(p, "Bl -bullet");
1.11 kristaps 1790: p->seenvs = 1;
1.57 ! kristaps 1791: parseto(p, pos, texitoks[cmd].tok);
1.5 kristaps 1792: teximacro(p, "El");
1.3 kristaps 1793: p->list = sv;
1.1 kristaps 1794: }
1795:
1796: static void
1.46 kristaps 1797: doignbracket(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1798: {
1799:
1.3 kristaps 1800: p->ign++;
1.53 kristaps 1801: parsebracket(p, pos, 0);
1.3 kristaps 1802: p->ign--;
1.1 kristaps 1803: }
1804:
1805: static void
1.46 kristaps 1806: doignline(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1807: {
1808:
1.57 ! kristaps 1809: advanceeoln(p, pos, 1);
1.1 kristaps 1810: }
1811:
/*
 * Build an array of directory names.
 * If "base" is not NULL, a copy of it becomes the first entry.
 * If "cp" is not NULL, it is split on ':' and a copy of every piece
 * (empty pieces included) is appended in order.
 * The number of entries is stored in "sz"; when both inputs are NULL,
 * "sz" is set to zero and NULL is returned.
 * The directory names are NOT sanitised in any way.
 * Allocation failures are handed to texiabort().
 */
static char **
parsedirs(struct texi *p, const char *base, const char *cp, size_t *sz)
{
	char		**dirs;
	char		 *copy, *rest, *entry;
	const char	 *scan;
	size_t		  count, n;

	/* One slot for "base", plus one per colon-separated piece. */
	count = (NULL != base) ? 1 : 0;
	if (NULL != cp) {
		count++;
		for (scan = cp; '\0' != *scan; scan++)
			if (':' == *scan)
				count++;
	}

	*sz = count;
	if (0 == count)
		return(NULL);

	dirs = calloc(count, sizeof(char *));
	if (NULL == dirs)
		texiabort(p, NULL);

	n = 0;
	if (NULL != base) {
		dirs[n] = strdup(base);
		if (NULL == dirs[n])
			texiabort(p, NULL);
		n++;
	}

	if (NULL == cp)
		return(dirs);

	/* strsep() writes into its input, so split a private copy. */
	copy = strdup(cp);
	if (NULL == copy)
		texiabort(p, NULL);

	rest = copy;
	while (NULL != (entry = strsep(&rest, ":"))) {
		dirs[n] = strdup(entry);
		if (NULL == dirs[n])
			texiabort(p, NULL);
		n++;
	}

	free(copy);
	return(dirs);
}
1850:
1.1 kristaps 1851: int
1852: main(int argc, char *argv[])
1853: {
1854: struct texi texi;
1.2 kristaps 1855: int c;
1.37 kristaps 1856: char *dirpath, *dir, *ccp;
1.10 kristaps 1857: const char *progname, *Idir, *cp;
1.1 kristaps 1858:
1859: progname = strrchr(argv[0], '/');
1860: if (progname == NULL)
1861: progname = argv[0];
1862: else
1863: ++progname;
1864:
1.10 kristaps 1865: memset(&texi, 0, sizeof(struct texi));
1.40 kristaps 1866: texi.ign = 1;
1.55 kristaps 1867: texi.outfile = stdout;
1.5 kristaps 1868: Idir = NULL;
1.10 kristaps 1869:
1.55 kristaps 1870: while (-1 != (c = getopt(argc, argv, "C:I:")))
1.1 kristaps 1871: switch (c) {
1.55 kristaps 1872: case ('C'):
1873: texi.chapters = optarg;
1874: break;
1.5 kristaps 1875: case ('I'):
1876: Idir = optarg;
1877: break;
1.1 kristaps 1878: default:
1879: goto usage;
1880: }
1881:
1882: argv += optind;
1.40 kristaps 1883: argc -= optind;
1.1 kristaps 1884:
1.40 kristaps 1885: if (argc > 0) {
1886: if (NULL == (dirpath = strdup(argv[0])))
1887: texiabort(&texi, NULL);
1888: if (NULL == (dir = dirname(dirpath)))
1889: texiabort(&texi, NULL);
1890: if (NULL != (cp = strrchr(argv[0], '/')))
1891: texi.title = strdup(cp + 1);
1892: else
1893: texi.title = strdup(argv[0]);
1894: if (NULL == texi.title)
1895: texiabort(&texi, NULL);
1896: else if (NULL != (ccp = strchr(texi.title, '.')))
1897: *ccp = '\0';
1898: texi.dirs = parsedirs(&texi, dir, Idir, &texi.dirsz);
1899: free(dirpath);
1900: parsefile(&texi, argv[0], 1);
1901: } else {
1902: texi.title = strdup("Unknown Manual");
1903: texi.dirs = parsedirs(&texi, NULL, Idir, &texi.dirsz);
1904: parsestdin(&texi);
1905: }
1.27 kristaps 1906:
1.2 kristaps 1907: texiexit(&texi);
1.56 kristaps 1908: exit(EXIT_SUCCESS);
1.1 kristaps 1909: usage:
1.55 kristaps 1910: fprintf(stderr, "usage: %s [-Cdir] [-Idirs] [file]\n", progname);
1.1 kristaps 1911: return(EXIT_FAILURE);
1912: }
CVSweb