Annotation of texi2mdoc/main.c, Revision 1.55
1.55 ! kristaps 1: /* $Id: main.c,v 1.54 2015/02/28 13:16:44 kristaps Exp $ */
1.1 kristaps 2: /*
3: * Copyright (c) 2015 Kristaps Dzonsons <kristaps@bsd.lv>
4: *
5: * Permission to use, copy, modify, and distribute this software for any
6: * purpose with or without fee is hereby granted, provided that the above
7: * copyright notice and this permission notice appear in all copies.
8: *
9: * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
10: * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
11: * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
12: * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
13: * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
14: * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
15: * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
16: */
1.37 kristaps 17: #if defined(__linux__) || defined(__MINT__)
18: # define _GNU_SOURCE /* memmem */
19: #endif
1.1 kristaps 20: #include <assert.h>
21: #include <ctype.h>
22: #include <getopt.h>
1.2 kristaps 23: #include <libgen.h>
24: #include <limits.h>
1.1 kristaps 25: #include <stdarg.h>
26: #include <stdio.h>
27: #include <stdlib.h>
28: #include <string.h>
1.47 kristaps 29: #include <unistd.h>
1.1 kristaps 30:
1.24 kristaps 31: #include "extern.h"
1.1 kristaps 32:
/*
 * Table of SECTSZ mdoc(7) macro names: "Sh", "Ss", "Em" and "No".
 * NOTE(review): the code that reads this table is outside this excerpt;
 * presumably it is indexed by sectioning depth (section, subsection,
 * subsubsection, ...) -- confirm against the section handlers.
 */
1.23 kristaps 33: #define SECTSZ 4
34: static const char *const sects[SECTSZ] = {
35: "Sh",
36: "Ss",
37: "Em",
38: "No",
39: };
40:
1.46 kristaps 41: static void doaccent(struct texi *, enum texicmd, size_t *);
42: static void doblock(struct texi *, enum texicmd, size_t *);
43: static void dobracket(struct texi *, enum texicmd, size_t *);
44: static void dobye(struct texi *, enum texicmd, size_t *);
45: static void dodefindex(struct texi *, enum texicmd, size_t *);
46: static void dodefn(struct texi *, enum texicmd, size_t *);
47: static void dodisplay(struct texi *, enum texicmd, size_t *);
48: static void doend(struct texi *, enum texicmd, size_t *);
49: static void doenumerate(struct texi *, enum texicmd, size_t *);
50: static void doexample(struct texi *, enum texicmd, size_t *);
51: static void doignargn(struct texi *, enum texicmd, size_t *);
52: static void doignblock(struct texi *, enum texicmd, size_t *);
53: static void doignbracket(struct texi *, enum texicmd, size_t *);
54: static void doignline(struct texi *, enum texicmd, size_t *);
55: static void doinline(struct texi *, enum texicmd, size_t *);
56: static void doinclude(struct texi *, enum texicmd, size_t *);
57: static void doitem(struct texi *, enum texicmd, size_t *);
58: static void doitemize(struct texi *, enum texicmd, size_t *);
59: static void dolink(struct texi *, enum texicmd, size_t *);
60: static void domacro(struct texi *, enum texicmd, size_t *);
61: static void domath(struct texi *, enum texicmd, size_t *);
62: static void domultitable(struct texi *, enum texicmd, size_t *);
63: static void doquotation(struct texi *, enum texicmd, size_t *);
64: static void dotable(struct texi *, enum texicmd, size_t *);
65: static void dotop(struct texi *, enum texicmd, size_t *);
66: static void dosecoffs(struct texi *, enum texicmd, size_t *);
67: static void dosection(struct texi *, enum texicmd, size_t *);
68: static void dosp(struct texi *, enum texicmd, size_t *);
69: static void dosubsection(struct texi *, enum texicmd, size_t *);
70: static void dosubsubsection(struct texi *, enum texicmd, size_t *);
71: static void dosymbol(struct texi *, enum texicmd, size_t *);
72: static void dotab(struct texi *, enum texicmd, size_t *);
73: static void dotitle(struct texi *, enum texicmd, size_t *);
74: static void dovalue(struct texi *, enum texicmd, size_t *);
75: static void doverb(struct texi *, enum texicmd, size_t *);
76: static void doverbatim(struct texi *, enum texicmd, size_t *);
77: static void doverbinclude(struct texi *, enum texicmd, size_t *);
1.1 kristaps 78:
/*
 * Dispatch table for Texinfo commands.
 * Each initialiser is positional and consists of, in order: the handler
 * function invoked for the command (NULL for "columnfractions"), the
 * command name as it appears after the "@" in the input (read elsewhere
 * in this file through the "tok" member), and the length of that name
 * in bytes.
 * The table is indexed by enum texicmd (see the texitoks[cmd] lookups
 * in the handlers below), so the order of the rows must match the order
 * of the enumeration exactly; the trailing comment on each row names
 * the enumerator the row is meant to correspond to.
 * NOTE(review): the enumeration lives outside this file, so the
 * trailing comments cannot be checked from here -- e.g. the "b" row is
 * annotated TEXICMD_BOLD whereas doinline() switches on TEXICMD_B.
 * The TEXICMD_USER_INDEX row deliberately has an empty name.
 */
1.24 kristaps 79: static const struct texitok __texitoks[TEXICMD__MAX] = {
1.20 kristaps 80: /* TEXICMD__BEGIN */
1.42 kristaps 81: { doignline, "afourpaper", 10 }, /* TEXICMD_A4PAPER */
82: { dosymbol, "AA", 2 }, /* TEXICMD_AA */
83: { dosymbol, "aa", 2 }, /* TEXICMD_AASMALL */
1.8 kristaps 84: { doignargn, "acronym", 7 }, /* TEXICMD_ACRONYM */
1.16 kristaps 85: { doaccent, "'", 1 }, /* TEXICMD_ACUTE */
1.42 kristaps 86: { dosymbol, "AE", 2 }, /* TEXICMD_AE */
87: { dosymbol, "ae", 2 }, /* TEXICMD_AESMALL */
1.1 kristaps 88: { doignbracket, "anchor", 6 }, /* TEXICMD_ANCHOR */
1.12 kristaps 89: { dosection, "appendix", 8 }, /* TEXICMD_APPENDIX */
90: { dosection, "appendixsec", 11 }, /* TEXICMD_APPENDIXSEC */
1.20 kristaps 91: { dosubsection, "appendixsubsec", 14 }, /* TEXICMD_APPENDIXSUBSEC */
1.23 kristaps 92: { dosubsubsection, "appendixsubsubsec", 17 }, /* TEXICMD_APPENDIXSUBSUBSEC */
1.25 kristaps 93: { doinline, "asis", 4 }, /* TEXICMD_ASIS */
1.3 kristaps 94: { dosymbol, "*", 1 }, /* TEXICMD_ASTERISK */
1.1 kristaps 95: { dosymbol, "@", 1 }, /* TEXICMD_AT */
1.3 kristaps 96: { doignline, "author", 6 }, /* TEXICMD_AUTHOR */
1.21 kristaps 97: { doinline, "b", 1 }, /* TEXICMD_BOLD */
1.3 kristaps 98: { dosymbol, "!", 1 }, /* TEXICMD_BANG */
1.7 kristaps 99: { dosymbol, "bullet", 6 }, /* TEXICMD_BULLET */
1.1 kristaps 100: { dobye, "bye", 3 }, /* TEXICMD_BYE */
1.34 kristaps 101: { doblock, "cartouche", 9 }, /* TEXICMD_CARTOUCHE */
102: { doaccent, ",", 1 }, /* TEXICMD_CEDILLA */
1.12 kristaps 103: { doignline, "center", 6 }, /* TEXICMD_CENTER */
104: { dosection, "chapter", 7 }, /* TEXICMD_CHAPTER */
1.1 kristaps 105: { doignline, "cindex", 6 }, /* TEXICMD_CINDEX */
1.16 kristaps 106: { doaccent, "^", 1 }, /* TEXICMD_CIRCUMFLEX */
1.24 kristaps 107: { doinline, "cite", 4 }, /* TEXICMD_CITE */
108: { dovalue, "clear", 5 }, /* TEXICMD_CLEAR */
1.21 kristaps 109: { doinline, "code", 4 }, /* TEXICMD_CODE */
1.3 kristaps 110: { dosymbol, ":", 1 }, /* TEXICMD_COLON */
1.18 kristaps 111: { NULL, "columnfractions", 15 }, /* TEXICMD_COLUMNFRACTIONS */
1.35 kristaps 112: { dosymbol, "comma", 5 }, /* TEXICMD_COMMA */
1.12 kristaps 113: { doinline, "command", 7 }, /* TEXICMD_COMMAND */
1.1 kristaps 114: { doignline, "c", 1 }, /* TEXICMD_COMMENT */
1.2 kristaps 115: { doignline, "comment", 7 }, /* TEXICMD_COMMENT_LONG */
1.1 kristaps 116: { doignline, "contents", 8 }, /* TEXICMD_CONTENTS */
117: { doignblock, "copying", 7 }, /* TEXICMD_COPYING */
118: { dosymbol, "copyright", 9 }, /* TEXICMD_COPYRIGHT */
1.27 kristaps 119: { dodefindex, "defcodeindex", 12 }, /* TEXICMD_DEFCODEINDEX */
1.15 kristaps 120: { dodefn, "deffn", 5 }, /* TEXICMD_DEFFN */
121: { dodefn, "deffnx", 6 }, /* TEXICMD_DEFFNX */
1.27 kristaps 122: { dodefindex, "defindex", 8 }, /* TEXICMD_DEFINDEX */
1.15 kristaps 123: { dodefn, "defmac", 6 }, /* TEXICMD_DEFMAC */
124: { dodefn, "defmacx", 7 }, /* TEXICMD_DEFMACX */
125: { dodefn, "deftp", 5 }, /* TEXICMD_DEFTP */
126: { dodefn, "deftpx", 6 }, /* TEXICMD_DEFTPX */
127: { dodefn, "deftypefn", 9 }, /* TEXICMD_DEFTYPEFN */
128: { dodefn, "deftypefnx", 10 }, /* TEXICMD_DEFTYPEFNX */
129: { dodefn, "deftypefun", 10 }, /* TEXICMD_DEFTYPEFUN */
130: { dodefn, "deftypefunx", 11 }, /* TEXICMD_DEFTYPEFUNX */
1.34 kristaps 131: { dodefn, "deftypemethod", 13 }, /* TEXICMD_DEFTYPEMETHOD */
132: { dodefn, "deftypemethodx", 14 }, /* TEXICMD_DEFTYPEMETHODX */
1.15 kristaps 133: { dodefn, "deftypevar", 10 }, /* TEXICMD_DEFTYPEVAR */
134: { dodefn, "deftypevarx", 11 }, /* TEXICMD_DEFTYPEVARX */
135: { dodefn, "deftypevr", 9 }, /* TEXICMD_DEFTYPEVR */
136: { dodefn, "deftypevrx", 10 }, /* TEXICMD_DEFTYPEVRX */
137: { dodefn, "defun", 5 }, /* TEXICMD_DEFUN */
138: { dodefn, "defunx", 6 }, /* TEXICMD_DEFUNX */
139: { dodefn, "defvar", 6 }, /* TEXICMD_DEFVAR */
140: { dodefn, "defvarx", 7 }, /* TEXICMD_DEFVARX */
141: { dodefn, "defvr", 5 }, /* TEXICMD_DEFVR */
142: { dodefn, "defvrx", 6 }, /* TEXICMD_DEFVRX */
1.1 kristaps 143: { doignblock, "detailmenu", 10 }, /* TEXICMD_DETAILMENU */
1.21 kristaps 144: { doinline, "dfn", 3 }, /* TEXICMD_DFN */
1.42 kristaps 145: { dosymbol, "DH", 2 }, /* TEXICMD_DH */
146: { dosymbol, "dh", 2 }, /* TEXICMD_DHSMALL */
1.1 kristaps 147: { doignline, "dircategory", 11 }, /* TEXICMD_DIRCATEGORY */
148: { doignblock, "direntry", 8 }, /* TEXICMD_DIRENTRY */
1.3 kristaps 149: { dodisplay, "display", 7 }, /* TEXICMD_DISPLAY */
1.28 kristaps 150: { doignbracket, "dmn", 3 }, /* TEXICMD_DMN */
1.40 kristaps 151: { doignblock, "documentdescription", 19 }, /* TEXICMD_DOCUMENTDESCRIPTION */
152: { doignline, "documentencoding", 16 }, /* TEXICMD_DOCUMENTENCODING */
1.44 kristaps 153: { doignline, "documentlanguage", 16 }, /* TEXICMD_DOCUMENTLANGUAGE */
1.42 kristaps 154: { doaccent, "dotaccent", 9 }, /* TEXICMD_DOTACCENT */
155: { doaccent, "dotless", 7 }, /* TEXICMD_DOTLESS */
1.2 kristaps 156: { dosymbol, "dots", 4 }, /* TEXICMD_DOTS */
1.8 kristaps 157: { dolink, "email", 5 }, /* TEXICMD_EMAIL */
1.21 kristaps 158: { doinline, "emph", 4 }, /* TEXICMD_EMPH */
1.44 kristaps 159: { doend, "end", 3 }, /* TEXICMD_END */
1.34 kristaps 160: { dosymbol, "enddots", 7 }, /* TEXICMD_ENDDOTS */
1.2 kristaps 161: { doenumerate, "enumerate", 9 }, /* TEXICMD_ENUMERATE */
1.12 kristaps 162: { doinline, "env", 3 }, /* TEXICMD_ENV */
1.28 kristaps 163: { dosymbol, "equiv", 5 }, /* TEXICMD_EQUIV */
1.15 kristaps 164: { dosymbol, "error", 5 }, /* TEXICMD_ERROR */
1.43 kristaps 165: { dosymbol, "euro", 4 }, /* TEXICMD_EURO */
1.1 kristaps 166: { doexample, "example", 7 }, /* TEXICMD_EXAMPLE */
1.42 kristaps 167: { dosymbol, "exclamdown", 10 }, /* TEXICMD_EXCLAMDOWN */
1.25 kristaps 168: { doignline, "exdent", 6 }, /* TEXICMD_EXDENT */
1.17 kristaps 169: { dosymbol, "expansion", 9 }, /* TEXICMD_EXPANSION */
1.12 kristaps 170: { doinline, "file", 4 }, /* TEXICMD_FILE */
1.17 kristaps 171: { doignline, "finalout", 8 }, /* TEXICMD_FINALOUT */
1.20 kristaps 172: { doignline, "findex", 6 }, /* TEXICMD_FINDEX */
1.44 kristaps 173: { doblock, "flushleft", 9 }, /* TEXICMD_FLUSHLEFT */
174: { doblock, "flushright", 10 }, /* TEXICMD_FLUSHRIGHT */
175: { doignline, "firstparagraphindent", 20 }, /* TEXICMD_FIRSTPARAGRAPHINDENT */
1.32 kristaps 176: { doignbracket, "footnote", 8 }, /* TEXICMD_FOOTNOTE */
1.44 kristaps 177: { doignline, "footnotestyle", 13 }, /* TEXICMD_FOOTNOTESTYLE */
1.20 kristaps 178: { dotable, "ftable", 6 }, /* TEXICMD_FTABLE */
179: { dodisplay, "format", 6 }, /* TEXICMD_FORMAT */
1.43 kristaps 180: { dosymbol, "geq", 3 }, /* TEXICMD_GEQ */
1.16 kristaps 181: { doaccent, "`", 1 }, /* TEXICMD_GRAVE */
1.3 kristaps 182: { doblock, "group", 5 }, /* TEXICMD_GROUP */
1.43 kristaps 183: { dosymbol, "guillemetleft", 13 }, /* TEXICMD_GUILLEMETLEFT */
184: { dosymbol, "guillemetright", 14 }, /* TEXICMD_GUILLEMETRIGHT */
185: { dosymbol, "guillemotleft", 13 }, /* TEXICMD_GUILLEMOTLEFT */
186: { dosymbol, "guillemotright", 14 }, /* TEXICMD_GUILLEMOTRIGHT */
187: { dosymbol, "guilsinglleft", 13 }, /* TEXICMD_GUILSINGLLEFT */
188: { dosymbol, "guilsinglright", 14 }, /* TEXICMD_GUILSINGLRIGHT */
1.42 kristaps 189: { doaccent, "H", 1 }, /* TEXICMD_H */
1.2 kristaps 190: { dosection, "heading", 7 }, /* TEXICMD_HEADING */
1.3 kristaps 191: { doignline, "headings", 8 }, /* TEXICMD_HEADINGS */
1.18 kristaps 192: { doitem, "headitem", 8 }, /* TEXICMD_HEADITEM */
1.25 kristaps 193: { doignblock, "html", 4 }, /* TEXICMD_HTML */
1.3 kristaps 194: { dosymbol, "-", 1 }, /* TEXICMD_HYPHEN */
1.21 kristaps 195: { doinline, "i", 1 }, /* TEXICMD_I */
1.24 kristaps 196: { dovalue, "ifclear", 7 }, /* TEXICMD_IFCLEAR */
1.14 kristaps 197: { doignblock, "ifdocbook", 9 }, /* TEXICMD_IFDOCBOOK */
1.1 kristaps 198: { doignblock, "ifhtml", 6 }, /* TEXICMD_IFHTML */
1.26 kristaps 199: { doblock, "ifinfo", 6 }, /* TEXICMD_IFINFO */
1.14 kristaps 200: { doblock, "ifnotdocbook", 12 }, /* TEXICMD_IFNOTDOCBOOK */
201: { doblock, "ifnothtml", 9 }, /* TEXICMD_IFNOTHTML */
202: { doblock, "ifnotinfo", 9 }, /* TEXICMD_IFNOTINFO */
203: { doignblock, "ifnotplaintext", 14 }, /* TEXICMD_IFNOTPLAINTEXT */
1.3 kristaps 204: { doblock, "ifnottex", 8 }, /* TEXICMD_IFNOTTEX */
1.14 kristaps 205: { doblock, "ifnotxml", 8 }, /* TEXICMD_IFNOTXML */
206: { doblock, "ifplaintext", 11 }, /* TEXICMD_IFPLAINTEXT */
1.1 kristaps 207: { doignblock, "iftex", 5 }, /* TEXICMD_IFTEX */
1.30 kristaps 208: { dovalue, "ifset", 5 }, /* TEXICMD_IFSET */
1.14 kristaps 209: { doignblock, "ifxml", 5 }, /* TEXICMD_IFXML */
1.17 kristaps 210: { doignblock, "ignore", 6 }, /* TEXICMD_IGNORE */
1.1 kristaps 211: { doignbracket, "image", 5 }, /* TEXICMD_IMAGE */
1.2 kristaps 212: { doinclude, "include", 7 }, /* TEXICMD_INCLUDE */
1.13 kristaps 213: { dodisplay, "indentblock", 11 }, /* TEXICMD_INDENTBLOCK */
1.44 kristaps 214: { dolink, "indicateurl", 11 }, /* TEXICMD_INDICATEURL */
215: { dolink, "inforef", 7 }, /* TEXICMD_INFOREF */
1.5 kristaps 216: { doignline, "insertcopying", 13 }, /* TEXICMD_INSERTCOPYING */
1.1 kristaps 217: { doitem, "item", 4 }, /* TEXICMD_ITEM */
218: { doitemize, "itemize", 7 }, /* TEXICMD_ITEMIZE */
1.20 kristaps 219: { doitem, "itemx", 5 }, /* TEXICMD_ITEMX */
1.21 kristaps 220: { doinline, "kbd", 3 }, /* TEXICMD_KBD */
1.18 kristaps 221: { dobracket, "key", 3 }, /* TEXICMD_KEY */
1.20 kristaps 222: { doignline, "kindex", 6 }, /* TEXICMD_KINDEX */
1.42 kristaps 223: { dosymbol, "L", 1 }, /* TEXICMD_L */
1.1 kristaps 224: { dosymbol, "LaTeX", 5 }, /* TEXICMD_LATEX */
1.43 kristaps 225: { dosymbol, "leq", 3 }, /* TEXICMD_LEQ */
1.23 kristaps 226: { dosecoffs, "lowersections", 13 }, /* TEXICMD_LOWERSECTIONS */
1.42 kristaps 227: { dosymbol, "l", 1 }, /* TEXICMD_LSMALL */
1.30 kristaps 228: { domacro, "macro", 5 }, /* TEXICMD_MACRO */
1.42 kristaps 229: { doaccent, "=", 1 }, /* TEXICMD_MACRON */
1.3 kristaps 230: { domath, "math", 4 }, /* TEXICMD_MATH */
1.1 kristaps 231: { doignblock, "menu", 4 }, /* TEXICMD_MENU */
1.25 kristaps 232: { dosymbol, "minus", 5 }, /* TEXICMD_MINUS */
1.18 kristaps 233: { domultitable, "multitable", 10 }, /* TEXICMD_MULTITABLE */
1.15 kristaps 234: { doignline, "need", 4 }, /* TEXICMD_NEED */
1.3 kristaps 235: { dosymbol, "\n", 1 }, /* TEXICMD_NEWLINE */
1.1 kristaps 236: { doignline, "node", 4 }, /* TEXICMD_NODE */
1.3 kristaps 237: { doignline, "noindent", 8 }, /* TEXICMD_NOINDENT */
1.42 kristaps 238: { dosymbol, "O", 1 }, /* TEXICMD_O */
239: { dosymbol, "OE", 2 }, /* TEXICMD_OE */
240: { dosymbol, "oe", 2 }, /* TEXICMD_OESMALL */
241: { doaccent, "ogonek", 6 }, /* TEXICMD_OGONEK */
1.16 kristaps 242: { doinline, "option", 6 }, /* TEXICMD_OPTION */
1.42 kristaps 243: { dosymbol, "ordf", 4 }, /* TEXICMD_ORDF */
244: { dosymbol, "ordm", 4 }, /* TEXICMD_ORDM */
245: { dosymbol, "o", 1 }, /* TEXICMD_OSMALL */
1.3 kristaps 246: { doignline, "page", 4 }, /* TEXICMD_PAGE */
1.25 kristaps 247: { doignline, "paragraphindent", 15 }, /* TEXICMD_PARINDENT */
248: { dosymbol, ".", 1 }, /* TEXICMD_PERIOD */
1.28 kristaps 249: { doignline, "pindex", 6 }, /* TEXICMD_PINDEX */
1.43 kristaps 250: { dosymbol, "pounds", 6 }, /* TEXICMD_POUNDS */
1.2 kristaps 251: { doignline, "printindex", 10 }, /* TEXICMD_PRINTINDEX */
1.42 kristaps 252: { dolink, "pxref", 5 }, /* TEXICMD_PXREF */
253: { dosymbol, "questiondown", 12 }, /* TEXICMD_QUESTIONDOWN */
254: { dosymbol, "?", 1 }, /* TEXICMD_QUESTIONMARK */
255: { doquotation, "quotation", 9 }, /* TEXICMD_QUOTATION */
1.43 kristaps 256: { dosymbol, "quotedblbase", 12 }, /* TEXICMD_QUOTEDBLBASE */
257: { dosymbol, "quotedblleft", 12 }, /* TEXICMD_QUOTEDBLLEFT */
258: { dosymbol, "quotedblright", 13 }, /* TEXICMD_QUOTEDBLRIGHT */
259: { dosymbol, "quotesinglbase", 14 }, /* TEXICMD_QUOTESINGLBASE */
260: { dosymbol, "quoteleft", 9 }, /* TEXICMD_QUOTELEFT */
261: { dosymbol, "quoteright", 10 }, /* TEXICMD_QUOTERIGHT */
1.21 kristaps 262: { doinline, "r", 1 }, /* TEXICMD_R */
1.23 kristaps 263: { dosecoffs, "raisesections", 13 }, /* TEXICMD_RAISESECTIONS */
1.1 kristaps 264: { dobracket, "ref", 3 }, /* TEXICMD_REF */
1.28 kristaps 265: { doignline, "refill", 6 }, /* TEXICMD_REFILL */
1.43 kristaps 266: { dosymbol, "registeredsymbol", 16 }, /* TEXICMD_REGISTEREDSYMBOL */
1.15 kristaps 267: { dosymbol, "result", 6 }, /* TEXICMD_RESULT */
1.42 kristaps 268: { doaccent, "ringaccent", 10 }, /* TEXICMD_RINGACCENT */
1.21 kristaps 269: { doinline, "samp", 4 }, /* TEXICMD_SAMP */
270: { doinline, "sansserif", 9 }, /* TEXICMD_SANSSERIF */
1.7 kristaps 271: { dobracket, "sc", 2 }, /* TEXICMD_SC */
1.1 kristaps 272: { dosection, "section", 7 }, /* TEXICMD_SECTION */
1.24 kristaps 273: { dovalue, "set", 3 }, /* TEXICMD_SET */
1.1 kristaps 274: { doignline, "setchapternewpage", 17 }, /* TEXICMD_SETCHAPNEWPAGE */
1.35 kristaps 275: { doignline, "setcontentsaftertitlepage", 25 }, /* TEXICMD_SETCONTENTSAFTER */
1.1 kristaps 276: { doignline, "setfilename", 11 }, /* TEXICMD_SETFILENAME */
1.10 kristaps 277: { dotitle, "settitle", 8 }, /* TEXICMD_SETTITLE */
1.25 kristaps 278: { doignline, "shortcontents", 13 }, /* TEXICMD_SHORTCONTENTS */
1.21 kristaps 279: { doinline, "slanted", 7 }, /* TEXICMD_SLANTED */
1.34 kristaps 280: { dosymbol, "/", 1 }, /* TEXICMD_SLASH */
1.3 kristaps 281: { dosp, "sp", 2 }, /* TEXICMD_SP */
282: { dosymbol, " ", 1 }, /* TEXICMD_SPACE */
1.17 kristaps 283: { doignline, "smallbook", 9 }, /* TEXICMD_SMALLBOOK */
1.12 kristaps 284: { dodisplay, "smalldisplay", 12 }, /* TEXICMD_SMALLDISPLAY */
1.3 kristaps 285: { doexample, "smallexample", 12 }, /* TEXICMD_SMALLEXAMPLE */
1.20 kristaps 286: { dodisplay, "smallformat", 11 }, /* TEXICMD_SMALLFORMAT */
1.13 kristaps 287: { dodisplay, "smallindentblock", 16 }, /* TEXICMD_SMALLINDENTBLOCK */
1.3 kristaps 288: { dosymbol, "{", 1 }, /* TEXICMD_SQUIGGLE_LEFT */
289: { dosymbol, "}", 1 }, /* TEXICMD_SQUIGGLE_RIGHT */
1.35 kristaps 290: { dosymbol, "ss", 2 }, /* TEXICMD_SS */
1.21 kristaps 291: { doinline, "strong", 6 }, /* TEXICMD_STRONG */
1.20 kristaps 292: { dosubsection, "subheading", 10 }, /* TEXICMD_SUBHEADING */
1.1 kristaps 293: { dosubsection, "subsection", 10 }, /* TEXICMD_SUBSECTION */
1.28 kristaps 294: { dosubsubsection, "subsubheading", 13 }, /* TEXICMD_SUBSUBHEADING */
1.23 kristaps 295: { dosubsubsection, "subsubsection", 13 }, /* TEXICMD_SUBSUBSECTION */
1.3 kristaps 296: { doignline, "subtitle", 8 }, /* TEXICMD_SUBTITLE */
1.25 kristaps 297: { doignline, "summarycontents", 15 }, /* TEXICMD_SUMMARYCONTENTS */
1.50 kristaps 298: { dodefindex, "synindex", 8 }, /* TEXICMD_SYNINDEX */
299: { dodefindex, "syncodeindex", 12 }, /* TEXICMD_SYNCODEINDEX */
1.21 kristaps 300: { doinline, "t", 1 }, /* TEXICMD_T */
1.18 kristaps 301: { dotab, "tab", 3 }, /* TEXICMD_TAB */
302: { dosymbol, "\t", 1 }, /* TEXICMD_TABSYM */
1.1 kristaps 303: { dotable, "table", 5 }, /* TEXICMD_TABLE */
304: { doignblock, "tex", 3 }, /* TEXICMD_TEX */
305: { dosymbol, "TeX", 3 }, /* TEXICMD_TEXSYM */
1.43 kristaps 306: { dosymbol, "textdegree", 10 }, /* TEXICMD_TEXTDEGREE */
1.42 kristaps 307: { dosymbol, "TH", 2 }, /* TEXICMD_TH */
308: { dosymbol, "th", 2 }, /* TEXICMD_THSMALL */
1.35 kristaps 309: { dosymbol, "tie", 3 }, /* TEXICMD_TIE */
1.42 kristaps 310: { doaccent, "tieaccent", 9 }, /* TEXICMD_TIEACCENT */
1.16 kristaps 311: { doaccent, "~", 1 }, /* TEXICMD_TILDE */
1.25 kristaps 312: { doignline, "tindex", 6 }, /* TEXICMD_TINDEX */
1.3 kristaps 313: { doignline, "title", 5 }, /* TEXICMD_TITLE */
1.1 kristaps 314: { dobracket, "titlefont", 9 }, /* TEXICMD_TITLEFONT */
315: { doignblock, "titlepage", 9 }, /* TEXICMD_TITLEPAGE */
316: { dotop, "top", 3 }, /* TEXICMD_TOP */
1.42 kristaps 317: { doaccent, "u", 1 }, /* TEXICMD_U */
318: { doaccent, "ubaraccent", 10 }, /* TEXICMD_UBARACCENT */
319: { doaccent, "udotaccent", 10 }, /* TEXICMD_UDOTACCENT */
1.16 kristaps 320: { doaccent, "\"", 1 }, /* TEXICMD_UMLAUT */
1.12 kristaps 321: { dosection, "unnumbered", 10 }, /* TEXICMD_UNNUMBERED */
1.2 kristaps 322: { dosection, "unnumberedsec", 13 }, /* TEXICMD_UNNUMBEREDSEC */
1.20 kristaps 323: { dosubsection, "unnumberedsubsec", 16 }, /* TEXICMD_UNNUMBEREDSUBSEC */
1.23 kristaps 324: { dosubsubsection, "unnumberedsubsubsec", 19 }, /* TEXICMD_UNNUMBEREDSUBSUBSEC */
1.8 kristaps 325: { dolink, "uref", 4 }, /* TEXICMD_UREF */
326: { dolink, "url", 3 }, /* TEXICMD_URL */
1.34 kristaps 327: { doignline, "", 0 }, /* TEXICMD_USER_INDEX */
1.42 kristaps 328: { doaccent, "v", 1 }, /* TEXICMD_V */
1.24 kristaps 329: { dovalue, "value", 5 }, /* TEXICMD_VALUE */
1.12 kristaps 330: { doinline, "var", 3 }, /* TEXICMD_VAR */
1.33 kristaps 331: { doverb, "verb", 4 }, /* TEXICMD_VERB */
332: { doverbatim, "verbatim", 8 }, /* TEXICMD_VERBATIM */
1.16 kristaps 333: { doverbinclude, "verbatiminclude", 15 }, /* TEXICMD_VERBATIMINCLUDE */
1.18 kristaps 334: { doignline, "vindex", 6 }, /* TEXICMD_VINDEX */
1.9 kristaps 335: { dosp, "vskip", 5 }, /* TEXICMD_VSKIP */
1.20 kristaps 336: { dotable, "vtable", 6 }, /* TEXICMD_VTABLE */
1.3 kristaps 337: { dobracket, "w", 1 }, /* TEXICMD_W */
1.8 kristaps 338: { dolink, "xref", 4 }, /* TEXICMD_XREF */
1.20 kristaps 339: /* TEXICMD__END */
1.1 kristaps 340: };
341:
/*
 * Externally visible, read-only pointer to the static command table
 * above; the handlers in this file look commands up as texitoks[cmd].
 * NOTE(review): presumably declared in extern.h for the other
 * translation units -- confirm.
 */
1.24 kristaps 342: const struct texitok *const texitoks = __texitoks;
1.18 kristaps 343:
1.2 kristaps 344: static void
1.46 kristaps 345: dodefindex(struct texi *p, enum texicmd cmd, size_t *pos)
1.27 kristaps 346: {
347: size_t start, end;
348: char *cp;
349:
1.46 kristaps 350: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
351: advance(p, pos);
1.27 kristaps 352:
353: start = end = *pos;
1.46 kristaps 354: while (end < BUFSZ(p) && ! ismspace(BUF(p)[end]))
1.27 kristaps 355: end++;
356:
357: if (start == end) {
1.46 kristaps 358: advanceeoln(p, pos, 1);
1.27 kristaps 359: return;
360: } else if (NULL == (cp = malloc(end - start + 1)))
361: texiabort(p, NULL);
362:
1.46 kristaps 363: memcpy(cp, &BUF(p)[start], end - start);
1.27 kristaps 364: cp[end - start] = '\0';
365:
366: p->indexs = realloc(p->indexs,
367: sizeof(char *) * (p->indexsz + 1));
368:
369: if (NULL == p->indexs)
370: texiabort(p, NULL);
371: p->indexs[p->indexsz++] = cp;
372: }
373:
374: static void
1.46 kristaps 375: dodefn(struct texi *p, enum texicmd cmd, size_t *pos)
1.3 kristaps 376: {
377: const char *blk;
378:
1.5 kristaps 379: blk = NULL;
1.3 kristaps 380: switch (cmd) {
1.15 kristaps 381: case (TEXICMD_DEFFN):
1.35 kristaps 382: case (TEXICMD_DEFMAC):
1.15 kristaps 383: case (TEXICMD_DEFTP):
1.3 kristaps 384: case (TEXICMD_DEFTYPEFN):
385: case (TEXICMD_DEFTYPEFUN):
1.34 kristaps 386: case (TEXICMD_DEFTYPEMETHOD):
1.15 kristaps 387: case (TEXICMD_DEFTYPEVAR):
388: case (TEXICMD_DEFTYPEVR):
389: case (TEXICMD_DEFUN):
390: case (TEXICMD_DEFVAR):
391: case (TEXICMD_DEFVR):
1.5 kristaps 392: blk = texitoks[cmd].tok;
1.3 kristaps 393: break;
1.5 kristaps 394: default:
1.3 kristaps 395: break;
396: }
397:
398: if (p->ign) {
1.15 kristaps 399: NULL != blk ?
1.46 kristaps 400: parseto(p, pos, blk) :
401: parseeoln(p, pos);
1.3 kristaps 402: return;
403: }
404:
1.15 kristaps 405: if (NULL != blk)
406: texivspace(p);
407:
1.3 kristaps 408: switch (cmd) {
1.34 kristaps 409: case (TEXICMD_DEFTYPEMETHOD):
410: case (TEXICMD_DEFTYPEMETHODX):
411: texiputchars(p, "Method");
412: break;
1.15 kristaps 413: case (TEXICMD_DEFMAC):
414: case (TEXICMD_DEFMACX):
415: texiputchars(p, "Macro");
416: break;
417: case (TEXICMD_DEFTYPEVAR):
418: case (TEXICMD_DEFTYPEVARX):
419: case (TEXICMD_DEFVAR):
420: case (TEXICMD_DEFVARX):
421: texiputchars(p, "Variable");
422: break;
1.3 kristaps 423: case (TEXICMD_DEFTYPEFUN):
1.15 kristaps 424: case (TEXICMD_DEFTYPEFUNX):
425: case (TEXICMD_DEFUN):
426: case (TEXICMD_DEFUNX):
427: texiputchars(p, "Function");
1.3 kristaps 428: break;
429: default:
1.46 kristaps 430: parselinearg(p, pos);
1.3 kristaps 431: break;
432: }
1.15 kristaps 433:
1.48 kristaps 434: texiputchar(p, ':');
435: texiputchar(p, '\n');
1.15 kristaps 436:
437: switch (cmd) {
438: case (TEXICMD_DEFMAC):
439: case (TEXICMD_DEFMACX):
440: teximacroopen(p, "Dv");
1.46 kristaps 441: while (parselinearg(p, pos))
1.15 kristaps 442: /* Spin. */ ;
443: teximacroclose(p);
444: break;
445: case (TEXICMD_DEFFN):
446: case (TEXICMD_DEFFNX):
447: case (TEXICMD_DEFUN):
448: case (TEXICMD_DEFUNX):
449: teximacroopen(p, "Fo");
1.46 kristaps 450: parselinearg(p, pos);
1.15 kristaps 451: teximacroclose(p);
452: teximacroopen(p, "Fa");
1.46 kristaps 453: while (parselinearg(p, pos))
1.15 kristaps 454: /* Spin. */ ;
455: teximacroclose(p);
456: teximacro(p, "Fc");
457: break;
458: case (TEXICMD_DEFTYPEFUN):
459: case (TEXICMD_DEFTYPEFUNX):
460: case (TEXICMD_DEFTYPEFN):
461: case (TEXICMD_DEFTYPEFNX):
1.34 kristaps 462: case (TEXICMD_DEFTYPEMETHOD):
463: case (TEXICMD_DEFTYPEMETHODX):
1.15 kristaps 464: teximacroopen(p, "Ft");
1.46 kristaps 465: parselinearg(p, pos);
1.15 kristaps 466: teximacroclose(p);
467: teximacroopen(p, "Fo");
1.46 kristaps 468: parselinearg(p, pos);
1.15 kristaps 469: teximacroclose(p);
470: teximacroopen(p, "Fa");
1.46 kristaps 471: while (parselinearg(p, pos))
1.15 kristaps 472: /* Spin. */ ;
473: teximacroclose(p);
474: teximacro(p, "Fc");
475: break;
476: case (TEXICMD_DEFTP):
477: case (TEXICMD_DEFTPX):
478: case (TEXICMD_DEFTYPEVAR):
479: case (TEXICMD_DEFTYPEVARX):
480: case (TEXICMD_DEFTYPEVR):
481: case (TEXICMD_DEFTYPEVRX):
482: teximacroopen(p, "Vt");
1.46 kristaps 483: while (parselinearg(p, pos))
1.15 kristaps 484: /* Spin. */ ;
485: teximacroclose(p);
486: break;
487: case (TEXICMD_DEFVAR):
488: case (TEXICMD_DEFVARX):
489: case (TEXICMD_DEFVR):
490: case (TEXICMD_DEFVRX):
491: teximacroopen(p, "Va");
1.46 kristaps 492: while (parselinearg(p, pos))
1.15 kristaps 493: /* Spin. */ ;
494: teximacroclose(p);
495: break;
496: default:
497: abort();
1.3 kristaps 498: }
1.15 kristaps 499:
1.54 kristaps 500: if (NULL == blk)
501: return;
502:
503: /*
504: * All "block" definitions have their block bodies indented
505: * unless they have the "x" form of the command following.
506: * E.g.,
507: * @deffn some function
508: * @deffnx another
509: * An explanation.
510: * @end deffn
511: * With this loop, we delay opening the indented block until we
512: * skipped past conformant macros.
513: */
514: for (;;) {
515: switch (peekcmd(p, *pos)) {
516: case (TEXICMD_DEFFNX):
517: case (TEXICMD_DEFMACX):
518: case (TEXICMD_DEFTPX):
519: case (TEXICMD_DEFTYPEFNX):
520: case (TEXICMD_DEFTYPEFUNX):
521: case (TEXICMD_DEFTYPEMETHODX):
522: case (TEXICMD_DEFTYPEVARX):
523: case (TEXICMD_DEFTYPEVRX):
524: case (TEXICMD_DEFUNX):
525: case (TEXICMD_DEFVARX):
526: case (TEXICMD_DEFVRX):
527: texivspace(p);
528: parseeoln(p, pos);
529: continue;
530: default:
531: break;
532: }
533: break;
534: }
535: teximacro(p, "Bd -filled -offset indent");
536: p->seenvs = 1;
537: parseto(p, pos, blk);
538: teximacro(p, "Ed");
1.3 kristaps 539: }
540:
541: static void
1.46 kristaps 542: domacro(struct texi *p, enum texicmd cmd, size_t *pos)
1.30 kristaps 543: {
544: size_t start, end, endtoksz, len;
545: struct teximacro m;
546: const char *endtok, *blk;
547:
548: memset(&m, 0, sizeof(struct teximacro));
549:
1.46 kristaps 550: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
551: advance(p, pos);
1.30 kristaps 552:
1.46 kristaps 553: for (start = end = *pos; end < BUFSZ(p); end++)
554: if (ismspace(BUF(p)[end]) || '{' == BUF(p)[end])
1.30 kristaps 555: break;
556:
557: if (start == end)
558: texierr(p, "zero-length macro name");
559:
1.46 kristaps 560: advanceto(p, pos, end);
1.30 kristaps 561:
562: m.key = malloc(end - start + 1);
563: if (NULL == m.key)
564: texiabort(p, NULL);
1.46 kristaps 565: memcpy(m.key, &BUF(p)[start], end - start);
1.30 kristaps 566: m.key[end - start] = '\0';
567:
1.46 kristaps 568: m.args = argparse(p, pos, &m.argsz, 0);
1.30 kristaps 569:
1.46 kristaps 570: /* Note: we advance to the beginning of the macro. */
571: advanceeoln(p, pos, 1);
572:
573: /*
574: * According to the Texinfo manual, the macro ends on the
575: * newline subsequent the @end macro.
576: * That's COMPLETELY FUCKING WRONG.
577: * It ends inclusive the newline, which is why so many macros
578: * say things like @r{hello}@c, where the subsequent @c swallows
579: * the newline.
580: * However, it does swallow the leading newline, so look for the
581: * @end macro without the leading newline else we might look
582: * past empty macros.
583: */
1.30 kristaps 584: start = *pos;
1.46 kristaps 585: endtok = "@end macro\n";
1.30 kristaps 586: endtoksz = strlen(endtok);
1.46 kristaps 587: blk = memmem(&BUF(p)[start], BUFSZ(p) - start, endtok, endtoksz);
1.30 kristaps 588: if (NULL == blk)
589: texierr(p, "unterminated macro body");
1.46 kristaps 590: /* Roll us back one character. */
591: while (&BUF(p)[*pos] != blk)
592: advance(p, pos);
593: assert('@' == BUF(p)[*pos]);
594: if ('\n' != BUF(p)[*pos - 1])
595: texierr(p, "cannot handle @end macro in-line");
596:
597: len = blk - &BUF(p)[start];
1.30 kristaps 598: m.value = malloc(len + 1);
599: if (NULL == m.value)
600: texiabort(p, NULL);
1.46 kristaps 601: memcpy(m.value, &BUF(p)[start], len);
1.30 kristaps 602: m.value[len] = '\0';
603:
604: p->macros = realloc
605: (p->macros,
606: (p->macrosz + 1) *
607: sizeof(struct teximacro));
608: if (NULL == p->macros)
609: texiabort(p, NULL);
610:
611: p->macros[p->macrosz++] = m;
1.46 kristaps 612: advanceeoln(p, pos, 1);
1.30 kristaps 613: }
614:
615: static void
1.46 kristaps 616: doignblock(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 617: {
1.45 kristaps 618: char end[32], start[32];
619: const char *endt, *startt;
620: size_t esz, ssz, newpos, stack;
1.26 kristaps 621:
622: /*
1.45 kristaps 623: * FIXME: this is cheating.
624: * These tokens are supposed to begin on a newline.
625: * However, if we do that, then we would need to check within
626: * the loop for trailer (or leading, as the case may be)
627: * newline, and that's just a bit too complicated right now.
628: * This is becasue
629: * @ifset BAR
630: * @ifset FOO
631: * @end ifset
632: * @end ifset
633: * won't work right now: we'd read after the first "@end ifset"
634: * to the next line, then look for the next line after that.
1.26 kristaps 635: */
1.45 kristaps 636: ssz = snprintf(start, sizeof(start),
637: "@%s", texitoks[cmd].tok);
638: assert(ssz < sizeof(start));
639: esz = snprintf(end, sizeof(end),
640: "@end %s\n", texitoks[cmd].tok);
641: assert(esz < sizeof(end));
642: stack = 1;
643:
644: /*
645: * Here we look for the end token "end" somewhere in the file in
646: * front of us.
647: * It's not that easy, of course: if we have a nested block,
648: * then there'll be an "end" token of the same kind between us.
649: * Thus, we keep track of scopes for matching "end" blocks.
1.26 kristaps 650: */
1.46 kristaps 651: while (stack > 0 && *pos < BUFSZ(p)) {
1.52 kristaps 652: if (stack > 64)
653: texierr(p, "run-away nested stack?");
1.46 kristaps 654: endt = memmem(&BUF(p)[*pos], BUFSZ(p) - *pos, end, esz);
655: startt = memmem(&BUF(p)[*pos], BUFSZ(p) - *pos, start, ssz);
1.45 kristaps 656: if (NULL == endt) {
657: texiwarn(p, "unterminated \"%s\" "
658: "block", texitoks[cmd].tok);
1.46 kristaps 659: *pos = BUFSZ(p);
1.45 kristaps 660: break;
661: }
1.26 kristaps 662:
1.45 kristaps 663: newpos = *pos;
664: if (NULL == startt || startt > endt) {
1.46 kristaps 665: newpos += esz + (size_t)(endt - &BUF(p)[*pos]);
1.45 kristaps 666: stack--;
667: } else {
1.46 kristaps 668: newpos += ssz + (size_t)(startt - &BUF(p)[*pos]);
1.45 kristaps 669: stack++;
670: }
671:
1.46 kristaps 672: assert(newpos <= BUFSZ(p));
1.45 kristaps 673: while (*pos < newpos)
1.46 kristaps 674: advance(p, pos);
1.45 kristaps 675: }
1.1 kristaps 676: }
677:
678: static void
1.46 kristaps 679: doblock(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 680: {
681:
1.46 kristaps 682: parseto(p, pos, texitoks[cmd].tok);
1.1 kristaps 683: }
684:
685: static void
1.46 kristaps 686: doinline(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 687: {
1.21 kristaps 688: const char *macro = NULL;
1.12 kristaps 689:
690: switch (cmd) {
1.21 kristaps 691: case (TEXICMD_CODE):
692: case (TEXICMD_KBD):
693: case (TEXICMD_SAMP):
694: case (TEXICMD_T):
695: macro = "Li";
696: break;
697: case (TEXICMD_CITE):
698: case (TEXICMD_DFN):
699: case (TEXICMD_EMPH):
700: case (TEXICMD_I):
701: case (TEXICMD_SLANTED):
702: macro = "Em";
703: break;
704: case (TEXICMD_B):
705: case (TEXICMD_STRONG):
706: macro = "Sy";
707: break;
1.12 kristaps 708: case (TEXICMD_COMMAND):
709: macro = "Xr";
710: break;
711: case (TEXICMD_ENV):
712: macro = "Ev";
713: break;
714: case (TEXICMD_FILE):
715: macro = "Pa";
716: break;
1.16 kristaps 717: case (TEXICMD_OPTION):
718: macro = "Op";
719: break;
1.12 kristaps 720: case (TEXICMD_VAR):
721: macro = "Va";
722: break;
723: default:
1.22 kristaps 724: break;
1.12 kristaps 725: }
726:
1.25 kristaps 727: if (NULL == macro || p->literal || TEXILIST_TABLE == p->list) {
1.53 kristaps 728: parsebracket(p, pos, 0);
1.12 kristaps 729: return;
730: }
1.1 kristaps 731:
1.5 kristaps 732: teximacroopen(p, macro);
1.1 kristaps 733: p->seenws = 0;
1.53 kristaps 734: parsebracket(p, pos, 0);
1.46 kristaps 735: texipunctuate(p, pos);
1.5 kristaps 736: teximacroclose(p);
1.1 kristaps 737: }
738:
739: static void
1.46 kristaps 740: doverb(struct texi *p, enum texicmd cmd, size_t *pos)
1.33 kristaps 741: {
742: char delim;
1.34 kristaps 743: size_t start;
1.33 kristaps 744:
1.46 kristaps 745: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
746: advance(p, pos);
747: if (*pos == BUFSZ(p) || '{' != BUF(p)[*pos])
1.33 kristaps 748: return;
1.46 kristaps 749: advance(p, pos);
750: if (*pos == BUFSZ(p))
1.33 kristaps 751: return;
752:
1.46 kristaps 753: delim = BUF(p)[*pos];
754: advance(p, pos);
1.33 kristaps 755: /* Make sure we flush out our initial whitespace... */
756: if (p->seenws && p->outcol && 0 == p->literal)
757: texiputchar(p, ' ');
758: p->seenws = 0;
1.34 kristaps 759: start = *pos;
1.33 kristaps 760: /* Read until we see the delimiter then end-brace. */
1.46 kristaps 761: while (*pos < BUFSZ(p) - 1) {
762: if (BUF(p)[*pos] == delim && BUF(p)[*pos + 1] == '}')
1.33 kristaps 763: break;
1.46 kristaps 764: advance(p, pos);
1.33 kristaps 765: }
1.51 kristaps 766: if (*pos >= BUFSZ(p) - 1)
1.33 kristaps 767: return;
1.46 kristaps 768: texiputbuf(p, start, *pos);
1.34 kristaps 769:
1.33 kristaps 770: /* Make sure we read after the end-brace. */
1.46 kristaps 771: assert(delim == BUF(p)[*pos]);
772: advance(p, pos);
773: assert('}' == BUF(p)[*pos]);
774: advance(p, pos);
1.33 kristaps 775: }
776:
777: static void
1.46 kristaps 778: doverbatim(struct texi *p, enum texicmd cmd, size_t *pos)
1.25 kristaps 779: {
780: const char *end, *term;
781: size_t endsz, endpos;
782:
1.45 kristaps 783: /* We read from the @verbatim\n newline inclusive! */
1.25 kristaps 784: end = "\n@end verbatim\n";
785: endsz = strlen(end);
1.46 kristaps 786: advanceeoln(p, pos, 0);
787: if (*pos == BUFSZ(p)) {
1.45 kristaps 788: texiwarn(p, "unexpected end of file");
789: return;
790: }
1.25 kristaps 791:
1.46 kristaps 792: term = memmem(&BUF(p)[*pos], BUFSZ(p) - *pos, end, endsz);
1.45 kristaps 793: if (NULL == term) {
794: texiwarn(p, "unterminated verbatim block");
1.46 kristaps 795: endpos = BUFSZ(p);
1.45 kristaps 796: } else
1.46 kristaps 797: endpos = *pos + (size_t)(term - &BUF(p)[*pos]);
1.25 kristaps 798:
1.46 kristaps 799: assert(endpos <= BUFSZ(p));
800: assert('\n' == BUF(p)[*pos]);
801: advance(p, pos);
1.25 kristaps 802: teximacro(p, "Bd -literal -offset indent");
1.26 kristaps 803: while (*pos < endpos) {
1.46 kristaps 804: texiputchar(p, BUF(p)[*pos]);
805: advance(p, pos);
1.25 kristaps 806: }
807: teximacro(p, "Ed");
1.46 kristaps 808: if (*pos < BUFSZ(p))
809: advanceto(p, pos, endpos + endsz);
1.25 kristaps 810: }
811:
812: static void
1.46 kristaps 813: doverbinclude(struct texi *p, enum texicmd cmd, size_t *pos)
1.16 kristaps 814: {
1.25 kristaps 815: char fname[PATH_MAX], path[PATH_MAX];
816: int rc;
817: size_t i, end;
818: const char *v;
819: enum texicmd type;
1.16 kristaps 820:
1.46 kristaps 821: while (*pos < BUFSZ(p) && ' ' == BUF(p)[*pos])
822: advance(p, pos);
1.16 kristaps 823:
1.46 kristaps 824: for (i = 0; *pos < BUFSZ(p) && '\n' != BUF(p)[*pos]; ) {
1.16 kristaps 825: if (i == sizeof(fname) - 1)
826: break;
1.46 kristaps 827: if ('@' != BUF(p)[*pos]) {
828: fname[i++] = BUF(p)[*pos];
829: advance(p, pos);
1.25 kristaps 830: continue;
831: }
1.46 kristaps 832: type = texicmd(p, *pos, &end, NULL);
833: advanceto(p, pos, end);
1.25 kristaps 834: if (TEXICMD_VALUE != type)
835: texierr(p, "unknown verbatiminclude command");
1.46 kristaps 836: v = valueblookup(p, pos);
1.25 kristaps 837: if (NULL == v)
838: continue;
839: while ('\0' != *v) {
840: if (i == sizeof(fname) - 1)
841: break;
842: fname[i++] = *v++;
843: }
844: if ('\0' != *v)
845: break;
1.16 kristaps 846: }
847:
848: if (i == 0)
849: texierr(p, "path too short");
1.46 kristaps 850: else if ('\n' != BUF(p)[*pos])
1.16 kristaps 851: texierr(p, "path too long");
852: else if ('/' == fname[0])
853: texierr(p, "no absolute paths");
854: fname[i] = '\0';
855:
856: if (strstr(fname, "../") || strstr(fname, "/.."))
857: texierr(p, "insecure path");
858:
859: rc = snprintf(path, sizeof(path),
860: "%s/%s", p->dirs[0], fname);
861: if (rc < 0)
862: texierr(p, "couldn't format path");
863: else if ((size_t)rc >= sizeof(path))
864: texierr(p, "path too long");
865:
866: parsefile(p, path, 0);
867: }
868:
869: static void
1.46 kristaps 870: doinclude(struct texi *p, enum texicmd cmd, size_t *pos)
1.2 kristaps 871: {
1.25 kristaps 872: char fname[PATH_MAX], path[PATH_MAX];
873: size_t i, end;
874: int rc;
875: const char *v;
876: enum texicmd type;
1.2 kristaps 877:
1.46 kristaps 878: while (*pos < BUFSZ(p) && ' ' == BUF(p)[*pos])
879: advance(p, pos);
1.2 kristaps 880:
881: /* Read in the filename. */
1.46 kristaps 882: for (i = 0; *pos < BUFSZ(p) && '\n' != BUF(p)[*pos]; ) {
1.2 kristaps 883: if (i == sizeof(fname) - 1)
884: break;
1.46 kristaps 885: if ('@' != BUF(p)[*pos]) {
886: fname[i++] = BUF(p)[*pos];
887: advance(p, pos);
1.25 kristaps 888: continue;
889: }
1.46 kristaps 890: type = texicmd(p, *pos, &end, NULL);
891: advanceto(p, pos, end);
1.25 kristaps 892: if (TEXICMD_VALUE != type)
893: texierr(p, "unknown include command");
1.46 kristaps 894: v = valueblookup(p, pos);
1.25 kristaps 895: if (NULL == v)
896: continue;
897: while ('\0' != *v) {
898: if (i == sizeof(fname) - 1)
899: break;
900: fname[i++] = *v++;
901: }
902: if ('\0' != *v)
903: break;
1.2 kristaps 904: }
905:
906: if (i == 0)
907: texierr(p, "path too short");
1.46 kristaps 908: else if ('\n' != BUF(p)[*pos])
1.2 kristaps 909: texierr(p, "path too long");
910: else if ('/' == fname[0])
911: texierr(p, "no absolute paths");
912: fname[i] = '\0';
913:
914: if (strstr(fname, "../") || strstr(fname, "/.."))
915: texierr(p, "insecure path");
916:
1.5 kristaps 917: for (i = 0; i < p->dirsz; i++) {
918: rc = snprintf(path, sizeof(path),
919: "%s/%s", p->dirs[i], fname);
920: if (rc < 0)
921: texierr(p, "couldn't format path");
922: else if ((size_t)rc >= sizeof(path))
923: texierr(p, "path too long");
924: else if (-1 == access(path, R_OK))
925: continue;
926:
1.16 kristaps 927: parsefile(p, path, 1);
1.5 kristaps 928: return;
929: }
1.2 kristaps 930:
1.5 kristaps 931: texierr(p, "couldn't find %s in includes", fname);
1.2 kristaps 932: }
933:
934: static void
1.46 kristaps 935: dobracket(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 936: {
937:
1.53 kristaps 938: parsebracket(p, pos, 0);
1.1 kristaps 939: }
940:
941: static void
1.46 kristaps 942: dodisplay(struct texi *p, enum texicmd cmd, size_t *pos)
1.3 kristaps 943: {
944:
1.20 kristaps 945: switch (cmd) {
946: case (TEXICMD_FORMAT):
947: case (TEXICMD_SMALLFORMAT):
948: teximacro(p, "Bd -filled");
949: break;
950: default:
951: teximacro(p, "Bd -filled -offset indent");
952: break;
953: }
954:
1.11 kristaps 955: p->seenvs = 1;
1.12 kristaps 956: /* FIXME: ignore and parseeoln. */
1.46 kristaps 957: advanceeoln(p, pos, 1);
958: parseto(p, pos, texitoks[cmd].tok);
1.5 kristaps 959: teximacro(p, "Ed");
1.3 kristaps 960: }
961:
962: static void
1.46 kristaps 963: doexample(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 964: {
965:
1.5 kristaps 966: teximacro(p, "Bd -literal -offset indent");
1.12 kristaps 967: /* FIXME: ignore and parseeoln. */
1.46 kristaps 968: advanceeoln(p, pos, 1);
1.3 kristaps 969: p->literal++;
1.46 kristaps 970: parseto(p, pos, texitoks[cmd].tok);
1.3 kristaps 971: p->literal--;
1.5 kristaps 972: teximacro(p, "Ed");
1.1 kristaps 973: }
974:
975: static void
1.46 kristaps 976: dobye(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 977: {
978:
979: texiexit(p);
980: exit(EXIT_SUCCESS);
981: }
982:
983: static void
1.46 kristaps 984: dotitle(struct texi *p, enum texicmd cmd, size_t *pos)
1.10 kristaps 985: {
986: size_t start, end;
987:
1.46 kristaps 988: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
989: advance(p, pos);
1.10 kristaps 990: start = end = *pos;
1.46 kristaps 991: while (end < BUFSZ(p) && '\n' != BUF(p)[end])
1.10 kristaps 992: end++;
1.46 kristaps 993: advanceeoln(p, pos, 1);
1.10 kristaps 994: free(p->subtitle);
995: p->subtitle = malloc(end - start + 1);
1.27 kristaps 996: if (NULL == p->subtitle)
997: texiabort(p, NULL);
1.46 kristaps 998: memcpy(p->subtitle, &BUF(p)[start], end - start);
1.10 kristaps 999: p->subtitle[end - start] = '\0';
1000: }
1001:
1002: static void
1.46 kristaps 1003: doaccent(struct texi *p, enum texicmd cmd, size_t *pos)
1.16 kristaps 1004: {
1.42 kristaps 1005: int brace = 0;
1.16 kristaps 1006:
1.46 kristaps 1007: if (*pos == BUFSZ(p)) {
1.42 kristaps 1008: texiwarn(p, "truncated: @%s", texitoks[cmd].tok);
1.16 kristaps 1009: return;
1.42 kristaps 1010: }
1011:
1012: /* Pad us with space, if necessary. */
1013: if (p->seenws && p->outcol && 0 == p->literal) {
1.34 kristaps 1014: texiputchar(p, ' ');
1.42 kristaps 1015: p->seenws = 0;
1016: }
1017:
1018: /*
1019: * If we're braced, then that's that.
1020: * Otherwise, in a special Texinfo case: if we're a non
1021: * alphabetic command of one letter, then the next character is
1022: * the critical one.
1023: * Otherwise, space can sit between us and our argument.
1024: */
1.46 kristaps 1025: if ('{' == BUF(p)[*pos]) {
1.42 kristaps 1026: brace = 1;
1.46 kristaps 1027: advance(p, pos);
1.49 kristaps 1028: } else if (isalpha((unsigned char)texitoks[cmd].tok[0]))
1.46 kristaps 1029: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1030: advance(p, pos);
1.42 kristaps 1031:
1.46 kristaps 1032: if (*pos == BUFSZ(p)) {
1.42 kristaps 1033: texiwarn(p, "truncated: @%s", texitoks[cmd].tok);
1034: return;
1035: }
1036:
1037: switch (cmd) {
1.16 kristaps 1038: case (TEXICMD_ACUTE):
1.46 kristaps 1039: switch (BUF(p)[*pos]) {
1.16 kristaps 1040: case ('a'): case ('A'):
1041: case ('e'): case ('E'):
1042: case ('i'): case ('I'):
1043: case ('o'): case ('O'):
1044: case ('u'): case ('U'):
1045: texiputchars(p, "\\(\'");
1046: break;
1047: default:
1.42 kristaps 1048: texiwarn(p, "ignoring accent");
1049: break;
1.16 kristaps 1050: }
1.46 kristaps 1051: texiputchar(p, BUF(p)[*pos]);
1052: advance(p, pos);
1.42 kristaps 1053: break;
1054: case (TEXICMD_CEDILLA):
1.46 kristaps 1055: if ('c' == BUF(p)[*pos] || 'C' == BUF(p)[*pos])
1.42 kristaps 1056: texiputchars(p, "\\(,");
1057: else
1058: texiwarn(p, "ignoring accent");
1.46 kristaps 1059: texiputchar(p, BUF(p)[*pos]);
1060: advance(p, pos);
1.16 kristaps 1061: break;
1062: case (TEXICMD_CIRCUMFLEX):
1.46 kristaps 1063: switch (BUF(p)[*pos]) {
1.16 kristaps 1064: case ('a'): case ('A'):
1065: case ('e'): case ('E'):
1066: case ('i'): case ('I'):
1067: case ('o'): case ('O'):
1068: case ('u'): case ('U'):
1069: texiputchars(p, "\\(^");
1070: break;
1071: default:
1.42 kristaps 1072: texiwarn(p, "ignoring accent");
1.34 kristaps 1073: break;
1.16 kristaps 1074: }
1.46 kristaps 1075: texiputchar(p, BUF(p)[*pos]);
1076: advance(p, pos);
1.42 kristaps 1077: break;
1078: case (TEXICMD_DOTLESS):
1.46 kristaps 1079: if ('i' == BUF(p)[*pos] || 'j' == BUF(p)[*pos])
1.42 kristaps 1080: texiputchars(p, "\\(.");
1081: else
1082: texiwarn(p, "ignoring accent");
1.46 kristaps 1083: texiputchar(p, BUF(p)[*pos]);
1084: advance(p, pos);
1.16 kristaps 1085: break;
1086: case (TEXICMD_GRAVE):
1.46 kristaps 1087: switch (BUF(p)[*pos]) {
1.16 kristaps 1088: case ('a'): case ('A'):
1089: case ('e'): case ('E'):
1090: case ('i'): case ('I'):
1091: case ('o'): case ('O'):
1092: case ('u'): case ('U'):
1093: texiputchars(p, "\\(`");
1094: break;
1095: default:
1.42 kristaps 1096: texiwarn(p, "ignoring accent");
1097: break;
1.16 kristaps 1098: }
1.46 kristaps 1099: texiputchar(p, BUF(p)[*pos]);
1100: advance(p, pos);
1.16 kristaps 1101: break;
1102: case (TEXICMD_TILDE):
1.46 kristaps 1103: switch (BUF(p)[*pos]) {
1.16 kristaps 1104: case ('a'): case ('A'):
1105: case ('n'): case ('N'):
1106: case ('o'): case ('O'):
1107: texiputchars(p, "\\(~");
1108: break;
1109: default:
1.42 kristaps 1110: texiwarn(p, "ignoring accent");
1.34 kristaps 1111: break;
1.16 kristaps 1112: }
1.46 kristaps 1113: texiputchar(p, BUF(p)[*pos]);
1114: advance(p, pos);
1.16 kristaps 1115: break;
1116: case (TEXICMD_UMLAUT):
1.46 kristaps 1117: switch (BUF(p)[*pos]) {
1.16 kristaps 1118: case ('a'): case ('A'):
1119: case ('e'): case ('E'):
1120: case ('i'): case ('I'):
1121: case ('o'): case ('O'):
1122: case ('u'): case ('U'):
1123: case ('y'):
1124: texiputchars(p, "\\(:");
1125: break;
1126: default:
1.42 kristaps 1127: texiwarn(p, "ignoring accent");
1.34 kristaps 1128: break;
1.16 kristaps 1129: }
1.46 kristaps 1130: texiputchar(p, BUF(p)[*pos]);
1131: advance(p, pos);
1.16 kristaps 1132: break;
1133: default:
1.46 kristaps 1134: texiputchar(p, BUF(p)[*pos]);
1135: advance(p, pos);
1.42 kristaps 1136: break;
1137: }
1138:
1139: if (brace) {
1.46 kristaps 1140: while (*pos < BUFSZ(p) && '}' != BUF(p)[*pos]) {
1141: texiputchar(p, BUF(p)[*pos]);
1142: advance(p, pos);
1.42 kristaps 1143: }
1.46 kristaps 1144: if (*pos < BUFSZ(p))
1145: advance(p, pos);
1.42 kristaps 1146: }
1147:
1148: switch (cmd) {
1149: case (TEXICMD_TIEACCENT):
1150: texiputchar(p, ']');
1151: break;
1152: case (TEXICMD_DOTACCENT):
1153: texiputchar(p, '*');
1154: break;
1155: default:
1156: break;
1.16 kristaps 1157: }
1158: }
1159:
1160: static void
1.46 kristaps 1161: dosymbol(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1162: {
1163:
1.42 kristaps 1164: /* Remember to pad us. */
1.43 kristaps 1165: if (p->seenws && p->outcol && 0 == p->literal)
1.3 kristaps 1166: texiputchar(p, ' ');
1.43 kristaps 1167:
1168: p->seenws = 0;
1.3 kristaps 1169:
1.1 kristaps 1170: switch (cmd) {
1.42 kristaps 1171: case (TEXICMD_AA):
1172: texiputchars(p, "\\(oA");
1173: break;
1174: case (TEXICMD_AASMALL):
1175: texiputchars(p, "\\(oa");
1176: break;
1177: case (TEXICMD_AE):
1178: texiputchars(p, "\\(AE");
1179: break;
1180: case (TEXICMD_AESMALL):
1181: texiputchars(p, "\\(ae");
1182: break;
1.3 kristaps 1183: case (TEXICMD_ASTERISK):
1184: case (TEXICMD_NEWLINE):
1185: case (TEXICMD_SPACE):
1.18 kristaps 1186: case (TEXICMD_TABSYM):
1.3 kristaps 1187: texiputchar(p, ' ');
1188: break;
1.1 kristaps 1189: case (TEXICMD_AT):
1.3 kristaps 1190: texiputchar(p, '@');
1191: break;
1192: case (TEXICMD_BANG):
1193: texiputchar(p, '!');
1.7 kristaps 1194: break;
1195: case (TEXICMD_BULLET):
1196: texiputchars(p, "\\(bu");
1.1 kristaps 1197: break;
1.35 kristaps 1198: case (TEXICMD_COMMA):
1199: texiputchar(p, ',');
1200: break;
1.1 kristaps 1201: case (TEXICMD_COPYRIGHT):
1202: texiputchars(p, "\\(co");
1203: break;
1.42 kristaps 1204: case (TEXICMD_DH):
1205: texiputchars(p, "\\(-D");
1206: break;
1207: case (TEXICMD_DHSMALL):
1208: texiputchars(p, "\\(Sd");
1209: break;
1.2 kristaps 1210: case (TEXICMD_DOTS):
1.34 kristaps 1211: case (TEXICMD_ENDDOTS):
1.2 kristaps 1212: texiputchars(p, "...");
1213: break;
1.28 kristaps 1214: case (TEXICMD_EQUIV):
1215: texiputchars(p, "\\(==");
1216: break;
1.15 kristaps 1217: case (TEXICMD_ERROR):
1218: texiputchars(p, "error\\(->");
1.17 kristaps 1219: break;
1.43 kristaps 1220: case (TEXICMD_EURO):
1221: texiputchars(p, "\\(Eu");
1222: break;
1.42 kristaps 1223: case (TEXICMD_EXCLAMDOWN):
1224: texiputchars(p, "\\(r!");
1225: break;
1.17 kristaps 1226: case (TEXICMD_EXPANSION):
1227: texiputchars(p, "\\(->");
1.15 kristaps 1228: break;
1.43 kristaps 1229: case (TEXICMD_GEQ):
1230: texiputchars(p, "\\(>=");
1231: break;
1232: case (TEXICMD_GUILLEMETLEFT):
1233: case (TEXICMD_GUILLEMOTLEFT):
1234: texiputchars(p, "\\(Fo");
1235: break;
1236: case (TEXICMD_GUILLEMETRIGHT):
1237: case (TEXICMD_GUILLEMOTRIGHT):
1238: texiputchars(p, "\\(Fc");
1239: break;
1240: case (TEXICMD_GUILSINGLLEFT):
1241: texiputchars(p, "\\(fo");
1242: break;
1243: case (TEXICMD_GUILSINGLRIGHT):
1244: texiputchars(p, "\\(fc");
1245: break;
1.42 kristaps 1246: case (TEXICMD_L):
1247: texiputchars(p, "\\(/L");
1248: break;
1.1 kristaps 1249: case (TEXICMD_LATEX):
1250: texiputchars(p, "LaTeX");
1251: break;
1.43 kristaps 1252: case (TEXICMD_LEQ):
1253: texiputchars(p, "\\(<=");
1254: break;
1.42 kristaps 1255: case (TEXICMD_LSMALL):
1256: texiputchars(p, "\\(/l");
1257: break;
1.25 kristaps 1258: case (TEXICMD_MINUS):
1259: texiputchars(p, "\\-");
1260: break;
1.42 kristaps 1261: case (TEXICMD_O):
1262: texiputchars(p, "\\(/O");
1263: break;
1264: case (TEXICMD_OE):
1265: texiputchars(p, "\\(OE");
1266: break;
1267: case (TEXICMD_OESMALL):
1268: texiputchars(p, "\\(oe");
1269: break;
1270: case (TEXICMD_ORDF):
1271: texiputchars(p, "a");
1272: break;
1273: case (TEXICMD_ORDM):
1274: texiputchars(p, "o");
1275: break;
1276: case (TEXICMD_OSMALL):
1277: texiputchars(p, "\\(/o");
1278: break;
1.25 kristaps 1279: case (TEXICMD_PERIOD):
1280: texiputchar(p, '.');
1281: break;
1.43 kristaps 1282: case (TEXICMD_POUNDS):
1283: texiputchars(p, "\\(Po");
1284: break;
1.42 kristaps 1285: case (TEXICMD_QUESTIONDOWN):
1286: texiputchars(p, "\\(r?");
1287: break;
1.3 kristaps 1288: case (TEXICMD_QUESTIONMARK):
1289: texiputchar(p, '?');
1.15 kristaps 1290: break;
1.43 kristaps 1291: case (TEXICMD_QUOTEDBLBASE):
1292: texiputchars(p, "\\(Bq");
1293: break;
1294: case (TEXICMD_QUOTEDBLLEFT):
1295: texiputchars(p, "\\(lq");
1296: break;
1297: case (TEXICMD_QUOTEDBLRIGHT):
1298: texiputchars(p, "\\(rq");
1299: break;
1300: case (TEXICMD_QUOTESINGLBASE):
1301: texiputchars(p, "\\(bq");
1302: break;
1303: case (TEXICMD_QUOTELEFT):
1304: texiputchars(p, "\\(oq");
1305: break;
1306: case (TEXICMD_QUOTERIGHT):
1307: texiputchars(p, "\\(cq");
1308: break;
1309: case (TEXICMD_REGISTEREDSYMBOL):
1310: texiputchars(p, "\\(rg");
1311: break;
1.15 kristaps 1312: case (TEXICMD_RESULT):
1313: texiputchars(p, "\\(rA");
1.3 kristaps 1314: break;
1.34 kristaps 1315: case (TEXICMD_SLASH):
1316: texiputchar(p, '/');
1317: break;
1.35 kristaps 1318: case (TEXICMD_SS):
1319: texiputchars(p, "\\(ss");
1320: break;
1.3 kristaps 1321: case (TEXICMD_SQUIGGLE_LEFT):
1322: texiputchars(p, "{");
1323: break;
1324: case (TEXICMD_SQUIGGLE_RIGHT):
1325: texiputchars(p, "}");
1326: break;
1.38 kristaps 1327: case (TEXICMD_TEXSYM):
1.35 kristaps 1328: texiputchars(p, "TeX");
1.43 kristaps 1329: break;
1330: case (TEXICMD_TEXTDEGREE):
1331: texiputchars(p, "\\(de");
1.35 kristaps 1332: break;
1.42 kristaps 1333: case (TEXICMD_TH):
1334: texiputchars(p, "\\(TP");
1335: break;
1336: case (TEXICMD_THSMALL):
1337: texiputchars(p, "\\(Tp");
1338: break;
1.38 kristaps 1339: case (TEXICMD_TIE):
1.35 kristaps 1340: texiputchars(p, "\\ ");
1.1 kristaps 1341: break;
1.3 kristaps 1342: case (TEXICMD_COLON):
1343: case (TEXICMD_HYPHEN):
1344: break;
1.1 kristaps 1345: default:
1346: abort();
1347: }
1348:
1.42 kristaps 1349: /* Alphabetic commands have braces we ignore. */
1.49 kristaps 1350: if (isalpha((unsigned char)texitoks[cmd].tok[0]))
1.46 kristaps 1351: doignbracket(p, cmd, pos);
1.1 kristaps 1352: }
1353:
1354: static void
1.46 kristaps 1355: doquotation(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1356: {
1357:
1.5 kristaps 1358: teximacro(p, "Qo");
1.46 kristaps 1359: parseto(p, pos, "quotation");
1.5 kristaps 1360: teximacro(p, "Qc");
1.1 kristaps 1361: }
1362:
1.3 kristaps 1363: static void
1.46 kristaps 1364: domath(struct texi *p, enum texicmd cmd, size_t *pos)
1.3 kristaps 1365: {
1366:
1.53 kristaps 1367: parsebracket(p, pos, 1);
1.24 kristaps 1368: }
1369:
1370: static void
1.46 kristaps 1371: dovalue(struct texi *p, enum texicmd cmd, size_t *pos)
1.24 kristaps 1372: {
1.46 kristaps 1373: size_t start, end;
1.25 kristaps 1374: char *key, *val;
1375: const char *cp;
1.24 kristaps 1376:
1377: if (TEXICMD_SET == cmd) {
1.46 kristaps 1378: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1379: advance(p, pos);
1380: for (start = end = *pos; end < BUFSZ(p); end++)
1381: if (ismspace(BUF(p)[end]))
1.24 kristaps 1382: break;
1.25 kristaps 1383: /* We don't allow empty keys. */
1.24 kristaps 1384: if (start == end)
1385: return;
1.46 kristaps 1386: advanceto(p, pos, end);
1.24 kristaps 1387:
1388: key = malloc(end - start + 1);
1.27 kristaps 1389: if (NULL == key)
1390: texiabort(p, NULL);
1.46 kristaps 1391: memcpy(key, &BUF(p)[start], end - start);
1.24 kristaps 1392: key[end - start] = '\0';
1393:
1.46 kristaps 1394: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1395: advance(p, pos);
1396: for (start = end = *pos; end < BUFSZ(p); end++)
1397: if ('\n' == BUF(p)[end])
1.24 kristaps 1398: break;
1.25 kristaps 1399: /* We do allow empty values. */
1.46 kristaps 1400: advanceeoln(p, pos, 1);
1.24 kristaps 1401:
1402: val = malloc(end - start + 1);
1.27 kristaps 1403: if (NULL == val)
1404: texiabort(p, NULL);
1.46 kristaps 1405: memcpy(val, &BUF(p)[start], end - start);
1.24 kristaps 1406: val[end - start] = '\0';
1.25 kristaps 1407: valueadd(p, key, val);
1.24 kristaps 1408: } else if (TEXICMD_VALUE == cmd) {
1409: if (p->seenws)
1410: texiputchar(p, ' ');
1411: p->seenws = 0;
1.46 kristaps 1412: if (NULL != (cp = valueblookup(p, pos)))
1413: texisplice(p, cp, strlen(cp), pos);
1414: else
1.25 kristaps 1415: texiputchars(p, "{No value}");
1.24 kristaps 1416: } else if (TEXICMD_IFCLEAR == cmd) {
1.46 kristaps 1417: if (NULL != valuellookup(p, pos))
1418: doignblock(p, cmd, pos);
1.26 kristaps 1419: else
1.46 kristaps 1420: parseto(p, pos, texitoks[cmd].tok);
1.30 kristaps 1421: } else if (TEXICMD_IFSET == cmd) {
1.46 kristaps 1422: if (NULL == valuellookup(p, pos))
1423: doignblock(p, cmd, pos);
1.30 kristaps 1424: else
1.46 kristaps 1425: parseto(p, pos, texitoks[cmd].tok);
1.25 kristaps 1426: } else if (TEXICMD_CLEAR == cmd)
1.46 kristaps 1427: valuelclear(p, pos);
1.3 kristaps 1428: }
1429:
1.1 kristaps 1430: static void
1.46 kristaps 1431: dolink(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1432: {
1.8 kristaps 1433: int c;
1.1 kristaps 1434:
1435: switch (cmd) {
1436: case (TEXICMD_EMAIL):
1.5 kristaps 1437: teximacroopen(p, "Mt");
1.1 kristaps 1438: break;
1.3 kristaps 1439: case (TEXICMD_UREF):
1.1 kristaps 1440: case (TEXICMD_URL):
1.44 kristaps 1441: case (TEXICMD_INDICATEURL):
1.5 kristaps 1442: teximacroopen(p, "Lk");
1.1 kristaps 1443: break;
1.8 kristaps 1444: case (TEXICMD_XREF):
1445: texiputchars(p, "See Section");
1.39 kristaps 1446: teximacroopen(p, "Dq");
1.8 kristaps 1447: break;
1448: case (TEXICMD_PXREF):
1449: texiputchars(p, "see Section");
1.39 kristaps 1450: teximacroopen(p, "Dq");
1.8 kristaps 1451: break;
1.34 kristaps 1452: case (TEXICMD_INFOREF):
1453: texiputchars(p, "See Info file node");
1.39 kristaps 1454: teximacroopen(p, "Dq");
1.34 kristaps 1455: break;
1.1 kristaps 1456: default:
1.8 kristaps 1457: abort();
1.1 kristaps 1458: }
1.8 kristaps 1459:
1.46 kristaps 1460: c = parsearg(p, pos, 0);
1.8 kristaps 1461: p->ign++;
1462: while (c > 0)
1.46 kristaps 1463: c = parsearg(p, pos, 1);
1.8 kristaps 1464: p->ign--;
1465:
1.46 kristaps 1466: texipunctuate(p, pos);
1.8 kristaps 1467: teximacroclose(p);
1468: }
1469:
1470: static void
1.46 kristaps 1471: doignargn(struct texi *p, enum texicmd cmd, size_t *pos)
1.8 kristaps 1472: {
1473: int c;
1474:
1.46 kristaps 1475: c = parsearg(p, pos, 0);
1.8 kristaps 1476: p->ign++;
1477: while (c > 0)
1.46 kristaps 1478: c = parsearg(p, pos, 1);
1.8 kristaps 1479: p->ign--;
1.1 kristaps 1480: }
1481:
1.23 kristaps 1482: /*
1483: * Sections can be made subsections and so on by way of the
1484: * @raiseections and @lowersections commands.
1485: * Perform this check here and return the actual section number adjusted
1486: * to the raise level.
1487: */
1488: static int
1489: sectioner(struct texi *p, int sec)
1490: {
1491:
1492: if ((sec -= p->secoffs) < 0) {
1493: texiwarn(p, "section below minimum, clamping");
1494: return(0);
1495: } else if (sec >= SECTSZ) {
1496: texiwarn(p, "section above maximum, clamping");
1497: return(SECTSZ - 1);
1498: }
1499: return(sec);
1500: }
1501:
1502: static void
1.46 kristaps 1503: dosubsubsection(struct texi *p, enum texicmd cmd, size_t *pos)
1.23 kristaps 1504: {
1505: int sec;
1506:
1507: sec = sectioner(p, 3);
1508:
1509: /* We don't have a subsubsubsection, so make one up. */
1510: texivspace(p);
1511: teximacroopen(p, sects[sec]);
1.46 kristaps 1512: parseeoln(p, pos);
1.23 kristaps 1513: teximacroclose(p);
1514: texivspace(p);
1515: }
1516:
1.1 kristaps 1517: static void
1.46 kristaps 1518: dosubsection(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1519: {
1.23 kristaps 1520: int sec;
1521:
1522: sec = sectioner(p, 2);
1.13 kristaps 1523:
1524: if (p->outmacro)
1.23 kristaps 1525: texierr(p, "\"%s\" in open line scope!?", sects[sec]);
1.13 kristaps 1526: else if (p->literal)
1.23 kristaps 1527: texierr(p, "\"%s\" in a literal scope!?", sects[sec]);
1.1 kristaps 1528:
1.21 kristaps 1529: /* We don't have a subsubsection, so make one up. */
1.34 kristaps 1530: if (sec > 1)
1531: texivspace(p);
1.23 kristaps 1532: teximacroopen(p, sects[sec]);
1.46 kristaps 1533: parseeoln(p, pos);
1.5 kristaps 1534: teximacroclose(p);
1.34 kristaps 1535: if (sec > 1)
1536: texivspace(p);
1.1 kristaps 1537: }
1538:
1539: static void
1.46 kristaps 1540: dosecoffs(struct texi *p, enum texicmd cmd, size_t *pos)
1.23 kristaps 1541: {
1542:
1543: if (TEXICMD_RAISESECTIONS == cmd)
1544: p->secoffs++;
1545: else
1546: p->secoffs--;
1547: }
1548:
1549: static void
1.46 kristaps 1550: dosection(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1551: {
1.23 kristaps 1552: int sec;
1.12 kristaps 1553:
1554: switch (cmd) {
1.55 ! kristaps 1555: case (TEXICMD_TOP):
! 1556: sec = 0;
! 1557: break;
1.12 kristaps 1558: case (TEXICMD_APPENDIX):
1559: case (TEXICMD_CHAPTER):
1560: case (TEXICMD_UNNUMBERED):
1.23 kristaps 1561: sec = sectioner(p, 0);
1.12 kristaps 1562: break;
1563: case (TEXICMD_APPENDIXSEC):
1564: case (TEXICMD_HEADING):
1565: case (TEXICMD_SECTION):
1566: case (TEXICMD_UNNUMBEREDSEC):
1.23 kristaps 1567: sec = sectioner(p, 1);
1.12 kristaps 1568: break;
1569: default:
1570: abort();
1571: }
1.1 kristaps 1572:
1.3 kristaps 1573: if (p->outmacro)
1.23 kristaps 1574: texierr(p, "\"%s\" in open line scope!?", sects[sec]);
1.3 kristaps 1575: else if (p->literal)
1.23 kristaps 1576: texierr(p, "\"%s\" in a literal scope!?", sects[sec]);
1.3 kristaps 1577:
1.55 ! kristaps 1578: if (0 == sec && NULL != p->chapters) {
! 1579: teximdocclose(p, 0);
! 1580: teximdocopen(p);
! 1581: }
! 1582:
1.23 kristaps 1583: teximacroopen(p, sects[sec]);
1.46 kristaps 1584: parseeoln(p, pos);
1.3 kristaps 1585: teximacroclose(p);
1.11 kristaps 1586: p->seenvs = 1;
1.3 kristaps 1587: }
1588:
1589: static void
1.55 ! kristaps 1590: dotop(struct texi *p, enum texicmd cmd, size_t *pos)
! 1591: {
! 1592:
! 1593: if (--p->ign)
! 1594: texierr(p, "@top command while ignoring");
! 1595:
! 1596: if (NULL == p->chapters)
! 1597: teximdocopen(p);
! 1598: dosection(p, cmd, pos);
! 1599: }
! 1600:
! 1601: static void
1.46 kristaps 1602: dosp(struct texi *p, enum texicmd cmd, size_t *pos)
1.3 kristaps 1603: {
1604:
1.37 kristaps 1605: if (p->literal)
1606: texiputchar(p, '\n');
1607: else
1608: texivspace(p);
1.12 kristaps 1609: /* FIXME: ignore and parseeoln. */
1.46 kristaps 1610: advanceeoln(p, pos, 1);
1.1 kristaps 1611: }
1612:
1613: static void
1.46 kristaps 1614: doitem(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1615: {
1616:
1.18 kristaps 1617: /* Multitable is using raw tbl(7). */
1618: if (TEXILIST_TABLE == p->list) {
1619: texiputchar(p, '\n');
1620: return;
1621: }
1622:
1.3 kristaps 1623: if (p->outmacro)
1624: texierr(p, "item in open line scope!?");
1625: else if (p->literal)
1626: texierr(p, "item in a literal scope!?");
1627:
1628: switch (p->list) {
1629: case (TEXILIST_ITEM):
1.5 kristaps 1630: teximacroopen(p, "It");
1.3 kristaps 1631: break;
1632: case (TEXILIST_NOITEM):
1.5 kristaps 1633: teximacro(p, "It");
1.3 kristaps 1634: break;
1635: default:
1.11 kristaps 1636: texivspace(p);
1.3 kristaps 1637: break;
1638: }
1.18 kristaps 1639:
1640: /* Trick so we don't start with Pp. */
1.11 kristaps 1641: p->seenvs = 1;
1.46 kristaps 1642: parseeoln(p, pos);
1.1 kristaps 1643:
1.3 kristaps 1644: if (TEXILIST_ITEM == p->list)
1645: teximacroclose(p);
1.9 kristaps 1646: else if (p->outcol > 0)
1.1 kristaps 1647: texiputchar(p, '\n');
1.18 kristaps 1648: }
1649:
1650: static void
1.46 kristaps 1651: dotab(struct texi *p, enum texicmd cmd, size_t *pos)
1.18 kristaps 1652: {
1653:
1654: /* This command is only useful in @multitable. */
1655: if (TEXILIST_TABLE == p->list)
1656: texiputchar(p, '\t');
1657: }
1658:
1659: static void
1.46 kristaps 1660: domultitable(struct texi *p, enum texicmd cmd, size_t *pos)
1.18 kristaps 1661: {
1662: enum texilist sv = p->list;
1.32 kristaps 1663: int svliteral = p->literal;
1.18 kristaps 1664: enum texicmd type;
1665: size_t i, end, columns;
1666:
1667: p->list = TEXILIST_TABLE;
1.32 kristaps 1668: /*
1669: * TS/TE blocks aren't "in mdoc(7)", so we can disregard the
1670: * fact that we're in literal mode right now.
1671: */
1672: p->literal = 0;
1.18 kristaps 1673: teximacro(p, "TS");
1674: columns = 0;
1675:
1676: /* Advance to the first argument... */
1.46 kristaps 1677: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1678: advance(p, pos);
1.18 kristaps 1679:
1680: /* Make sure we don't print anything when scanning. */
1681: p->ign++;
1.46 kristaps 1682: if ('@' == BUF(p)[*pos]) {
1.18 kristaps 1683: /*
1684: * Look for @columnfractions.
1685: * We ignore these, but we do use the number of
1686: * arguments to set the number of columns that we'll
1687: * have.
1688: */
1.46 kristaps 1689: type = texicmd(p, *pos, &end, NULL);
1690: advanceto(p, pos, end);
1.18 kristaps 1691: if (TEXICMD_COLUMNFRACTIONS != type)
1.25 kristaps 1692: texierr(p, "unknown multitable command");
1.46 kristaps 1693: while (*pos < BUFSZ(p) && '\n' != BUF(p)[*pos]) {
1694: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1695: advance(p, pos);
1696: while (*pos < BUFSZ(p) && ! isws(BUF(p)[*pos])) {
1697: if ('\n' == BUF(p)[*pos])
1.18 kristaps 1698: break;
1.46 kristaps 1699: advance(p, pos);
1.18 kristaps 1700: }
1701: columns++;
1702: }
1703: } else
1704: /*
1705: * We have arguments.
1706: * We could parse these, but it's easier to just let
1707: * tbl(7) figure it out.
1708: * So use this only to count arguments.
1709: */
1.46 kristaps 1710: while (parselinearg(p, pos) > 0)
1.18 kristaps 1711: columns++;
1712: p->ign--;
1713:
1714: /* Left-justify each table entry. */
1715: for (i = 0; i < columns; i++) {
1716: if (i > 0)
1717: texiputchar(p, ' ');
1718: texiputchar(p, 'l');
1719: }
1720: texiputchars(p, ".\n");
1721: p->outmacro++;
1.46 kristaps 1722: parseto(p, pos, texitoks[cmd].tok);
1.18 kristaps 1723: p->outmacro--;
1724: teximacro(p, "TE");
1.32 kristaps 1725: p->literal = svliteral;
1.18 kristaps 1726: p->list = sv;
1.1 kristaps 1727: }
1728:
1729: static void
1.46 kristaps 1730: dotable(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1731: {
1.3 kristaps 1732: enum texilist sv = p->list;
1733:
1734: p->list = TEXILIST_ITEM;
1.5 kristaps 1735: teximacro(p, "Bl -tag -width Ds");
1.12 kristaps 1736: /* FIXME: ignore and parseeoln. */
1.46 kristaps 1737: advanceeoln(p, pos, 1);
1.11 kristaps 1738: p->seenvs = 1;
1.46 kristaps 1739: parseto(p, pos, texitoks[cmd].tok);
1.5 kristaps 1740: teximacro(p, "El");
1.3 kristaps 1741: p->list = sv;
1.44 kristaps 1742: }
1743:
1744: static void
1.46 kristaps 1745: doend(struct texi *p, enum texicmd cmd, size_t *pos)
1.44 kristaps 1746: {
1747: size_t start;
1748:
1.46 kristaps 1749: while (*pos < BUFSZ(p) && isws(BUF(p)[*pos]))
1750: advance(p, pos);
1.44 kristaps 1751: start = *pos;
1.46 kristaps 1752: while (*pos < BUFSZ(p) && '\n' != BUF(p)[*pos])
1753: advance(p, pos);
1.44 kristaps 1754:
1.46 kristaps 1755: texiwarn(p, "unexpected \"end\": %.*s", (int)(*pos - start), &BUF(p)[start]);
1756: advanceeoln(p, pos, 1);
1.1 kristaps 1757: }
1758:
1759: static void
1.46 kristaps 1760: doenumerate(struct texi *p, enum texicmd cmd, size_t *pos)
1.2 kristaps 1761: {
1.3 kristaps 1762: enum texilist sv = p->list;
1.2 kristaps 1763:
1.3 kristaps 1764: p->list = TEXILIST_NOITEM;
1.5 kristaps 1765: teximacro(p, "Bl -enum");
1.11 kristaps 1766: p->seenvs = 1;
1.12 kristaps 1767: /* FIXME: ignore and parseeoln. */
1.46 kristaps 1768: advanceeoln(p, pos, 1);
1769: parseto(p, pos, "enumerate");
1.5 kristaps 1770: teximacro(p, "El");
1.3 kristaps 1771: p->list = sv;
1.2 kristaps 1772: }
1773:
1774: static void
1.46 kristaps 1775: doitemize(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1776: {
1.3 kristaps 1777: enum texilist sv = p->list;
1.1 kristaps 1778:
1.21 kristaps 1779: p->list = TEXILIST_NOITEM;
1.5 kristaps 1780: teximacro(p, "Bl -bullet");
1.11 kristaps 1781: p->seenvs = 1;
1.12 kristaps 1782: /* FIXME: ignore and parseeoln. */
1.46 kristaps 1783: advanceeoln(p, pos, 1);
1784: parseto(p, pos, "itemize");
1.5 kristaps 1785: teximacro(p, "El");
1.3 kristaps 1786: p->list = sv;
1.1 kristaps 1787: }
1788:
1789: static void
1.46 kristaps 1790: doignbracket(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1791: {
1792:
1.3 kristaps 1793: p->ign++;
1.53 kristaps 1794: parsebracket(p, pos, 0);
1.3 kristaps 1795: p->ign--;
1.1 kristaps 1796: }
1797:
1798: static void
1.46 kristaps 1799: doignline(struct texi *p, enum texicmd cmd, size_t *pos)
1.1 kristaps 1800: {
1801:
1.12 kristaps 1802: /* FIXME: ignore and parseeoln. */
1.46 kristaps 1803: advanceeoln(p, pos, 1);
1.1 kristaps 1804: }
1805:
/*
 * Build the array of search directories.
 * If "base" is not NULL, a copy of it becomes the first entry.
 * If "cp" is not NULL, it is split on ':' and a copy of every field
 * (including empty ones) is appended in order.
 * The number of entries is stored in "sz"; NULL is returned when there
 * are none.
 * Allocation failures are handed to texiabort().
 * The directories are NOT sanitised in any way.
 */
static char **
parsedirs(struct texi *p, const char *base, const char *cp, size_t *sz)
{
	char		**dirs;
	char		 *copy, *rest, *entry;
	const char	 *scan;
	size_t		  n;

	/*
	 * Size the array up front: one slot for "base", plus one slot
	 * per colon-separated field of "cp" (colons + 1).
	 */
	*sz = (base != NULL) ? 1 : 0;
	if (cp != NULL) {
		(*sz)++;
		scan = strchr(cp, ':');
		while (scan != NULL) {
			(*sz)++;
			scan = strchr(scan + 1, ':');
		}
	}

	if (*sz == 0)
		return(NULL);

	dirs = calloc(*sz, sizeof(char *));
	if (dirs == NULL)
		texiabort(p, NULL);

	n = 0;
	if (base != NULL) {
		dirs[n] = strdup(base);
		if (dirs[n] == NULL)
			texiabort(p, NULL);
		n++;
	}

	if (cp == NULL)
		return(dirs);

	/* strsep() writes into its input, so split a private copy. */
	copy = strdup(cp);
	if (copy == NULL)
		texiabort(p, NULL);

	rest = copy;
	while ((entry = strsep(&rest, ":")) != NULL) {
		dirs[n] = strdup(entry);
		if (dirs[n] == NULL)
			texiabort(p, NULL);
		n++;
	}

	free(copy);
	return(dirs);
}
1844:
1.1 kristaps 1845: int
1846: main(int argc, char *argv[])
1847: {
1848: struct texi texi;
1.2 kristaps 1849: int c;
1.37 kristaps 1850: char *dirpath, *dir, *ccp;
1.10 kristaps 1851: const char *progname, *Idir, *cp;
1.1 kristaps 1852:
1853: progname = strrchr(argv[0], '/');
1854: if (progname == NULL)
1855: progname = argv[0];
1856: else
1857: ++progname;
1858:
1.10 kristaps 1859: memset(&texi, 0, sizeof(struct texi));
1.40 kristaps 1860: texi.ign = 1;
1.55 ! kristaps 1861: texi.outfile = stdout;
1.5 kristaps 1862: Idir = NULL;
1.10 kristaps 1863:
1.55 ! kristaps 1864: while (-1 != (c = getopt(argc, argv, "C:I:")))
1.1 kristaps 1865: switch (c) {
1.55 ! kristaps 1866: case ('C'):
! 1867: texi.chapters = optarg;
! 1868: break;
1.5 kristaps 1869: case ('I'):
1870: Idir = optarg;
1871: break;
1.1 kristaps 1872: default:
1873: goto usage;
1874: }
1875:
1876: argv += optind;
1.40 kristaps 1877: argc -= optind;
1.1 kristaps 1878:
1.40 kristaps 1879: if (argc > 0) {
1880: if (NULL == (dirpath = strdup(argv[0])))
1881: texiabort(&texi, NULL);
1882: if (NULL == (dir = dirname(dirpath)))
1883: texiabort(&texi, NULL);
1884: if (NULL != (cp = strrchr(argv[0], '/')))
1885: texi.title = strdup(cp + 1);
1886: else
1887: texi.title = strdup(argv[0]);
1888: if (NULL == texi.title)
1889: texiabort(&texi, NULL);
1890: else if (NULL != (ccp = strchr(texi.title, '.')))
1891: *ccp = '\0';
1892: texi.dirs = parsedirs(&texi, dir, Idir, &texi.dirsz);
1893: free(dirpath);
1894: parsefile(&texi, argv[0], 1);
1895: } else {
1896: texi.title = strdup("Unknown Manual");
1897: texi.dirs = parsedirs(&texi, NULL, Idir, &texi.dirsz);
1898: parsestdin(&texi);
1899: }
1.27 kristaps 1900:
1.2 kristaps 1901: texiexit(&texi);
1902: return(EXIT_FAILURE);
1.1 kristaps 1903: usage:
1.55 ! kristaps 1904: fprintf(stderr, "usage: %s [-Cdir] [-Idirs] [file]\n", progname);
1.1 kristaps 1905: return(EXIT_FAILURE);
1906: }
CVSweb