=================================================================== RCS file: /cvs/texi2mdoc/main.c,v retrieving revision 1.14 retrieving revision 1.22 diff -u -p -r1.14 -r1.22 --- texi2mdoc/main.c 2015/02/19 08:09:55 1.14 +++ texi2mdoc/main.c 2015/02/19 16:44:26 1.22 @@ -1,4 +1,4 @@ -/* $Id: main.c,v 1.14 2015/02/19 08:09:55 kristaps Exp $ */ +/* $Id: main.c,v 1.22 2015/02/19 16:44:26 kristaps Exp $ */ /* * Copyright (c) 2015 Kristaps Dzonsons * @@ -37,10 +37,12 @@ */ enum texicmd { TEXICMD_ACRONYM, + TEXICMD_ACUTE, TEXICMD_A4PAPER, TEXICMD_ANCHOR, TEXICMD_APPENDIX, TEXICMD_APPENDIXSEC, + TEXICMD_APPENDIXSUBSEC, TEXICMD_ASTERISK, TEXICMD_AT, TEXICMD_AUTHOR, @@ -51,21 +53,37 @@ enum texicmd { TEXICMD_CENTER, TEXICMD_CHAPTER, TEXICMD_CINDEX, + TEXICMD_CIRCUMFLEX, TEXICMD_CITE, TEXICMD_CODE, TEXICMD_COLON, + TEXICMD_COLUMNFRACTIONS, TEXICMD_COMMAND, TEXICMD_COMMENT, TEXICMD_COMMENT_LONG, TEXICMD_CONTENTS, TEXICMD_COPYING, TEXICMD_COPYRIGHT, + TEXICMD_DEFFN, + TEXICMD_DEFFNX, + TEXICMD_DEFMAC, + TEXICMD_DEFMACX, + TEXICMD_DEFTP, + TEXICMD_DEFTPX, TEXICMD_DEFTYPEFN, TEXICMD_DEFTYPEFNX, TEXICMD_DEFTYPEFUN, TEXICMD_DEFTYPEFUNX, TEXICMD_DEFTYPEVAR, + TEXICMD_DEFTYPEVARX, TEXICMD_DEFTYPEVR, + TEXICMD_DEFTYPEVRX, + TEXICMD_DEFUN, + TEXICMD_DEFUNX, + TEXICMD_DEFVAR, + TEXICMD_DEFVARX, + TEXICMD_DEFVR, + TEXICMD_DEFVRX, TEXICMD_DETAILMENU, TEXICMD_DFN, TEXICMD_DIRCATEGORY, @@ -77,11 +95,19 @@ enum texicmd { TEXICMD_END, TEXICMD_ENUMERATE, TEXICMD_ENV, + TEXICMD_ERROR, TEXICMD_EXAMPLE, + TEXICMD_EXPANSION, TEXICMD_FILE, + TEXICMD_FINALOUT, + TEXICMD_FINDEX, + TEXICMD_FTABLE, + TEXICMD_FORMAT, + TEXICMD_GRAVE, TEXICMD_GROUP, TEXICMD_HEADING, TEXICMD_HEADINGS, + TEXICMD_HEADITEM, TEXICMD_HYPHEN, TEXICMD_I, TEXICMD_IFCLEAR, @@ -98,19 +124,26 @@ enum texicmd { TEXICMD_IFTEX, TEXICMD_IFSET, TEXICMD_IFXML, + TEXICMD_IGNORE, TEXICMD_IMAGE, TEXICMD_INCLUDE, TEXICMD_INDENTBLOCK, TEXICMD_INSERTCOPYING, TEXICMD_ITEM, TEXICMD_ITEMIZE, + TEXICMD_ITEMX, TEXICMD_KBD, + TEXICMD_KEY, + TEXICMD_KINDEX, TEXICMD_LATEX, TEXICMD_MATH, TEXICMD_MENU, + TEXICMD_MULTITABLE, + TEXICMD_NEED, TEXICMD_NEWLINE, TEXICMD_NODE, TEXICMD_NOINDENT, + TEXICMD_OPTION, TEXICMD_PXREF, TEXICMD_QUESTIONMARK, TEXICMD_QUOTATION, @@ -119,6 +152,7 @@ enum texicmd { TEXICMD_PRINTINDEX, TEXICMD_R, TEXICMD_REF, + TEXICMD_RESULT, TEXICMD_SAMP, TEXICMD_SANSSERIF, TEXICMD_SC, @@ -130,29 +164,40 @@ enum texicmd { TEXICMD_SLANTED, TEXICMD_SP, TEXICMD_SPACE, + TEXICMD_SMALLBOOK, TEXICMD_SMALLDISPLAY, TEXICMD_SMALLEXAMPLE, + TEXICMD_SMALLFORMAT, TEXICMD_SMALLINDENTBLOCK, TEXICMD_SQUIGGLE_LEFT, TEXICMD_SQUIGGLE_RIGHT, TEXICMD_STRONG, + TEXICMD_SUBHEADING, TEXICMD_SUBSECTION, TEXICMD_SUBTITLE, + TEXICMD_SYNCODEINDEX, TEXICMD_T, TEXICMD_TAB, + TEXICMD_TABSYM, TEXICMD_TABLE, TEXICMD_TEX, TEXICMD_TEXSYM, + TEXICMD_TILDE, TEXICMD_TITLE, TEXICMD_TITLEFONT, TEXICMD_TITLEPAGE, TEXICMD_TOP, + TEXICMD_UMLAUT, TEXICMD_UNNUMBERED, TEXICMD_UNNUMBEREDSEC, + TEXICMD_UNNUMBEREDSUBSEC, TEXICMD_UREF, TEXICMD_URL, TEXICMD_VAR, + TEXICMD_VERBATIMINCLUDE, + TEXICMD_VINDEX, TEXICMD_VSKIP, + TEXICMD_VTABLE, TEXICMD_W, TEXICMD_XREF, TEXICMD__MAX @@ -191,6 +236,7 @@ enum texilist { TEXILIST_NONE = 0, TEXILIST_ITEM, TEXILIST_NOITEM, + TEXILIST_TABLE }; /* @@ -223,15 +269,14 @@ struct texi { #define ismspace(_x) \ (isws((_x)) || '\n' == (_x)) +static void doaccent(struct texi *, enum texicmd, const char *, size_t, size_t *); static void doblock(struct texi *, enum texicmd, const char *, size_t, size_t *); static void dobracket(struct texi *, enum texicmd, const char *, size_t, size_t *); static void dobye(struct texi *, enum texicmd, const char *, size_t, size_t *); -static void dodeftypefun(struct texi *, enum texicmd, const char *, size_t, size_t *); -static void dodeftypevar(struct texi *, enum texicmd, const char *, size_t, size_t *); +static void dodefn(struct texi *, enum texicmd, const char *, size_t, size_t *); static void dodisplay(struct texi *, enum texicmd, const char *, size_t, size_t *); static void doenumerate(struct texi *, enum texicmd, const char *, size_t, size_t *); static void doexample(struct texi *, enum texicmd, const char *, size_t, size_t *); -static void dofont(struct texi *, enum texicmd, const char *, size_t, size_t *); static void doignargn(struct texi *, enum texicmd, const char *, size_t, size_t *); static void doignblock(struct texi *, enum texicmd, const char *, size_t, size_t *); static void doignbracket(struct texi *, enum texicmd, const char *, size_t, size_t *); @@ -242,6 +287,7 @@ static void doitem(struct texi *, enum texicmd, const static void doitemize(struct texi *, enum texicmd, const char *, size_t, size_t *); static void dolink(struct texi *, enum texicmd, const char *, size_t, size_t *); static void domath(struct texi *, enum texicmd, const char *, size_t, size_t *); +static void domultitable(struct texi *, enum texicmd, const char *, size_t, size_t *); static void doquotation(struct texi *, enum texicmd, const char *, size_t, size_t *); static void dotable(struct texi *, enum texicmd, const char *, size_t, size_t *); static void dotop(struct texi *, enum texicmd, const char *, size_t, size_t *); @@ -249,57 +295,86 @@ static void dosection(struct texi *, enum texicmd, con static void dosp(struct texi *, enum texicmd, const char *, size_t, size_t *); static void dosubsection(struct texi *, enum texicmd, const char *, size_t, size_t *); static void dosymbol(struct texi *, enum texicmd, const char *, size_t, size_t *); +static void dotab(struct texi *, enum texicmd, const char *, size_t, size_t *); static void dotitle(struct texi *, enum texicmd, const char *, size_t, size_t *); +static void doverbinclude(struct texi *, enum texicmd, const char *, size_t, size_t *); static const struct texitok texitoks[TEXICMD__MAX] = { + /* TEXICMD__BEGIN */ { doignargn, "acronym", 7 }, /* TEXICMD_ACRONYM */ + { doaccent, "'", 1 }, /* TEXICMD_ACUTE */ { doignline, "afourpaper", 10 }, /* TEXICMD_A4PAPER */ { doignbracket, "anchor", 6 }, /* TEXICMD_ANCHOR */ { dosection, "appendix", 8 }, /* TEXICMD_APPENDIX */ { dosection, "appendixsec", 11 }, /* TEXICMD_APPENDIXSEC */ + { dosubsection, "appendixsubsec", 14 }, /* TEXICMD_APPENDIXSUBSEC */ { dosymbol, "*", 1 }, /* TEXICMD_ASTERISK */ { dosymbol, "@", 1 }, /* TEXICMD_AT */ { doignline, "author", 6 }, /* TEXICMD_AUTHOR */ - { dofont, "b", 1 }, /* TEXICMD_BOLD */ + { doinline, "b", 1 }, /* TEXICMD_BOLD */ { dosymbol, "!", 1 }, /* TEXICMD_BANG */ { dosymbol, "bullet", 6 }, /* TEXICMD_BULLET */ { dobye, "bye", 3 }, /* TEXICMD_BYE */ { doignline, "center", 6 }, /* TEXICMD_CENTER */ { dosection, "chapter", 7 }, /* TEXICMD_CHAPTER */ { doignline, "cindex", 6 }, /* TEXICMD_CINDEX */ - { dofont, "code", 4 }, /* TEXICMD_CODE */ - { dofont, "cite", 4 }, /* TEXICMD_CITE */ + { doaccent, "^", 1 }, /* TEXICMD_CIRCUMFLEX */ + { doinline, "code", 4 }, /* TEXICMD_CODE */ + { doinline, "cite", 4 }, /* TEXICMD_CITE */ { dosymbol, ":", 1 }, /* TEXICMD_COLON */ + { NULL, "columnfractions", 15 }, /* TEXICMD_COLUMNFRACTIONS */ { doinline, "command", 7 }, /* TEXICMD_COMMAND */ { doignline, "c", 1 }, /* TEXICMD_COMMENT */ { doignline, "comment", 7 }, /* TEXICMD_COMMENT_LONG */ { doignline, "contents", 8 }, /* TEXICMD_CONTENTS */ { doignblock, "copying", 7 }, /* TEXICMD_COPYING */ { dosymbol, "copyright", 9 }, /* TEXICMD_COPYRIGHT */ - { dodeftypefun, "deftypefn", 9 }, /* TEXICMD_DEFTYPEFN */ - { dodeftypefun, "deftypefnx", 10 }, /* TEXICMD_DEFTYPEFNX */ - { dodeftypefun, "deftypefun", 10 }, /* TEXICMD_DEFTYPEFUN */ - { dodeftypefun, "deftypefunx", 11 }, /* TEXICMD_DEFTYPEFUNX */ - { dodeftypevar, "deftypevar", 10 }, /* TEXICMD_DEFTYPEVAR */ - { dodeftypevar, "deftypevr", 9 }, /* TEXICMD_DEFTYPEVR */ + { dodefn, "deffn", 5 }, /* TEXICMD_DEFFN */ + { dodefn, "deffnx", 6 }, /* TEXICMD_DEFFNX */ + { dodefn, "defmac", 6 }, /* TEXICMD_DEFMAC */ + { dodefn, "defmacx", 7 }, /* TEXICMD_DEFMACX */ + { dodefn, "deftp", 5 }, /* TEXICMD_DEFTP */ + { dodefn, "deftpx", 6 }, /* TEXICMD_DEFTPX */ + { dodefn, "deftypefn", 9 }, /* TEXICMD_DEFTYPEFN */ + { dodefn, "deftypefnx", 10 }, /* TEXICMD_DEFTYPEFNX */ + { dodefn, "deftypefun", 10 }, /* TEXICMD_DEFTYPEFUN */ + { dodefn, "deftypefunx", 11 }, /* TEXICMD_DEFTYPEFUNX */ + { dodefn, "deftypevar", 10 }, /* TEXICMD_DEFTYPEVAR */ + { dodefn, "deftypevarx", 11 }, /* TEXICMD_DEFTYPEVARX */ + { dodefn, "deftypevr", 9 }, /* TEXICMD_DEFTYPEVR */ + { dodefn, "deftypevrx", 10 }, /* TEXICMD_DEFTYPEVRX */ + { dodefn, "defun", 5 }, /* TEXICMD_DEFUN */ + { dodefn, "defunx", 6 }, /* TEXICMD_DEFUNX */ + { dodefn, "defvar", 6 }, /* TEXICMD_DEFVAR */ + { dodefn, "defvarx", 7 }, /* TEXICMD_DEFVARX */ + { dodefn, "defvr", 5 }, /* TEXICMD_DEFVR */ + { dodefn, "defvrx", 6 }, /* TEXICMD_DEFVRX */ { doignblock, "detailmenu", 10 }, /* TEXICMD_DETAILMENU */ - { dofont, "dfn", 3 }, /* TEXICMD_DFN */ + { doinline, "dfn", 3 }, /* TEXICMD_DFN */ { doignline, "dircategory", 11 }, /* TEXICMD_DIRCATEGORY */ { doignblock, "direntry", 8 }, /* TEXICMD_DIRENTRY */ { dodisplay, "display", 7 }, /* TEXICMD_DISPLAY */ { dosymbol, "dots", 4 }, /* TEXICMD_DOTS */ { dolink, "email", 5 }, /* TEXICMD_EMAIL */ - { dofont, "emph", 4 }, /* TEXICMD_EMPH */ + { doinline, "emph", 4 }, /* TEXICMD_EMPH */ { NULL, "end", 3 }, /* TEXICMD_END */ { doenumerate, "enumerate", 9 }, /* TEXICMD_ENUMERATE */ { doinline, "env", 3 }, /* TEXICMD_ENV */ + { dosymbol, "error", 5 }, /* TEXICMD_ERROR */ { doexample, "example", 7 }, /* TEXICMD_EXAMPLE */ + { dosymbol, "expansion", 9 }, /* TEXICMD_EXPANSION */ { doinline, "file", 4 }, /* TEXICMD_FILE */ + { doignline, "finalout", 8 }, /* TEXICMD_FINALOUT */ + { doignline, "findex", 6 }, /* TEXICMD_FINDEX */ + { dotable, "ftable", 6 }, /* TEXICMD_FTABLE */ + { dodisplay, "format", 6 }, /* TEXICMD_FORMAT */ + { doaccent, "`", 1 }, /* TEXICMD_GRAVE */ { doblock, "group", 5 }, /* TEXICMD_GROUP */ { dosection, "heading", 7 }, /* TEXICMD_HEADING */ { doignline, "headings", 8 }, /* TEXICMD_HEADINGS */ + { doitem, "headitem", 8 }, /* TEXICMD_HEADITEM */ { dosymbol, "-", 1 }, /* TEXICMD_HYPHEN */ - { dofont, "i", 1 }, /* TEXICMD_I */ + { doinline, "i", 1 }, /* TEXICMD_I */ { doignblock, "ifclear", 7 }, /* TEXICMD_IFCLEAR */ { doignblock, "ifdocbook", 9 }, /* TEXICMD_IFDOCBOOK */ { doignblock, "ifhtml", 6 }, /* TEXICMD_IFHTML */ @@ -314,63 +389,83 @@ static const struct texitok texitoks[TEXICMD__MAX] = { { doignblock, "iftex", 5 }, /* TEXICMD_IFTEX */ { doignblock, "ifset", 5 }, /* TEXICMD_IFSET */ { doignblock, "ifxml", 5 }, /* TEXICMD_IFXML */ + { doignblock, "ignore", 6 }, /* TEXICMD_IGNORE */ { doignbracket, "image", 5 }, /* TEXICMD_IMAGE */ { doinclude, "include", 7 }, /* TEXICMD_INCLUDE */ { dodisplay, "indentblock", 11 }, /* TEXICMD_INDENTBLOCK */ { doignline, "insertcopying", 13 }, /* TEXICMD_INSERTCOPYING */ { doitem, "item", 4 }, /* TEXICMD_ITEM */ { doitemize, "itemize", 7 }, /* TEXICMD_ITEMIZE */ - { dofont, "kbd", 3 }, /* TEXICMD_KBD */ + { doitem, "itemx", 5 }, /* TEXICMD_ITEMX */ + { doinline, "kbd", 3 }, /* TEXICMD_KBD */ + { dobracket, "key", 3 }, /* TEXICMD_KEY */ + { doignline, "kindex", 6 }, /* TEXICMD_KINDEX */ { dosymbol, "LaTeX", 5 }, /* TEXICMD_LATEX */ { domath, "math", 4 }, /* TEXICMD_MATH */ { doignblock, "menu", 4 }, /* TEXICMD_MENU */ + { domultitable, "multitable", 10 }, /* TEXICMD_MULTITABLE */ + { doignline, "need", 4 }, /* TEXICMD_NEED */ { dosymbol, "\n", 1 }, /* TEXICMD_NEWLINE */ { doignline, "node", 4 }, /* TEXICMD_NODE */ { doignline, "noindent", 8 }, /* TEXICMD_NOINDENT */ + { doinline, "option", 6 }, /* TEXICMD_OPTION */ { dolink, "pxref", 5 }, /* TEXICMD_PXREF */ { dosymbol, "?", 1 }, /* TEXICMD_QUESTIONMARK */ { doquotation, "quotation", 9 }, /* TEXICMD_QUOTATION */ { doignline, "page", 4 }, /* TEXICMD_PAGE */ { doignline, "paragraphindent", 14 }, /* TEXICMD_PARINDENT */ { doignline, "printindex", 10 }, /* TEXICMD_PRINTINDEX */ - { dofont, "r", 1 }, /* TEXICMD_R */ + { doinline, "r", 1 }, /* TEXICMD_R */ { dobracket, "ref", 3 }, /* TEXICMD_REF */ - { dofont, "samp", 4 }, /* TEXICMD_SAMP */ - { dofont, "sansserif", 9 }, /* TEXICMD_SANSSERIF */ + { dosymbol, "result", 6 }, /* TEXICMD_RESULT */ + { doinline, "samp", 4 }, /* TEXICMD_SAMP */ + { doinline, "sansserif", 9 }, /* TEXICMD_SANSSERIF */ { dobracket, "sc", 2 }, /* TEXICMD_SC */ { dosection, "section", 7 }, /* TEXICMD_SECTION */ { doignline, "set", 3 }, /* TEXICMD_SET */ { doignline, "setchapternewpage", 17 }, /* TEXICMD_SETCHAPNEWPAGE */ { doignline, "setfilename", 11 }, /* TEXICMD_SETFILENAME */ { dotitle, "settitle", 8 }, /* TEXICMD_SETTITLE */ - { dofont, "slanted", 7 }, /* TEXICMD_SLANTED */ + { doinline, "slanted", 7 }, /* TEXICMD_SLANTED */ { dosp, "sp", 2 }, /* TEXICMD_SP */ { dosymbol, " ", 1 }, /* TEXICMD_SPACE */ + { doignline, "smallbook", 9 }, /* TEXICMD_SMALLBOOK */ { dodisplay, "smalldisplay", 12 }, /* TEXICMD_SMALLDISPLAY */ { doexample, "smallexample", 12 }, /* TEXICMD_SMALLEXAMPLE */ + { dodisplay, "smallformat", 11 }, /* TEXICMD_SMALLFORMAT */ { dodisplay, "smallindentblock", 16 }, /* TEXICMD_SMALLINDENTBLOCK */ { dosymbol, "{", 1 }, /* TEXICMD_SQUIGGLE_LEFT */ { dosymbol, "}", 1 }, /* TEXICMD_SQUIGGLE_RIGHT */ - { dofont, "strong", 6 }, /* TEXICMD_STRONG */ + { doinline, "strong", 6 }, /* TEXICMD_STRONG */ + { dosubsection, "subheading", 10 }, /* TEXICMD_SUBHEADING */ { dosubsection, "subsection", 10 }, /* TEXICMD_SUBSECTION */ { doignline, "subtitle", 8 }, /* TEXICMD_SUBTITLE */ - { dofont, "t", 1 }, /* TEXICMD_T */ - { dosymbol, "\t", 1 }, /* TEXICMD_TAB */ + { doignline, "syncodeindex", 12 }, /* TEXICMD_SYNCODEINDEX */ + { doinline, "t", 1 }, /* TEXICMD_T */ + { dotab, "tab", 3 }, /* TEXICMD_TAB */ + { dosymbol, "\t", 1 }, /* TEXICMD_TABSYM */ { dotable, "table", 5 }, /* TEXICMD_TABLE */ { doignblock, "tex", 3 }, /* TEXICMD_TEX */ { dosymbol, "TeX", 3 }, /* TEXICMD_TEXSYM */ + { doaccent, "~", 1 }, /* TEXICMD_TILDE */ { doignline, "title", 5 }, /* TEXICMD_TITLE */ { dobracket, "titlefont", 9 }, /* TEXICMD_TITLEFONT */ { doignblock, "titlepage", 9 }, /* TEXICMD_TITLEPAGE */ { dotop, "top", 3 }, /* TEXICMD_TOP */ + { doaccent, "\"", 1 }, /* TEXICMD_UMLAUT */ { dosection, "unnumbered", 10 }, /* TEXICMD_UNNUMBERED */ { dosection, "unnumberedsec", 13 }, /* TEXICMD_UNNUMBEREDSEC */ + { dosubsection, "unnumberedsubsec", 16 }, /* TEXICMD_UNNUMBEREDSUBSEC */ { dolink, "uref", 4 }, /* TEXICMD_UREF */ { dolink, "url", 3 }, /* TEXICMD_URL */ { doinline, "var", 3 }, /* TEXICMD_VAR */ + { doverbinclude, "verbatiminclude", 15 }, /* TEXICMD_VERBATIMINCLUDE */ + { doignline, "vindex", 6 }, /* TEXICMD_VINDEX */ { dosp, "vskip", 5 }, /* TEXICMD_VSKIP */ + { dotable, "vtable", 6 }, /* TEXICMD_VTABLE */ { dobracket, "w", 1 }, /* TEXICMD_W */ { dolink, "xref", 4 }, /* TEXICMD_XREF */ + /* TEXICMD__END */ }; /* @@ -466,6 +561,7 @@ texierr(struct texi *p, const char *fmt, ...) /* * Put a single data character to the output if we're not ignoring. * Adjusts our output status. + * This shouldn't be called for macros: just for ordinary text. */ static void texiputchar(struct texi *p, char c) @@ -473,6 +569,10 @@ texiputchar(struct texi *p, char c) if (p->ign) return; + + if ('.' == c && 0 == p->outcol) + fputs("\\&", stdout); + putchar(c); p->seenvs = 0; if ('\n' == c) { @@ -484,6 +584,7 @@ texiputchar(struct texi *p, char c) /* * Put multiple characters (see texiputchar()). + * This shouldn't be called for macros: just for ordinary text. */ static void texiputchars(struct texi *p, const char *s) @@ -501,9 +602,13 @@ static void teximacroclose(struct texi *p) { - /* FIXME: punctuation. */ - if (0 == --p->outmacro) - texiputchar(p, '\n'); + if (p->ign) + return; + + if (0 == --p->outmacro) { + putchar('\n'); + p->outcol = p->seenws = 0; + } } /* @@ -514,15 +619,26 @@ teximacroclose(struct texi *p) static void teximacroopen(struct texi *p, const char *s) { + int rc; - if (p->outcol && 0 == p->outmacro) - texiputchar(p, '\n'); + if (p->ign) + return; + + if (p->outcol && 0 == p->outmacro) { + putchar('\n'); + p->outcol = 0; + } + if (0 == p->outmacro) - texiputchar(p, '.'); + putchar('.'); else - texiputchar(p, ' '); - texiputchars(p, s); - texiputchar(p, ' '); + putchar(' '); + + if (EOF != (rc = fputs(s, stdout))) + p->outcol += rc; + + putchar(' '); + p->outcol++; p->outmacro++; p->seenws = 0; } @@ -534,17 +650,20 @@ static void teximacro(struct texi *p, const char *s) { + if (p->ign) + return; + if (p->outmacro) texierr(p, "\"%s\" in open line scope!?", s); - else if (p->literal) + if (p->literal) texierr(p, "\"%s\" in a literal scope!?", s); if (p->outcol) - texiputchar(p, '\n'); + putchar('\n'); - texiputchar(p, '.'); - texiputchars(p, s); - texiputchar(p, '\n'); + putchar('.'); + puts(s); + p->outcol = p->seenws = 0; } static void @@ -680,7 +799,7 @@ texiword(struct texi *p, const char *buf, size_t sz, size_t *pos, char extra) { - if (0 == p->outmacro && p->outcol > 72 && 0 == p->literal) + if (p->seenws && 0 == p->outmacro && p->outcol > 72 && 0 == p->literal) texiputchar(p, '\n'); /* FIXME: abstract this: we use it elsewhere. */ if (p->seenws && p->outcol && 0 == p->literal) @@ -868,11 +987,11 @@ parseeoln(struct texi *p, const char *buf, size_t sz, size_t end; enum texicmd cmd; - assert(0 == p->literal); - while (*pos < sz && '\n' != buf[*pos]) { while (*pos < sz && isws(buf[*pos])) { p->seenws = 1; + if (p->literal) + texiputchar(p, buf[*pos]); advance(p, buf, pos); } switch (buf[*pos]) { @@ -941,6 +1060,25 @@ parsesingle(struct texi *p, const char *buf, size_t sz (*texitoks[cmd].fp)(p, cmd, buf, sz, pos); } +static int +parselinearg(struct texi *p, const char *buf, size_t sz, size_t *pos) +{ + + while (*pos < sz && isws(buf[*pos])) { + p->seenws = 1; + advance(p, buf, pos); + } + + if (*pos < sz && '{' == buf[*pos]) + parsebracket(p, buf, sz, pos); + else if ('\n' != buf[*pos]) + parsesingle(p, buf, sz, pos); + else + return(0); + + return(1); +} + /* * Parse til the end of the buffer. */ @@ -1017,11 +1155,12 @@ parseto(struct texi *p, const char *buf, * This can be called in a nested context. */ static void -parsefile(struct texi *p, const char *fname) +parsefile(struct texi *p, const char *fname, int parse) { - struct texifile *f; - int fd; - struct stat st; + struct texifile *f; + int fd; + struct stat st; + size_t i; assert(p->filepos < 64); f = &p->files[p->filepos]; @@ -1044,46 +1183,43 @@ parsefile(struct texi *p, const char *fname) texiabort(p, fname); p->filepos++; - parseeof(p, f->map, f->mapsz); + if ( ! parse) { + /* + * We're printing verbatim output. + * Make sure it doesn't get interpreted as mdoc by + * escaping escapes and making sure leading dots don't + * trigger mdoc(7) expansion. + */ + for (i = 0; i < f->mapsz; i++) { + if (i > 0 && '.' == f->map[i]) + if ('\n' == f->map[i - 1]) + fputs("\\&", stdout); + putchar(f->map[i]); + if ('\\' == f->map[i]) + putchar('e'); + } + } else + parseeof(p, f->map, f->mapsz); texifilepop(p); } static void -dodeftypevar(struct texi *p, enum texicmd cmd, +dodefn(struct texi *p, enum texicmd cmd, const char *buf, size_t sz, size_t *pos) { const char *blk; - blk = TEXICMD_DEFTYPEVR == cmd ? - "deftypevr" : "deftypevar"; - - if (p->ign) { - parseto(p, buf, sz, pos, blk); - return; - } - - texivspace(p); - if (TEXICMD_DEFTYPEVR == cmd) { - parsebracket(p, buf, sz, pos); - texiputchars(p, ":\n"); - } - teximacroopen(p, "Vt"); - parseeoln(p, buf, sz, pos); - teximacroclose(p); - texivspace(p); - parseto(p, buf, sz, pos, blk); -} - -static void -dodeftypefun(struct texi *p, enum texicmd cmd, - const char *buf, size_t sz, size_t *pos) -{ - const char *blk; - blk = NULL; switch (cmd) { + case (TEXICMD_DEFFN): + case (TEXICMD_DEFTP): case (TEXICMD_DEFTYPEFN): case (TEXICMD_DEFTYPEFUN): + case (TEXICMD_DEFTYPEVAR): + case (TEXICMD_DEFTYPEVR): + case (TEXICMD_DEFUN): + case (TEXICMD_DEFVAR): + case (TEXICMD_DEFVR): blk = texitoks[cmd].tok; break; default: @@ -1091,33 +1227,100 @@ dodeftypefun(struct texi *p, enum texicmd cmd, } if (p->ign) { - if (NULL != blk) - parseto(p, buf, sz, pos, blk); + NULL != blk ? + parseto(p, buf, sz, pos, blk) : + parseeoln(p, buf, sz, pos); return; } + if (NULL != blk) + texivspace(p); + switch (cmd) { - case (TEXICMD_DEFTYPEFN): + case (TEXICMD_DEFMAC): + case (TEXICMD_DEFMACX): + texiputchars(p, "Macro"); + break; + case (TEXICMD_DEFTYPEVAR): + case (TEXICMD_DEFTYPEVARX): + case (TEXICMD_DEFVAR): + case (TEXICMD_DEFVARX): + texiputchars(p, "Variable"); + break; case (TEXICMD_DEFTYPEFUN): - texivspace(p); + case (TEXICMD_DEFTYPEFUNX): + case (TEXICMD_DEFUN): + case (TEXICMD_DEFUNX): + texiputchars(p, "Function"); break; default: + parselinearg(p, buf, sz, pos); break; } - if (TEXICMD_DEFTYPEFN == cmd || - TEXICMD_DEFTYPEFNX == cmd) { - parsebracket(p, buf, sz, pos); - texiputchars(p, ":\n"); + + texiputchars(p, ":\n"); + + switch (cmd) { + case (TEXICMD_DEFMAC): + case (TEXICMD_DEFMACX): + teximacroopen(p, "Dv"); + while (parselinearg(p, buf, sz, pos)) + /* Spin. */ ; + teximacroclose(p); + break; + case (TEXICMD_DEFFN): + case (TEXICMD_DEFFNX): + case (TEXICMD_DEFUN): + case (TEXICMD_DEFUNX): + teximacroopen(p, "Fo"); + parselinearg(p, buf, sz, pos); + teximacroclose(p); + teximacroopen(p, "Fa"); + while (parselinearg(p, buf, sz, pos)) + /* Spin. */ ; + teximacroclose(p); + teximacro(p, "Fc"); + break; + case (TEXICMD_DEFTYPEFUN): + case (TEXICMD_DEFTYPEFUNX): + case (TEXICMD_DEFTYPEFN): + case (TEXICMD_DEFTYPEFNX): + teximacroopen(p, "Ft"); + parselinearg(p, buf, sz, pos); + teximacroclose(p); + teximacroopen(p, "Fo"); + parselinearg(p, buf, sz, pos); + teximacroclose(p); + teximacroopen(p, "Fa"); + while (parselinearg(p, buf, sz, pos)) + /* Spin. */ ; + teximacroclose(p); + teximacro(p, "Fc"); + break; + case (TEXICMD_DEFTP): + case (TEXICMD_DEFTPX): + case (TEXICMD_DEFTYPEVAR): + case (TEXICMD_DEFTYPEVARX): + case (TEXICMD_DEFTYPEVR): + case (TEXICMD_DEFTYPEVRX): + teximacroopen(p, "Vt"); + while (parselinearg(p, buf, sz, pos)) + /* Spin. */ ; + teximacroclose(p); + break; + case (TEXICMD_DEFVAR): + case (TEXICMD_DEFVARX): + case (TEXICMD_DEFVR): + case (TEXICMD_DEFVRX): + teximacroopen(p, "Va"); + while (parselinearg(p, buf, sz, pos)) + /* Spin. */ ; + teximacroclose(p); + break; + default: + abort(); } - teximacroopen(p, "Ft"); - parsesingle(p, buf, sz, pos); - teximacroclose(p); - teximacroopen(p, "Fn"); - parsesingle(p, buf, sz, pos); - teximacroclose(p); - teximacroopen(p, "Li"); - parseeoln(p, buf, sz, pos); - teximacroclose(p); + texivspace(p); if (NULL != blk) parseto(p, buf, sz, pos, blk); @@ -1145,9 +1348,26 @@ static void doinline(struct texi *p, enum texicmd cmd, const char *buf, size_t sz, size_t *pos) { - const char *macro; + const char *macro = NULL; switch (cmd) { + case (TEXICMD_CODE): + case (TEXICMD_KBD): + case (TEXICMD_SAMP): + case (TEXICMD_T): + macro = "Li"; + break; + case (TEXICMD_CITE): + case (TEXICMD_DFN): + case (TEXICMD_EMPH): + case (TEXICMD_I): + case (TEXICMD_SLANTED): + macro = "Em"; + break; + case (TEXICMD_B): + case (TEXICMD_STRONG): + macro = "Sy"; + break; case (TEXICMD_COMMAND): macro = "Xr"; break; @@ -1157,14 +1377,17 @@ doinline(struct texi *p, enum texicmd cmd, case (TEXICMD_FILE): macro = "Pa"; break; + case (TEXICMD_OPTION): + macro = "Op"; + break; case (TEXICMD_VAR): macro = "Va"; break; default: - abort(); + break; } - if (p->literal) { + if (NULL == macro || p->literal) { parsebracket(p, buf, sz, pos); return; } @@ -1177,6 +1400,46 @@ doinline(struct texi *p, enum texicmd cmd, } static void +doverbinclude(struct texi *p, enum texicmd cmd, + const char *buf, size_t sz, size_t *pos) +{ + char fname[PATH_MAX], path[PATH_MAX]; + int rc; + size_t i; + + while (*pos < sz && ' ' == buf[*pos]) + advance(p, buf, pos); + + /* Read in the filename. */ + for (i = 0; *pos < sz && '\n' != buf[*pos]; i++) { + if (i == sizeof(fname) - 1) + break; + fname[i] = buf[*pos]; + advance(p, buf, pos); + } + + if (i == 0) + texierr(p, "path too short"); + else if ('\n' != buf[*pos]) + texierr(p, "path too long"); + else if ('/' == fname[0]) + texierr(p, "no absolute paths"); + fname[i] = '\0'; + + if (strstr(fname, "../") || strstr(fname, "/..")) + texierr(p, "insecure path"); + + rc = snprintf(path, sizeof(path), + "%s/%s", p->dirs[0], fname); + if (rc < 0) + texierr(p, "couldn't format path"); + else if ((size_t)rc >= sizeof(path)) + texierr(p, "path too long"); + + parsefile(p, path, 0); +} + +static void doinclude(struct texi *p, enum texicmd cmd, const char *buf, size_t sz, size_t *pos) { @@ -1216,7 +1479,7 @@ doinclude(struct texi *p, enum texicmd cmd, else if (-1 == access(path, R_OK)) continue; - parsefile(p, path); + parsefile(p, path, 1); return; } @@ -1224,41 +1487,6 @@ doinclude(struct texi *p, enum texicmd cmd, } static void -dofont(struct texi *p, enum texicmd cmd, - const char *buf, size_t sz, size_t *pos) -{ - const char *font; - - switch (cmd) { - case (TEXICMD_B): - case (TEXICMD_STRONG): - font = "\\fB"; - break; - case (TEXICMD_CITE): - case (TEXICMD_DFN): - case (TEXICMD_EMPH): - case (TEXICMD_I): - case (TEXICMD_SLANTED): - font = "\\fI"; - break; - case (TEXICMD_CODE): - case (TEXICMD_KBD): - case (TEXICMD_R): - case (TEXICMD_SAMP): - case (TEXICMD_SANSSERIF): - case (TEXICMD_T): - font = "\\fR"; - break; - default: - abort(); - } - - texiputchars(p, font); - parsebracket(p, buf, sz, pos); - texiputchars(p, "\\fP"); -} - -static void dobracket(struct texi *p, enum texicmd cmd, const char *buf, size_t sz, size_t *pos) { @@ -1271,7 +1499,16 @@ dodisplay(struct texi *p, enum texicmd cmd, const char *buf, size_t sz, size_t *pos) { - teximacro(p, "Bd -filled -offset indent"); + switch (cmd) { + case (TEXICMD_FORMAT): + case (TEXICMD_SMALLFORMAT): + teximacro(p, "Bd -filled"); + break; + default: + teximacro(p, "Bd -filled -offset indent"); + break; + } + p->seenvs = 1; /* FIXME: ignore and parseeoln. */ advanceeoln(p, buf, sz, pos, 1); @@ -1320,6 +1557,89 @@ dotitle(struct texi *p, enum texicmd cmd, } static void +doaccent(struct texi *p, enum texicmd cmd, + const char *buf, size_t sz, size_t *pos) +{ + + if (*pos == sz) + return; + advance(p, buf, pos); + switch (cmd) { + case (TEXICMD_ACUTE): + switch (buf[*pos]) { + case ('a'): case ('A'): + case ('e'): case ('E'): + case ('i'): case ('I'): + case ('o'): case ('O'): + case ('u'): case ('U'): + texiputchars(p, "\\(\'"); + texiputchar(p, buf[*pos]); + break; + default: + texiputchar(p, buf[*pos]); + } + break; + case (TEXICMD_CIRCUMFLEX): + switch (buf[*pos]) { + case ('a'): case ('A'): + case ('e'): case ('E'): + case ('i'): case ('I'): + case ('o'): case ('O'): + case ('u'): case ('U'): + texiputchars(p, "\\(^"); + texiputchar(p, buf[*pos]); + break; + default: + texiputchar(p, buf[*pos]); + } + break; + case (TEXICMD_GRAVE): + switch (buf[*pos]) { + case ('a'): case ('A'): + case ('e'): case ('E'): + case ('i'): case ('I'): + case ('o'): case ('O'): + case ('u'): case ('U'): + texiputchars(p, "\\(`"); + texiputchar(p, buf[*pos]); + break; + default: + texiputchar(p, buf[*pos]); + } + break; + case (TEXICMD_TILDE): + switch (buf[*pos]) { + case ('a'): case ('A'): + case ('n'): case ('N'): + case ('o'): case ('O'): + texiputchars(p, "\\(~"); + texiputchar(p, buf[*pos]); + break; + default: + texiputchar(p, buf[*pos]); + } + break; + case (TEXICMD_UMLAUT): + switch (buf[*pos]) { + case ('a'): case ('A'): + case ('e'): case ('E'): + case ('i'): case ('I'): + case ('o'): case ('O'): + case ('u'): case ('U'): + case ('y'): + texiputchars(p, "\\(:"); + texiputchar(p, buf[*pos]); + break; + default: + texiputchar(p, buf[*pos]); + } + break; + default: + abort(); + } +} + +static void dosymbol(struct texi *p, enum texicmd cmd, const char *buf, size_t sz, size_t *pos) { @@ -1333,7 +1653,7 @@ dosymbol(struct texi *p, enum texicmd cmd, case (TEXICMD_ASTERISK): case (TEXICMD_NEWLINE): case (TEXICMD_SPACE): - case (TEXICMD_TAB): + case (TEXICMD_TABSYM): texiputchar(p, ' '); break; case (TEXICMD_AT): @@ -1351,12 +1671,21 @@ dosymbol(struct texi *p, enum texicmd cmd, case (TEXICMD_DOTS): texiputchars(p, "..."); break; + case (TEXICMD_ERROR): + texiputchars(p, "error\\(->"); + break; + case (TEXICMD_EXPANSION): + texiputchars(p, "\\(->"); + break; case (TEXICMD_LATEX): texiputchars(p, "LaTeX"); break; case (TEXICMD_QUESTIONMARK): texiputchar(p, '?'); break; + case (TEXICMD_RESULT): + texiputchars(p, "\\(rA"); + break; case (TEXICMD_SQUIGGLE_LEFT): texiputchars(p, "{"); break; @@ -1482,6 +1811,7 @@ dosubsection(struct texi *p, enum texicmd cmd, else if (p->literal) texierr(p, "\"Em\" in a literal scope!?"); + /* We don't have a subsubsection, so make one up. */ texivspace(p); teximacroopen(p, "Em"); parseeoln(p, buf, sz, pos); @@ -1541,6 +1871,13 @@ dotop(struct texi *p, enum texicmd cmd, time_t t; char date[32]; + /* + * Here we print our standard mdoc(7) prologue. + * We use the title set with @settitle for the `Nd' description + * and the source document filename (the first one as invoked on + * the command line) for the title. + * The date is set to the current date. + */ t = time(NULL); strftime(date, sizeof(date), "%F", localtime(&t)); @@ -1571,6 +1908,12 @@ doitem(struct texi *p, enum texicmd cmd, const char *buf, size_t sz, size_t *pos) { + /* Multitable is using raw tbl(7). */ + if (TEXILIST_TABLE == p->list) { + texiputchar(p, '\n'); + return; + } + if (p->outmacro) texierr(p, "item in open line scope!?"); else if (p->literal) @@ -1587,8 +1930,9 @@ doitem(struct texi *p, enum texicmd cmd, texivspace(p); break; } - p->seenvs = 1; + /* Trick so we don't start with Pp. */ + p->seenvs = 1; parseeoln(p, buf, sz, pos); if (TEXILIST_ITEM == p->list) @@ -1598,6 +1942,80 @@ doitem(struct texi *p, enum texicmd cmd, } static void +dotab(struct texi *p, enum texicmd cmd, + const char *buf, size_t sz, size_t *pos) +{ + + /* This command is only useful in @multitable. */ + if (TEXILIST_TABLE == p->list) + texiputchar(p, '\t'); +} + +static void +domultitable(struct texi *p, enum texicmd cmd, + const char *buf, size_t sz, size_t *pos) +{ + enum texilist sv = p->list; + enum texicmd type; + size_t i, end, columns; + + p->list = TEXILIST_TABLE; + teximacro(p, "TS"); + columns = 0; + + /* Advance to the first argument... */ + while (*pos < sz && isws(buf[*pos])) + advance(p, buf, pos); + + /* Make sure we don't print anything when scanning. */ + p->ign++; + if ('@' == buf[*pos]) { + /* + * Look for @columnfractions. + * We ignore these, but we do use the number of + * arguments to set the number of columns that we'll + * have. + */ + type = texicmd(p, buf, *pos, sz, &end); + advanceto(p, buf, pos, end); + if (TEXICMD_COLUMNFRACTIONS != type) + texierr(p, "unknown multitable type"); + while (*pos < sz && '\n' != buf[*pos]) { + while (*pos < sz && isws(buf[*pos])) + advance(p, buf, pos); + while (*pos < sz && ! isws(buf[*pos])) { + if ('\n' == buf[*pos]) + break; + advance(p, buf, pos); + } + columns++; + } + } else + /* + * We have arguments. + * We could parse these, but it's easier to just let + * tbl(7) figure it out. + * So use this only to count arguments. + */ + while (parselinearg(p, buf, sz, pos) > 0) + columns++; + p->ign--; + + /* Left-justify each table entry. */ + for (i = 0; i < columns; i++) { + if (i > 0) + texiputchar(p, ' '); + texiputchar(p, 'l'); + } + texiputchars(p, ".\n"); + p->outmacro++; + parseto(p, buf, sz, pos, texitoks[cmd].tok); + p->outmacro--; + teximacro(p, "TE"); + p->list = sv; +} + +static void dotable(struct texi *p, enum texicmd cmd, const char *buf, size_t sz, size_t *pos) { @@ -1608,7 +2026,7 @@ dotable(struct texi *p, enum texicmd cmd, /* FIXME: ignore and parseeoln. */ advanceeoln(p, buf, sz, pos, 1); p->seenvs = 1; - parseto(p, buf, sz, pos, "table"); + parseto(p, buf, sz, pos, texitoks[cmd].tok); teximacro(p, "El"); p->list = sv; } @@ -1635,7 +2053,7 @@ doitemize(struct texi *p, enum texicmd cmd, { enum texilist sv = p->list; - p->list = TEXILIST_ITEM; + p->list = TEXILIST_NOITEM; teximacro(p, "Bl -bullet"); p->seenvs = 1; /* FIXME: ignore and parseeoln. */ @@ -1763,7 +2181,7 @@ main(int argc, char *argv[]) texi.ign = 1; texi.dirs = parsedirs(dir, Idir, &texi.dirsz); - parsefile(&texi, argv[0]); + parsefile(&texi, argv[0], 1); /* We shouldn't get here. */ texiexit(&texi); return(EXIT_FAILURE);