===================================================================
RCS file: /cvs/docbook2mdoc/docbook2mdoc.c,v
retrieving revision 1.5
retrieving revision 1.62
diff -u -p -r1.5 -r1.62
--- docbook2mdoc/docbook2mdoc.c	2014/03/28 10:03:36	1.5
+++ docbook2mdoc/docbook2mdoc.c	2019/03/22 17:42:53	1.62
@@ -1,6 +1,7 @@
-/*	$Id: docbook2mdoc.c,v 1.5 2014/03/28 10:03:36 kristaps Exp $ */
+/* $Id: docbook2mdoc.c,v 1.62 2019/03/22 17:42:53 schwarze Exp $ */
 /*
  * Copyright (c) 2014 Kristaps Dzonsons <kristaps@bsd.lv>
+ * Copyright (c) 2019 Ingo Schwarze <schwarze@openbsd.org>
  *
  * Permission to use, copy, modify, and distribute this software for any
  * purpose with or without fee is hereby granted, provided that the above
@@ -24,345 +25,219 @@
 #include <stdio.h>
 #include <stdlib.h>
 #include <string.h>
+#include <unistd.h>
 
-/*
- * All recognised node types.
- */
-enum	nodeid {
-	NODE_ROOT = 0, /* Must comes first. */
-	/* Alpha-ordered hereafter. */
-	NODE_ARG,
-	NODE_CITEREFENTRY,
-	NODE_CMDSYNOPSIS,
-	NODE_CODE,
-	NODE_COMMAND,
-	NODE_FUNCDEF,
-	NODE_FUNCPROTOTYPE,
-	NODE_FUNCSYNOPSIS,
-	NODE_FUNCSYNOPSISINFO,
-	NODE_FUNCTION,
-	NODE_MANVOLNUM, 
-	NODE_OPTION,
-	NODE_PARA,
-	NODE_PARAMDEF,
-	NODE_PARAMETER,
-	NODE_PROGRAMLISTING,
-	NODE_REFCLASS,
-	NODE_REFDESCRIPTOR,
-	NODE_REFENTRY,
-	NODE_REFENTRYTITLE,
-	NODE_REFMETA,
-	NODE_REFMISCINFO,
-	NODE_REFNAME,
-	NODE_REFNAMEDIV,
-	NODE_REFPURPOSE,
-	NODE_REFSECT1,
-	NODE_REFSYNOPSISDIV,
-	NODE_SYNOPSIS,
-	NODE_TEXT, 
-	NODE_TITLE,
-	NODE__MAX
-};
+#include "extern.h"
 
 /*
  * Global parse state.
  * Keep this as simple and small as possible.
  */
 struct	parse {
+	XML_Parser	 xml;
 	enum nodeid	 node; /* current (NODE_ROOT if pre-tree) */
+	const char	*fname; /* filename */
 	int		 stop; /* should we stop now? */
+#define	PARSE_EQN	 1
+	unsigned int	 flags; /* document-wide flags */
 	struct pnode	*root; /* root of parse tree */
 	struct pnode	*cur; /* current node in tree */
-	char		*b;
-	size_t		 bsz;
-	size_t		 mbsz;
+	char		*b; /* NUL-terminated buffer for pre-print */
+	size_t		 bsz; /* current length of b */
+	size_t		 mbsz; /* max bsz allocation */
+	int		 level; /* header level, starting at 1 */
+	int		 newln; /* output: are we on a fresh line */
 };
 
 struct	node {
-	const char	*name;
-	unsigned int	 flags;
-#define	NODE_IGNTEXT	 1 /* ignore all contained text */
+	const char	*name; /* docbook element name */
+	enum nodeid	 node; /* docbook element to generate */
 };
 
 TAILQ_HEAD(pnodeq, pnode);
+TAILQ_HEAD(pattrq, pattr);
 
+struct	pattr {
+	enum attrkey	 key;
+	enum attrval	 val;
+	char		*rawval;
+	TAILQ_ENTRY(pattr) child;
+};
+
 struct	pnode {
 	enum nodeid	 node; /* node type */
 	char		*b; /* binary data buffer */
+	char		*real; /* store for "b" */
 	size_t		 bsz; /* data buffer size */
 	struct pnode	*parent; /* parent (or NULL if top) */
 	struct pnodeq	 childq; /* queue of children */
+	struct pattrq	 attrq; /* attributes of node */
 	TAILQ_ENTRY(pnode) child;
 };
 
-static	const struct node nodes[NODE__MAX] = {
-	{ NULL, 0 }, 
-	{ "arg", 0 }, 
-	{ "citerefentry", NODE_IGNTEXT }, 
-	{ "cmdsynopsis", NODE_IGNTEXT }, 
-	{ "code", 0 }, 
-	{ "command", 0 }, 
-	{ "funcdef", 0 },
-	{ "funcprototype", NODE_IGNTEXT }, 
-	{ "funcsynopsis", NODE_IGNTEXT }, 
-	{ "funcsynopsisinfo", 0 }, 
-	{ "function", 0 }, 
-	{ "manvolnum", 0 }, 
-	{ "option", 0 }, 
-	{ "para", 0 }, 
-	{ "paramdef", 0 },
-	{ "parameter", 0 }, 
-	{ "programlisting", 0 }, 
-	{ "refclass", NODE_IGNTEXT }, 
-	{ "refdescriptor", NODE_IGNTEXT }, 
-	{ "refentry", NODE_IGNTEXT }, 
-	{ "refentrytitle", 0 }, 
-	{ "refmeta", NODE_IGNTEXT }, 
-	{ "refmiscinfo", NODE_IGNTEXT }, 
-	{ "refname", 0 }, 
-	{ "refnamediv", NODE_IGNTEXT }, 
-	{ "refpurpose", 0 }, 
-	{ "refsect1", 0 }, 
-	{ "refsynopsisdiv", NODE_IGNTEXT }, 
-	{ "synopsis", 0 }, 
-	{ NULL, 0 }, 
-	{ "title", 0 }, 
+static	const char *attrkeys[ATTRKEY__MAX] = {
+	"choice",
+	"class",
+	"close",
+	"id",
+	"linkend",
+	"open",
+	"rep"
 };
 
-/*
- * Look up whether "parent" is a valid parent for "node".
- */
-static int
-isparent(enum nodeid node, enum nodeid parent)
-{
+static	const char *attrvals[ATTRVAL__MAX] = {
+	"monospaced",
+	"norepeat",
+	"opt",
+	"plain",
+	"repeat",
+	"req"
+};
 
-	switch (node) {
-	case (NODE_ROOT):
-		return(0);
-	case (NODE_ARG):
-		switch (parent) {
-		case (NODE_ARG):
-		case (NODE_CMDSYNOPSIS):
-			return(1);
-		default:
-			break;
-		}
-		return(0);
-	case (NODE_CITEREFENTRY):
-		switch (parent) {
-		case (NODE_FUNCSYNOPSISINFO):
-		case (NODE_PARA):
-		case (NODE_PROGRAMLISTING):
-		case (NODE_REFDESCRIPTOR):
-		case (NODE_REFENTRYTITLE):
-		case (NODE_REFNAME):
-		case (NODE_REFPURPOSE):
-		case (NODE_SYNOPSIS):
-		case (NODE_TITLE):
-			return(1);
-		default:
-			break;
-		}
-		return(0);
-	case (NODE_CMDSYNOPSIS):
-		switch (parent) {
-		case (NODE_PARA):
-		case (NODE_REFSECT1):
-		case (NODE_REFSYNOPSISDIV):
-			return(1);
-		default:
-			break;
-		}
-		return(0);
-	case (NODE_CODE):
-		switch (parent) {
-		case (NODE_FUNCSYNOPSISINFO):
-		case (NODE_PARA):
-		case (NODE_PROGRAMLISTING):
-		case (NODE_REFDESCRIPTOR):
-		case (NODE_REFENTRYTITLE):
-		case (NODE_REFNAME):
-		case (NODE_REFPURPOSE):
-		case (NODE_SYNOPSIS):
-		case (NODE_TITLE):
-			return(1);
-		default:
-			break;
-		}
-		return(0);
-	case (NODE_COMMAND):
-		switch (parent) {
-		case (NODE_CMDSYNOPSIS):
-		case (NODE_FUNCSYNOPSISINFO):
-		case (NODE_PARA):
-		case (NODE_PROGRAMLISTING):
-		case (NODE_REFDESCRIPTOR):
-		case (NODE_REFENTRYTITLE):
-		case (NODE_REFNAME):
-		case (NODE_REFPURPOSE):
-		case (NODE_SYNOPSIS):
-		case (NODE_TITLE):
-			return(1);
-		default:
-			break;
-		}
-		return(0);
-	case (NODE_FUNCDEF):
-		return(NODE_FUNCPROTOTYPE == parent);
-	case (NODE_FUNCPROTOTYPE):
-		return(NODE_FUNCSYNOPSIS == parent);
-	case (NODE_FUNCSYNOPSIS):
-		switch (parent) {
-		case (NODE_PARA):
-		case (NODE_REFSECT1):
-		case (NODE_REFSYNOPSISDIV):
-			return(1);
-		default:
-			break;
-		}
-		return(0);
-	case (NODE_FUNCSYNOPSISINFO):
-		return(NODE_FUNCSYNOPSIS == parent);
-	case (NODE_FUNCTION):
-		switch (parent) {
-		case (NODE_CODE):
-		case (NODE_FUNCDEF):
-		case (NODE_FUNCSYNOPSISINFO):
-		case (NODE_PARA):
-		case (NODE_PROGRAMLISTING):
-		case (NODE_REFDESCRIPTOR):
-		case (NODE_REFENTRYTITLE):
-		case (NODE_REFNAME):
-		case (NODE_REFPURPOSE):
-		case (NODE_SYNOPSIS):
-		case (NODE_TITLE):
-			return(1);
-		default:
-			break;
-		}
-		return(0);
-	case (NODE_MANVOLNUM):
-		switch (parent) {
-		case (NODE_CITEREFENTRY):
-		case (NODE_REFMETA):
-			return(1);
-		default:
-			break;
-		}
-		return(0);
-	case (NODE_OPTION):
-		switch (parent) {
-		case (NODE_ARG):
-		case (NODE_FUNCSYNOPSISINFO):
-		case (NODE_PARA):
-		case (NODE_PROGRAMLISTING):
-		case (NODE_REFDESCRIPTOR):
-		case (NODE_REFENTRYTITLE):
-		case (NODE_REFNAME):
-		case (NODE_REFPURPOSE):
-		case (NODE_SYNOPSIS):
-		case (NODE_TITLE):
-			return(1);
-		default:
-			break;
-		}
-		return(0);
-	case (NODE_PARA):
-		switch (parent) {
-		case (NODE_REFSECT1):
-		case (NODE_REFSYNOPSISDIV):
-			return(1);
-		default:
-			break;
-		}
-		return(0);
-	case (NODE_PARAMDEF):
-		return(NODE_FUNCPROTOTYPE == parent);
-	case (NODE_PARAMETER):
-		switch (parent) {
-		case (NODE_CODE):
-		case (NODE_FUNCSYNOPSISINFO):
-		case (NODE_PARA):
-		case (NODE_PARAMDEF):
-		case (NODE_PROGRAMLISTING):
-		case (NODE_REFDESCRIPTOR):
-		case (NODE_REFENTRYTITLE):
-		case (NODE_REFNAME):
-		case (NODE_REFPURPOSE):
-		case (NODE_SYNOPSIS):
-		case (NODE_TITLE):
-			return(1);
-		default:
-			break;
-		}
-		return(0);
-	case (NODE_PROGRAMLISTING):
-		switch (parent) {
-		case (NODE_PARA):
-		case (NODE_REFSECT1):
-		case (NODE_REFSYNOPSISDIV):
-			return(1);
-		default:
-			break;
-		}
-		return(0);
-	case (NODE_REFCLASS):
-		return(parent == NODE_REFNAMEDIV);
-	case (NODE_REFDESCRIPTOR):
-		return(parent == NODE_REFNAMEDIV);
-	case (NODE_REFENTRY):
-		return(parent == NODE_ROOT);
-	case (NODE_REFENTRYTITLE):
-		switch (parent) {
-		case (NODE_CITEREFENTRY):
-		case (NODE_REFMETA):
-			return(1);
-		default:
-			break;
-		}
-	case (NODE_REFMETA):
-		return(parent == NODE_REFENTRY);
-	case (NODE_REFMISCINFO):
-		return(parent == NODE_REFMETA);
-	case (NODE_REFNAME):
-		return(parent == NODE_REFNAMEDIV);
-	case (NODE_REFNAMEDIV):
-		return(parent == NODE_REFENTRY);
-	case (NODE_REFPURPOSE):
-		return(parent == NODE_REFNAMEDIV);
-	case (NODE_REFSECT1):
-		return(parent == NODE_REFENTRY);
-	case (NODE_REFSYNOPSISDIV):
-		return(parent == NODE_REFENTRY);
-	case (NODE_SYNOPSIS):
-		switch (parent) {
-		case (NODE_REFSYNOPSISDIV):
-		case (NODE_REFSECT1):
-			return(1);
-		default:
-			break;
-		}
-		return(0);
-	case (NODE_TITLE):
-		switch (parent) {
-		case (NODE_REFSECT1):
-		case (NODE_REFSYNOPSISDIV):
-			return(1);
-		default:
-			break;
-		}
-		return(0);
-	case (NODE_TEXT):
-		return(1);
-	case (NODE__MAX):
-		break;
-	}
+static	const struct node nodes[] = {
+	{ "acronym",		NODE_ACRONYM },
+	{ "affiliation",	NODE_AFFILIATION },
+	{ "anchor",		NODE_ANCHOR },
+	{ "application",	NODE_APPLICATION },
+	{ "arg",		NODE_ARG },
+	{ "author",		NODE_AUTHOR },
+	{ "authorgroup",	NODE_AUTHORGROUP },
+	{ "blockquote",		NODE_BLOCKQUOTE },
+	{ "book",		NODE_BOOK },
+	{ "bookinfo",		NODE_BOOKINFO },
+	{ "caution",		NODE_CAUTION },
+	{ "chapter",		NODE_SECTION },
+	{ "citerefentry",	NODE_CITEREFENTRY },
+	{ "citetitle",		NODE_CITETITLE },
+	{ "cmdsynopsis",	NODE_CMDSYNOPSIS },
+	{ "code",		NODE_CODE },
+	{ "colspec",		NODE_COLSPEC },
+	{ "command",		NODE_COMMAND },
+	{ "constant",		NODE_CONSTANT },
+	{ "copyright",		NODE_COPYRIGHT },
+	{ "date",		NODE_DATE },
+	{ "editor",		NODE_EDITOR },
+	{ "emphasis",		NODE_EMPHASIS },
+	{ "entry",		NODE_ENTRY },
+	{ "envar",		NODE_ENVAR },
+	{ "fieldsynopsis",	NODE_FIELDSYNOPSIS },
+	{ "filename",		NODE_FILENAME },
+	{ "firstname",		NODE_FIRSTNAME },
+	{ "firstterm",		NODE_FIRSTTERM },
+	{ "footnote",		NODE_FOOTNOTE },
+	{ "funcdef",		NODE_FUNCDEF },
+	{ "funcprototype",	NODE_FUNCPROTOTYPE },
+	{ "funcsynopsis",	NODE_FUNCSYNOPSIS },
+	{ "funcsynopsisinfo",	NODE_FUNCSYNOPSISINFO },
+	{ "function",		NODE_FUNCTION },
+	{ "glossterm",		NODE_GLOSSTERM },
+	{ "group",		NODE_GROUP },
+	{ "holder",		NODE_HOLDER },
+	{ "index",		NODE_INDEX },
+	{ "indexterm",		NODE_INDEXTERM },
+	{ "info",		NODE_INFO },
+	{ "informalequation",	NODE_INFORMALEQUATION },
+	{ "informaltable",	NODE_INFORMALTABLE },
+	{ "inlineequation",	NODE_INLINEEQUATION },
+	{ "itemizedlist",	NODE_ITEMIZEDLIST },
+	{ "keysym",		NODE_KEYSYM },
+	{ "legalnotice",	NODE_LEGALNOTICE },
+	{ "link",		NODE_LINK },
+	{ "listitem",		NODE_LISTITEM },
+	{ "literal",		NODE_LITERAL },
+	{ "literallayout",	NODE_LITERALLAYOUT },
+	{ "manvolnum",		NODE_MANVOLNUM },
+	{ "member",		NODE_MEMBER },
+	{ "mml:math",		NODE_MML_MATH },
+	{ "mml:mfenced",	NODE_MML_MFENCED },
+	{ "mml:mfrac",		NODE_MML_MFRAC },
+	{ "mml:mi",		NODE_MML_MI },
+	{ "mml:mn",		NODE_MML_MN },
+	{ "mml:mo",		NODE_MML_MO },
+	{ "mml:mrow",		NODE_MML_MROW },
+	{ "mml:msub",		NODE_MML_MSUB },
+	{ "mml:msup",		NODE_MML_MSUP },
+	{ "modifier",		NODE_MODIFIER },
+	{ "note",		NODE_NOTE },
+	{ "option",		NODE_OPTION },
+	{ "orderedlist",	NODE_ORDEREDLIST },
+	{ "orgname",		NODE_ORGNAME },
+	{ "othername",		NODE_OTHERNAME },
+	{ "para",		NODE_PARA },
+	{ "paramdef",		NODE_PARAMDEF },
+	{ "parameter",		NODE_PARAMETER },
+	{ "part",		NODE_SECTION },
+	{ "phrase",		NODE_PHRASE },
+	{ "preface",		NODE_PREFACE },
+	{ "primary",		NODE_PRIMARY },
+	{ "programlisting",	NODE_PROGRAMLISTING },
+	{ "prompt",		NODE_PROMPT },
+	{ "quote",		NODE_QUOTE },
+	{ "refclass",		NODE_REFCLASS },
+	{ "refdescriptor",	NODE_REFDESCRIPTOR },
+	{ "refentry",		NODE_REFENTRY },
+	{ "refentryinfo",	NODE_REFENTRYINFO },
+	{ "refentrytitle",	NODE_REFENTRYTITLE },
+	{ "refmeta",		NODE_REFMETA },
+	{ "refmetainfo",	NODE_REFMETAINFO },
+	{ "refmiscinfo",	NODE_REFMISCINFO },
+	{ "refname",		NODE_REFNAME },
+	{ "refnamediv",		NODE_REFNAMEDIV },
+	{ "refpurpose",		NODE_REFPURPOSE },
+	{ "refsect1",		NODE_SECTION },
+	{ "refsect2",		NODE_SECTION },
+	{ "refsect3",		NODE_SECTION },
+	{ "refsection",		NODE_SECTION },
+	{ "refsynopsisdiv",	NODE_REFSYNOPSISDIV },
+	{ "releaseinfo",	NODE_RELEASEINFO },
+	{ "replaceable",	NODE_REPLACEABLE },
+	{ "row",		NODE_ROW },
+	{ "sbr",		NODE_SBR },
+	{ "screen",		NODE_SCREEN },
+	{ "secondary",		NODE_SECONDARY },
+	{ "sect1",		NODE_SECTION },
+	{ "sect2",		NODE_SECTION },
+	{ "section",		NODE_SECTION },
+	{ "sgmltag",		NODE_SGMLTAG },
+	{ "simplelist",		NODE_SIMPLELIST },
+	{ "spanspec",		NODE_SPANSPEC },
+	{ "structname",		NODE_STRUCTNAME },
+	{ "subtitle",		NODE_SUBTITLE },
+	{ "surname",		NODE_SURNAME },
+	{ "synopsis",		NODE_SYNOPSIS },
+	{ "table",		NODE_TABLE },
+	{ "tbody",		NODE_TBODY },
+	{ "term",		NODE_TERM },
+	{ "tfoot",		NODE_TFOOT },
+	{ "tgroup",		NODE_TGROUP },
+	{ "thead",		NODE_THEAD },
+	{ "tip",		NODE_TIP },
+	{ "title",		NODE_TITLE },
+	{ "trademark",		NODE_TRADEMARK },
+	{ "type",		NODE_TYPE },
+	{ "ulink",		NODE_ULINK },
+	{ "userinput",		NODE_USERINPUT },
+	{ "variablelist",	NODE_VARIABLELIST },
+	{ "varlistentry",	NODE_VARLISTENTRY },
+	{ "varname",		NODE_VARNAME },
+	{ "warning",		NODE_WARNING },
+	{ "wordasword",		NODE_WORDASWORD },
+	{ "year",		NODE_YEAR },
+	{ NULL,			NODE__MAX }
+};
 
-	abort();
-	return(0);
-}
+static	int warn = 0;
 
 static void
+pnode_print(struct parse *p, struct pnode *pn);
+
+/*
+ * Process a stream of characters.
+ * We store text as nodes in and of themselves.
+ * If a text node is already open, append to it.
+ * If it's not open, open one under the current context.
+ */
+static void
 xml_char(void *arg, const XML_Char *p, int sz)
 {
 	struct parse	*ps = arg;
@@ -373,24 +248,23 @@ xml_char(void *arg, const XML_Char *p, int sz)
 	if (ps->stop || NODE_ROOT == ps->node)
 		return;
 
-	/* Not supposed to be collecting text. */
 	assert(NULL != ps->cur);
-	if (NODE_IGNTEXT & nodes[ps->node].flags)
-		return;
 
 	/*
 	 * Are we in the midst of processing text?
 	 * If we're not processing text right now, then create a text
 	 * node for doing so.
 	 * However, don't do so unless we have some non-whitespace to
-	 * process!
+	 * process: strip out all leading whitespace to be sure.
 	 */
 	if (NODE_TEXT != ps->node) {
 		for (i = 0; i < sz; i++)
-			if ( ! isspace((int)p[i]))
+			if ( ! isspace((unsigned char)p[i]))
 				break;
 		if (i == sz)
 			return;
+		p += i;
+		sz -= i;
 		dat = calloc(1, sizeof(struct pnode));
 		if (NULL == dat) {
 			perror(NULL);
@@ -400,15 +274,15 @@ xml_char(void *arg, const XML_Char *p, int sz)
 		dat->node = ps->node = NODE_TEXT;
 		dat->parent = ps->cur;
 		TAILQ_INIT(&dat->childq);
+		TAILQ_INIT(&dat->attrq);
 		TAILQ_INSERT_TAIL(&ps->cur->childq, dat, child);
 		ps->cur = dat;
 		assert(NULL != ps->root);
-
 	}
 
 	/* Append to current buffer. */
 	assert(sz >= 0);
-	ps->cur->b = realloc(ps->cur->b, 
+	ps->cur->b = realloc(ps->cur->b,
 		ps->cur->bsz + (size_t)sz);
 	if (NULL == ps->cur->b) {
 		perror(NULL);
@@ -416,71 +290,89 @@ xml_char(void *arg, const XML_Char *p, int sz)
 	}
 	memcpy(ps->cur->b + ps->cur->bsz, p, sz);
 	ps->cur->bsz += (size_t)sz;
+	ps->cur->real = ps->cur->b;
 }
 
+static void
+pnode_trim(struct pnode *pn)
+{
+
+	assert(NODE_TEXT == pn->node);
+	for ( ; pn->bsz > 0; pn->bsz--)
+		if ( ! isspace((unsigned char)pn->b[pn->bsz - 1]))
+			break;
+}
+
 /*
  * Begin an element.
  * First, look for the element.
  * If we don't find it and we're not parsing, keep going.
- * If we don't find it (and we're parsing), puke and exit.
+ * If we don't find it and we're parsing, puke and exit.
  * If we find it but we're not parsing yet (i.e., it's not a refentry
  * and thus out of context), keep going.
- * If we're at the root and already have a tree, puke and exit.
+ * If we find it and we're at the root and already have a tree, puke and
+ * exit (FIXME: I don't think this is right?).
+ * If we find it but we're parsing a text node, close out the text node,
+ * return to its parent, and keep going.
  * Make sure that the element is in the right context.
  * Lastly, put the node onto our parse tree and continue.
  */
 static void
 xml_elem_start(void *arg, const XML_Char *name, const XML_Char **atts)
 {
-	struct parse	*ps = arg;
-	enum nodeid	 node;
-	struct pnode	*dat;
+	struct parse	 *ps = arg;
+	const struct node *node;
+	enum attrkey	  key;
+	enum attrval	  val;
+	struct pnode	 *dat;
+	struct pattr	 *pattr;
+	const XML_Char	**att;
 
-	if (ps->stop)
+	/* FIXME: find a better way to ditch other namespaces. */
+	if (ps->stop || 0 == strcmp(name, "xi:include"))
 		return;
 
 	/* Close out text node, if applicable... */
 	if (NODE_TEXT == ps->node) {
 		assert(NULL != ps->cur);
+		pnode_trim(ps->cur);
 		ps->cur = ps->cur->parent;
 		assert(NULL != ps->cur);
 		ps->node = ps->cur->node;
 	}
 
-	for (node = 0; node < NODE__MAX; node++)
-		if (NULL == nodes[node].name)
-			continue;
-		else if (0 == strcmp(nodes[node].name, name))
+	for (node = nodes; NULL != node->name; node++)
+		if (0 == strcmp(node->name, name))
 			break;
 
-	if (NODE__MAX == node && NODE_ROOT == ps->node) {
-		fprintf(stderr, "%s: ignoring node\n", name);
-		return;
-	} else if (NODE__MAX == node) {
-		fprintf(stderr, "%s: unknown node\n", name);
+	if (NULL == node->name) {
+		if (NODE_ROOT == ps->node)
+			return;
+		fprintf(stderr, "%s:%zu:%zu: unknown node \"%s\"\n",
+			ps->fname, XML_GetCurrentLineNumber(ps->xml),
+			XML_GetCurrentColumnNumber(ps->xml), name);
 		ps->stop = 1;
 		return;
 	} else if (NODE_ROOT == ps->node && NULL != ps->root) {
-		fprintf(stderr, "%s: reentering?\n", name);
+		fprintf(stderr, "%s:%zu:%zu: multiple refentries\n",
+			ps->fname, XML_GetCurrentLineNumber(ps->xml),
+			XML_GetCurrentColumnNumber(ps->xml));
 		ps->stop = 1;
 		return;
-	} else if (NODE_ROOT == ps->node && NODE_REFENTRY != node) {
-		fprintf(stderr, "%s: known node w/o context\n", name);
-		return;
-	} else if ( ! isparent(node, ps->node)) {
-		fprintf(stderr, "%s: bad parent\n", name);
-		ps->stop = 1;
-		return;
 	}
 
+	if (NODE_INLINEEQUATION == node->node)
+		ps->flags |= PARSE_EQN;
+
 	if (NULL == (dat = calloc(1, sizeof(struct pnode)))) {
 		perror(NULL);
 		exit(EXIT_FAILURE);
 	}
 
-	dat->node = ps->node = node;
+	dat->node = ps->node = node->node;
 	dat->parent = ps->cur;
 	TAILQ_INIT(&dat->childq);
+	TAILQ_INIT(&dat->attrq);
 
 	if (NULL != ps->cur)
 		TAILQ_INSERT_TAIL(&ps->cur->childq, dat, child);
@@ -488,11 +380,40 @@ xml_elem_start(void *arg, const XML_Char *name, const 
 	ps->cur = dat;
 	if (NULL == ps->root)
 		ps->root = dat;
+
+	/*
+	 * Process attributes.
+	 */
+	for (att = atts; NULL != *att; att += 2) {
+		for (key = 0; key < ATTRKEY__MAX; key++)
+			if (0 == strcmp(*att, attrkeys[key]))
+				break;
+		if (ATTRKEY__MAX == key) {
+			if (warn)
+				fprintf(stderr, "%s:%zu:%zu: warning: "
+					"unknown attribute \"%s\"\n",
+					ps->fname,
+					XML_GetCurrentLineNumber(ps->xml),
+					XML_GetCurrentColumnNumber(ps->xml),
+					*att);
+			continue;
+		}
+		for (val = 0; val < ATTRVAL__MAX; val++)
+			if (0 == strcmp(*(att + 1), attrvals[val]))
+				break;
+		pattr = calloc(1, sizeof(struct pattr));
+		pattr->key = key;
+		pattr->val = val;
+		if (ATTRVAL__MAX == val)
+			pattr->rawval = strdup(*(att + 1));
+		TAILQ_INSERT_TAIL(&dat->attrq, pattr, child);
+	}
+
 }
 
 /*
  * Roll up the parse tree.
- * Does nothing else special.
+ * If we're at a text node, roll that one up first.
  * If we hit the root, then assign ourselves as the NODE_ROOT.
  */
 static void
@@ -500,12 +421,16 @@ xml_elem_end(void *arg, const XML_Char *name)
 {
 	struct parse	*ps = arg;
 
+	/* FIXME: find a better way to ditch other namespaces. */
 	if (ps->stop || NODE_ROOT == ps->node)
 		return;
+	else if (0 == strcmp(name, "xi:include"))
+		return;
 
 	/* Close out text node, if applicable... */
 	if (NODE_TEXT == ps->node) {
 		assert(NULL != ps->cur);
+		pnode_trim(ps->cur);
 		ps->cur = ps->cur->parent;
 		assert(NULL != ps->cur);
 		ps->node = ps->cur->node;
@@ -517,10 +442,14 @@ xml_elem_end(void *arg, const XML_Char *name)
 		ps->node = ps->cur->node;
 }
 
+/*
+ * Recursively free a node (NULL is ok).
+ */
 static void
 pnode_free(struct pnode *pn)
 {
 	struct pnode	*pp;
+	struct pattr	*ap;
 
 	if (NULL == pn)
 		return;
@@ -530,10 +459,19 @@ pnode_free(struct pnode *pn)
 		pnode_free(pp);
 	}
 
-	free(pn->b);
+	while (NULL != (ap = TAILQ_FIRST(&pn->attrq))) {
+		TAILQ_REMOVE(&pn->attrq, ap, child);
+		free(ap->rawval);
+		free(ap);
+	}
+
+	free(pn->real);
 	free(pn);
 }
 
+/*
+ * Unlink a node from its parent and pnode_free() it.
+ */
 static void
 pnode_unlink(struct pnode *pn)
 {
@@ -543,6 +481,9 @@ pnode_unlink(struct pnode *pn)
 	pnode_free(pn);
 }
 
+/*
+ * Unlink all children of a node and pnode_free() them.
+ */
 static void
 pnode_unlinksub(struct pnode *pn)
 {
@@ -551,6 +492,40 @@ pnode_unlinksub(struct pnode *pn)
 		pnode_unlink(TAILQ_FIRST(&pn->childq));
 }
 
+/*
+ * Retrieve an enumeration attribute from a node.
+ * Return ATTRVAL__MAX if the node has no such attribute.
+ */
+enum attrval
+pnode_getattr(struct pnode *pn, enum attrkey key)
+{
+	struct pattr	*ap;
+
+	TAILQ_FOREACH(ap, &pn->attrq, child)
+		if (ap->key == key)
+			return ap->val;
+	return(ATTRVAL__MAX);
+}
+
+/*
+ * Retrieve an attribute string from a node.
+ * Return defval if the node has no such attribute.
+ */
+const char *
+pnode_getattr_raw(struct pnode *pn, enum attrkey key, const char *defval)
+{
+	struct pattr	*ap;
+
+	TAILQ_FOREACH(ap, &pn->attrq, child)
+		if (ap->key == key)
+			return ATTRVAL__MAX == ap->val ? ap->rawval :
+			    attrvals[ap->val];
+	return(defval);
+}
+
+/*
+ * Reset the lookaside buffer.
+ */
 static void
 bufclear(struct parse *p)
 {
@@ -558,6 +533,11 @@ bufclear(struct parse *p)
 	p->b[p->bsz = 0] = '\0';
 }
 
+/*
+ * Append NODE_TEXT contents to the current buffer, reallocating its
+ * size if necessary.
+ * The buffer is ALWAYS NUL-terminated.
+ */
 static void
 bufappend(struct parse *p, struct pnode *pn)
 {
@@ -575,6 +555,12 @@ bufappend(struct parse *p, struct pnode *pn)
 	p->b[p->bsz] = '\0';
 }
 
+/*
+ * Recursively append all NODE_TEXT nodes to the buffer.
+ * This descends into non-text nodes, but doesn't do anything beyond
+ * them.
+ * In other words, this is a recursive text grok.
+ */
 static void
 bufappend_r(struct parse *p, struct pnode *pn)
 {
@@ -587,44 +573,78 @@ bufappend_r(struct parse *p, struct pnode *pn)
 }
 
 /*
- * Print text presumably on a macro line.
- * Ignore any child macros.
+ * Recursively search and return the first instance of "node".
+ */
+static struct pnode *
+pnode_findfirst(struct pnode *pn, enum nodeid node)
+{
+	struct pnode	*pp, *res;
+
+	res = NULL;
+	TAILQ_FOREACH(pp, &pn->childq, child) {
+		res = pp->node == node ? pp :
+			pnode_findfirst(pp, node);
+		if (NULL != res)
+			break;
+	}
+
+	return(res);
+}
+
+#define MACROLINE_NORM	0
+#define MACROLINE_UPPER	1
+#define	MACROLINE_NOWS 2
+/*
+ * Recursively print text presumably on a macro line.
  * Convert all whitespace to regular spaces.
  */
 static void
-pnode_printmacrolinepart(struct parse *p, struct pnode *pn)
+pnode_printmacrolinetext(struct parse *p, struct pnode *pn, int fl)
 {
 	char		*cp;
 
+	if (0 == p->newln && ! (MACROLINE_NOWS & fl))
+		putchar(' ');
+
 	bufclear(p);
 	bufappend_r(p, pn);
 
 	/* Convert all space to spaces. */
 	for (cp = p->b; '\0' != *cp; cp++)
-		if (isspace((int)*cp))
+		if (isspace((unsigned char)*cp))
 			*cp = ' ';
 
-	for (cp = p->b; isspace((int)*cp); cp++)
+	for (cp = p->b; isspace((unsigned char)*cp); cp++)
 		/* Spin past whitespace (XXX: necessary?) */ ;
 	for ( ; '\0' != *cp; cp++) {
 		/* Escape us if we look like a macro. */
 		if ((cp == p->b || ' ' == *(cp - 1)) &&
-			isupper((int)*cp) &&
-			'\0' != *(cp + 1) && 
-			islower((int)*(cp + 1)) &&
-			('\0' == *(cp + 2) || 
+			isupper((unsigned char)*cp) &&
+			'\0' != *(cp + 1) &&
+			islower((unsigned char)*(cp + 1)) &&
+			('\0' == *(cp + 2) ||
 			 ' ' == *(cp + 2) ||
-			 (islower((int)*(cp + 2)) &&
-			  ('\0' == *(cp + 3) || 
+			 (islower((unsigned char)*(cp + 2)) &&
+			  ('\0' == *(cp + 3) ||
 			   ' ' == *(cp + 3)))))
 			fputs("\\&", stdout);
-		putchar(*cp);
+		if (MACROLINE_UPPER & fl)
+			putchar(toupper((unsigned char)*cp));
+		else
+			putchar(*cp);
 		/* If we're a character escape, escape us. */
 		if ('\\' == *cp)
 			putchar('e');
 	}
 }
 
+static void
+pnode_printmacrolinepart(struct parse *p, struct pnode *pn)
+{
+
+	pnode_printmacrolinetext(p, pn, 0);
+}
+
 /*
  * Just pnode_printmacrolinepart() but with a newline.
  * If no text, just the newline.
@@ -633,28 +653,187 @@ static void
 pnode_printmacroline(struct parse *p, struct pnode *pn)
 {
 
-	pnode_printmacrolinepart(p, pn);
+	assert(0 == p->newln);
+	pnode_printmacrolinetext(p, pn, 0);
 	putchar('\n');
+	p->newln = 1;
 }
 
 static void
+pnode_printmopen(struct parse *p)
+{
+	if (p->newln) {
+		putchar('.');
+		p->newln = 0;
+	} else
+		putchar(' ');
+}
+
+static void
+pnode_printmclose(struct parse *p, int sv)
+{
+
+	if (sv && ! p->newln) {
+		putchar('\n');
+		p->newln = 1;
+	}
+}
+
+/*
+ * Like pnode_printmclose() except we look to the next node, and, if
+ * found, see if it starts with punctuation.
+ * If it does, then we print that punctuation before the newline.
+ */
+static void
+pnode_printmclosepunct(struct parse *p, struct pnode *pn, int sv)
+{
+	/* We wouldn't have done anything anyway. */
+	if ( ! (sv && ! p->newln))
+		return;
+
+	/* No next node or it's not text. */
+	if (NULL == (pn = TAILQ_NEXT(pn, child))) {
+		pnode_printmclose(p, sv);
+		return;
+	} else if (NODE_TEXT != pn->node) {
+		pnode_printmclose(p, sv);
+		return;
+	}
+
+	/* Only do this for the comma/period. */
+	if (pn->bsz > 0 &&
+		(',' == pn->b[0] || '.' == pn->b[0]) &&
+		(1 == pn->bsz || isspace((unsigned char)pn->b[1]))) {
+		putchar(' ');
+		putchar(pn->b[0]);
+		pn->b++;
+		pn->bsz--;
+	}
+
+	putchar('\n');
+	p->newln = 1;
+}
+
+static void
+pnode_printpara(struct parse *p, struct pnode *pn)
+{
+	struct pnode	*pp;
+
+	assert(p->newln);
+	if ((pp = TAILQ_PREV(pn, pnodeq, child)) == NULL &&
+	    (pp = pn->parent) == NULL)
+		return;
+
+	switch (pp->node) {
+	case NODE_ENTRY:
+	case NODE_LISTITEM:
+		return;
+	case NODE_PREFACE:
+	case NODE_SECTION:
+		if (p->level < 3)
+			return;
+		break;
+	default:
+		break;
+	}
+	puts(".Pp");
+}
+
+/*
+ * If the SYNOPSIS macro has a superfluous title, kill it.
+ */
+static void
+pnode_printrefsynopsisdiv(struct parse *p, struct pnode *pn)
+{
+	struct pnode	*pp;
+
+	TAILQ_FOREACH(pp, &pn->childq, child)
+		if (NODE_TITLE == pp->node) {
+			pnode_unlink(pp);
+			return;
+		}
+}
+
+/*
+ * Start a hopefully-named section: `Sh', `Ss', or `Sy' by header level.
+ */
+static void
 pnode_printrefsect(struct parse *p, struct pnode *pn)
 {
 	struct pnode	*pp;
+	const char	*title;
+	int		 flags, level;
 
+	if (NULL == pn->parent)
+		return;
+
+	level = ++p->level;
+	flags = 1 == level ? MACROLINE_UPPER : 0;
+	if (3 > level) {
+		switch (pn->node) {
+		case NODE_CAUTION:
+		case NODE_NOTE:
+		case NODE_TIP:
+		case NODE_WARNING:
+			level = 3;
+			break;
+		default:
+			break;
+		}
+	}
+
 	TAILQ_FOREACH(pp, &pn->childq, child)
 		if (NODE_TITLE == pp->node)
 			break;
 
-	fputs(".Sh ", stdout);
+	if (NULL == pp) {
+		switch (pn->node) {
+		case NODE_PREFACE:
+			title = "Preface";
+			break;
+		case NODE_CAUTION:
+			title = "Caution";
+			break;
+		case NODE_NOTE:
+			title = "Note";
+			break;
+		case NODE_TIP:
+			title = "Tip";
+			break;
+		case NODE_WARNING:
+			title = "Warning";
+			break;
+		default:
+			title = "Unknown";
+			break;
+		}
+	}
 
+	switch (level) {
+	case 1:
+		fputs(".Sh", stdout);
+		break;
+	case 2:
+		fputs(".Ss", stdout);
+		break;
+	default:
+		pnode_printpara(p, pn);
+		fputs(".Sy", stdout);
+		break;
+	}
+
 	if (NULL != pp) {
-		pnode_printmacroline(p, pp);
+		p->newln = 0;
+		pnode_printmacrolinetext(p, pp, flags);
+		pnode_printmclose(p, 1);
 		pnode_unlink(pp);
 	} else
-		puts("UNKNOWN");
+		printf(" %s\n", title);
 }
 
+/*
+ * Start a reference, extracting the title and volume.
+ */
 static void
 pnode_printciterefentry(struct parse *p, struct pnode *pn)
 {
@@ -667,18 +846,16 @@ pnode_printciterefentry(struct parse *p, struct pnode 
 		else if (NODE_REFENTRYTITLE == pp->node)
 			title = pp;
 
-	fputs(".Xr ", stdout);
-
 	if (NULL != title) {
 		pnode_printmacrolinepart(p, title);
-		putchar(' ');
 	} else
-		fputs("unknown ", stdout);
+		fputs(" unknown ", stdout);
 
-	if (NULL != manvol)
-		pnode_printmacroline(p, manvol);
-	else
-		puts("1");
+	if (NULL == manvol) {
+		puts(" 1");
+		p->newln = 1;
+	} else
+		pnode_printmacrolinepart(p, manvol);
 }
 
 static void
@@ -687,27 +864,26 @@ pnode_printrefmeta(struct parse *p, struct pnode *pn)
 	struct pnode	*pp, *title, *manvol;
 
 	title = manvol = NULL;
+	assert(p->newln);
 	TAILQ_FOREACH(pp, &pn->childq, child)
 		if (NODE_MANVOLNUM == pp->node)
 			manvol = pp;
 		else if (NODE_REFENTRYTITLE == pp->node)
 			title = pp;
 
-	puts(".Dd $Mdocdate" "$");
-	fputs(".Dt ", stdout);
+	fputs(".Dt", stdout);
+	p->newln = 0;
 
-	if (NULL != title) {
-		pnode_printmacrolinepart(p, title);
-		putchar(' ');
-	} else
-		fputs("UNKNOWN ", stdout);
-
-	if (NULL != manvol)
-		pnode_printmacroline(p, manvol);
+	if (NULL != title)
+		pnode_printmacrolinetext(p, title, MACROLINE_UPPER);
 	else
-		puts("1");
+		fputs(" UNKNOWN ", stdout);
 
-	puts(".Os");
+	if (NULL == manvol) {
+		puts(" 1");
+		p->newln = 1;
+	} else
+		pnode_printmacroline(p, manvol);
 }
 
 static void
@@ -715,6 +891,7 @@ pnode_printfuncdef(struct parse *p, struct pnode *pn)
 {
 	struct pnode	*pp, *ftype, *func;
 
+	assert(p->newln);
 	ftype = func = NULL;
 	TAILQ_FOREACH(pp, &pn->childq, child)
 		if (NODE_TEXT == pp->node)
@@ -723,15 +900,19 @@ pnode_printfuncdef(struct parse *p, struct pnode *pn)
 			func = pp;
 
 	if (NULL != ftype) {
-		fputs(".Ft ", stdout);
+		fputs(".Ft", stdout);
+		p->newln = 0;
 		pnode_printmacroline(p, ftype);
 	}
 
 	if (NULL != func) {
-		fputs(".Fo ", stdout);
+		fputs(".Fo", stdout);
+		p->newln = 0;
 		pnode_printmacroline(p, func);
-	} else 
+	} else {
 		puts(".Fo UNKNOWN");
+		p->newln = 1;
+	}
 }
 
 static void
@@ -739,6 +920,7 @@ pnode_printparamdef(struct parse *p, struct pnode *pn)
 {
 	struct pnode	*pp, *ptype, *param;
 
+	assert(p->newln);
 	ptype = param = NULL;
 	TAILQ_FOREACH(pp, &pn->childq, child)
 		if (NODE_TEXT == pp->node)
@@ -747,26 +929,83 @@ pnode_printparamdef(struct parse *p, struct pnode *pn)
 			param = pp;
 
 	fputs(".Fa \"", stdout);
+	p->newln = 0;
 	if (NULL != ptype) {
-		pnode_printmacrolinepart(p, ptype);
+		pnode_printmacrolinetext(p, ptype, MACROLINE_NOWS);
 		putchar(' ');
 	}
 
 	if (NULL != param)
 		pnode_printmacrolinepart(p, param);
-	else
-		fputs("UNKNOWN", stdout);
 
 	puts("\"");
+	p->newln = 1;
 }
 
+/*
+ * The <mml:mfenced> node is a little peculiar.
+ * First, it can have arbitrary open and closing tokens, which default
+ * to parentheses.
+ * Second, >1 arguments are separated by commas.
+ */
 static void
+pnode_printmathfenced(struct parse *p, struct pnode *pn)
+{
+	struct pnode	*pp;
+
+	printf("left %s ", pnode_getattr_raw(pn, ATTRKEY_OPEN, "("));
+
+	pp = TAILQ_FIRST(&pn->childq);
+	pnode_print(p, pp);
+
+	while (NULL != (pp = TAILQ_NEXT(pp, child))) {
+		putchar(',');
+		pnode_print(p, pp);
+	}
+
+	printf("right %s ", pnode_getattr_raw(pn, ATTRKEY_CLOSE, ")"));
+}
+
+/*
+ * These math nodes require special handling because they have infix
+ * syntax, instead of the usual prefix or postfix.
+ * So we need to break up the first and second child node with a
+ * particular eqn(7) word.
+ */
+static void
+pnode_printmath(struct parse *p, struct pnode *pn)
+{
+	struct pnode	*pp;
+
+	pp = TAILQ_FIRST(&pn->childq);
+	pnode_print(p, pp);
+
+	switch (pn->node) {
+	case NODE_MML_MSUP:
+		fputs(" sup ", stdout);
+		break;
+	case NODE_MML_MFRAC:
+		fputs(" over ", stdout);
+		break;
+	case NODE_MML_MSUB:
+		fputs(" sub ", stdout);
+		break;
+	default:
+		break;
+	}
+
+	pp = TAILQ_NEXT(pp, child);
+	pnode_print(p, pp);
+}
+
+static void
 pnode_printfuncprototype(struct parse *p, struct pnode *pn)
 {
 	struct pnode	*pp, *fdef;
 
+	assert(p->newln);
 	TAILQ_FOREACH(fdef, &pn->childq, child)
-		if (NODE_FUNCDEF == fdef->node) 
+		if (NODE_FUNCDEF == fdef->node)
 			break;
 
 	if (NULL != fdef)
@@ -774,138 +1013,534 @@ pnode_printfuncprototype(struct parse *p, struct pnode
 	else
 		puts(".Fo UNKNOWN");
 
-	TAILQ_FOREACH(pp, &pn->childq, child) 
+	TAILQ_FOREACH(pp, &pn->childq, child)
 		if (NODE_PARAMDEF == pp->node)
 			pnode_printparamdef(p, pp);
 
 	puts(".Fc");
+	p->newln = 1;
 }
 
-/* TODO: handle "optional" values. */
+/*
+ * The <arg> element is more complicated than it should be because text
+ * nodes are treated like ".Ar foo", but non-text nodes need to be
+ * re-sent into the printer (i.e., without the preceding ".Ar").
+ * This also handles the case of "repetition" (or in other words, the
+ * ellipsis following an argument) and optionality.
+ */
 static void
-pnode_printarg(struct parse *p, struct pnode *pn, int nested)
+pnode_printarg(struct parse *p, struct pnode *pn)
 {
 	struct pnode	*pp;
-	int		 sv = nested;
+	struct pattr	*ap;
+	int		 isop, isrep;
 
-	if ( ! nested) 
-		fputs(".", stdout);
-	nested = 1;
+	isop = 1;
+	isrep = 0;
+	TAILQ_FOREACH(ap, &pn->attrq, child)
+		if (ATTRKEY_CHOICE == ap->key &&
+			(ATTRVAL_PLAIN == ap->val ||
+			 ATTRVAL_REQ == ap->val))
+			isop = 0;
+		else if (ATTRKEY_REP == ap->key &&
+			(ATTRVAL_REPEAT == ap->val))
+			isrep = 1;
+
+	if (isop) {
+		pnode_printmopen(p);
+		fputs("Op", stdout);
+	}
+
+	TAILQ_FOREACH(pp, &pn->childq, child) {
+		if (NODE_TEXT == pp->node) {
+			pnode_printmopen(p);
+			fputs("Ar", stdout);
+		}
+		pnode_print(p, pp);
+		if (NODE_TEXT == pp->node && isrep)
+			fputs("...", stdout);
+	}
+}
+
+static void
+pnode_printgroup(struct parse *p, struct pnode *pn)
+{
+	struct pnode	*pp, *np;
+	struct pattr	*ap;
+	int		 isop, sv;
+
+	isop = 1;
+	TAILQ_FOREACH(ap, &pn->attrq, child)
+		if (ATTRKEY_CHOICE == ap->key &&
+			(ATTRVAL_PLAIN == ap->val ||
+			 ATTRVAL_REQ == ap->val)) {
+			isop = 0;
+			break;
+		}
+
+	/*
+	 * Make sure we're on a macro line.
+	 * This will prevent pnode_print() from putting us on a
+	 * subsequent line.
+	 */
+	sv = p->newln;
+	pnode_printmopen(p);
+	if (isop)
+		fputs("Op", stdout);
+	else if (sv)
+		fputs("No", stdout);
+
+	/*
+	 * Keep on printing text separated by the vertical bar as long
+	 * as we're within the same origin node as the group.
+	 * This is kind of a nightmare.
+	 * Eh, DocBook...
+	 * FIXME: if there's a "Fl", we don't cut off the leading "-"
+	 * like we do in pnode_print().
+	 */
+	TAILQ_FOREACH(pp, &pn->childq, child) {
+		pnode_print(p, pp);
+		np = TAILQ_NEXT(pp, child);
+		while (NULL != np) {
+			if (pp->node != np->node)
+				break;
+			fputs(" |", stdout);
+			pnode_printmacrolinepart(p, np);
+			pp = np;
+			np = TAILQ_NEXT(np, child);
+		}
+	}
+
+	pnode_printmclose(p, sv);
+}
+
+static void
+pnode_printprologue(struct parse *p, struct pnode *pn)
+{
+	struct pnode	*pp;
+
+	pp = NULL == p->root ? NULL :
+		pnode_findfirst(p->root, NODE_REFMETA);
+
+	puts(".Dd $Mdocdate" "$");
+	if (NULL != pp) {
+		pnode_printrefmeta(p, pp);
+		pnode_unlink(pp);
+	} else
+		printf(".Dt %s 1\n",
+		    pnode_getattr_raw(p->root, ATTRKEY_ID, "UNKNOWN"));
+	puts(".Os");
+
+	if (PARSE_EQN & p->flags) {
+		puts(".EQ");
+		puts("delim $$");
+		puts(".EN");
+	}
+}
+
+/*
+ * Print the leading <term> children of a <varlistentry> as one ".It"
+ * line, comma-separated.  Each term is unlinked once printed, so the
+ * loop re-reads the list head instead of following a stale link.
+ */
+static void
+pnode_printvarlistentry(struct parse *p, struct pnode *pn)
+{
+	struct pnode	*pp;
+	int		 first = 1;
+
+	assert(p->newln);
+	fputs(".It", stdout);
+	p->newln = 0;
+
-	TAILQ_FOREACH(pp, &pn->childq, child)
-		if (NODE_OPTION == pp->node) {
-			fputs("Fl ", stdout);
-			pnode_printmacrolinepart(p, pp);
-		} else if (NODE_TEXT == pp->node) {
-			fputs("Ar ", stdout);
-			pnode_printmacrolinepart(p, pp);
-		} else if (NODE_ARG == pp->node)
-			pnode_printarg(p, pp, nested);
+	while (NULL != (pp = TAILQ_FIRST(&pn->childq)))
+		if (NODE_TERM == pp->node) {
+			if ( ! first)
+				putchar(',');
+			pnode_print(p, pp);
+			pnode_unlink(pp);
+			first = 0;
+		} else
+			break;
 
-	if ( ! sv)
-		puts("");
+	putchar('\n');
+	p->newln = 1;
 }
 
+static void
+pnode_printrow(struct parse *p, struct pnode *pn)
+{
+	struct pnode	*pp;
+
+	puts(".Bl -dash -compact");
+
+	TAILQ_FOREACH(pp, &pn->childq, child) {
+		assert(p->newln);
+		puts(".It");
+		pnode_print(p, pp);
+		pnode_printmclose(p, 1);
+	}
+	assert(p->newln);
+	puts(".El");
+}
+
+static void
+pnode_printtable(struct parse *p, struct pnode *pn)
+{
+	struct pnode	*pp;
+
+	assert(p->newln);
+	TAILQ_FOREACH(pp, &pn->childq, child)
+		if (NODE_TITLE == pp->node) {
+			pnode_printpara(p, pp);
+			pnode_print(p, pp);
+			pnode_unlink(pp);
+		}
+	assert(p->newln);
+	puts(".Bl -ohang");
+	while (NULL != (pp = pnode_findfirst(pn, NODE_ROW))) {
+		puts(".It Table Row");
+		pnode_printrow(p, pp);
+		pnode_printmclose(p, 1);
+		pnode_unlink(pp);
+	}
+	assert(p->newln);
+	puts(".El");
+}
+
+static void
+pnode_printlist(struct parse *p, struct pnode *pn)
+{
+	struct pnode	*pp;
+
+	assert(p->newln);
+	TAILQ_FOREACH(pp, &pn->childq, child)
+		if (NODE_TITLE == pp->node) {
+			pnode_printpara(p, pp);
+			pnode_print(p, pp);
+			pnode_unlink(pp);
+		}
+	assert(p->newln);
+
+	if (NODE_ORDEREDLIST == pn->node)
+		puts(".Bl -enum");
+	else
+		puts(".Bl -bullet");
+
+	TAILQ_FOREACH(pp, &pn->childq, child) {
+		assert(p->newln);
+		puts(".It");
+		pnode_print(p, pp);
+		pnode_printmclose(p, 1);
+	}
+	assert(p->newln);
+	puts(".El");
+}
+
+static void
+pnode_printvariablelist(struct parse *p, struct pnode *pn)
+{
+	struct pnode	*pp;
+
+	assert(p->newln);
+	TAILQ_FOREACH(pp, &pn->childq, child)
+		if (NODE_TITLE == pp->node) {
+			pnode_printpara(p, pp);
+			pnode_print(p, pp);
+			pnode_unlink(pp);
+		}
+
+	assert(p->newln);
+	puts(".Bl -tag -width Ds");
+	TAILQ_FOREACH(pp, &pn->childq, child)
+		if (NODE_VARLISTENTRY != pp->node) {
+			assert(p->newln);
+			fputs(".It", stdout);
+			pnode_printmacroline(p, pp);
+		} else {
+			assert(p->newln);
+			pnode_print(p, pp);
+		}
+	assert(p->newln);
+	puts(".El");
+}
+
 /*
  * Print a parsed node (or ignore it--whatever).
  * This is a recursive function.
- * FIXME: macro line continuation?
+ * FIXME: if we're in a literal context (<screen> or <programlisting> or
+ * whatever), don't print inline macros.
  */
 static void
 pnode_print(struct parse *p, struct pnode *pn)
 {
 	struct pnode	*pp;
+	const char	*ccp;
 	char		*cp;
-	int		 last;
+	int		 last, sv;
 
 	if (NULL == pn)
 		return;
 
-	if (NODE_TEXT != pn->node && NODE_ROOT != pn->node)
-		printf(".\\\" %s\n", nodes[pn->node].name);
+	sv = p->newln;
 
 	switch (pn->node) {
-	case (NODE_ARG):
-		pnode_printarg(p, pn, 0);
+	case NODE_APPLICATION:
+		pnode_printmopen(p);
+		fputs("Nm", stdout);
+		break;
+	case NODE_ANCHOR:
+		/* Don't print anything! */
+		return;
+	case NODE_ARG:
+		pnode_printarg(p, pn);
 		pnode_unlinksub(pn);
 		break;
-	case (NODE_CITEREFENTRY):
+	case NODE_AUTHOR:
+		pnode_printmopen(p);
+		fputs("An", stdout);
+		break;
+	case NODE_AUTHORGROUP:
+		assert(p->newln);
+		puts(".An -split");
+		break;
+	case NODE_BOOKINFO:
+		assert(p->newln);
+		puts(".Sh NAME");
+		break;
+	case NODE_CITEREFENTRY:
+		pnode_printmopen(p);
+		fputs("Xr", stdout);
 		pnode_printciterefentry(p, pn);
 		pnode_unlinksub(pn);
 		break;
-	case (NODE_CODE):
-		fputs(".Li ", stdout);
-		pnode_printmacroline(p, pn);
+	case NODE_CODE:
+		pnode_printmopen(p);
+		fputs("Li", stdout);
+		break;
+	case NODE_COMMAND:
+		pnode_printmopen(p);
+		fputs("Nm", stdout);
+		break;
+	case NODE_CONSTANT:
+		pnode_printmopen(p);
+		fputs("Dv", stdout);
+		break;
+	case NODE_EDITOR:
+		puts("editor: ");
+		pnode_printmopen(p);
+		fputs("An", stdout);
+		break;
+	case NODE_EMPHASIS:
+	case NODE_FIRSTTERM:
+		pnode_printmopen(p);
+		fputs("Em", stdout);
+		break;
+	case NODE_ENVAR:
+		pnode_printmopen(p);
+		fputs("Ev", stdout);
+		break;
+	case NODE_FILENAME:
+		pnode_printmopen(p);
+		fputs("Pa", stdout);
+		break;
+	case NODE_FUNCTION:
+		pnode_printmopen(p);
+		fputs("Fn", stdout);
+		break;
+	case NODE_FUNCPROTOTYPE:
+		assert(p->newln);
+		pnode_printfuncprototype(p, pn);
 		pnode_unlinksub(pn);
 		break;
-	case (NODE_COMMAND):
-		fputs(".Nm ", stdout);
-		pnode_printmacroline(p, pn);
+	case NODE_FUNCSYNOPSISINFO:
+		pnode_printmopen(p);
+		fputs("Fd", stdout);
+		break;
+	case NODE_INDEXTERM:
+		return;
+	case NODE_INFORMALEQUATION:
+		if ( ! p->newln)
+			putchar('\n');
+		puts(".EQ");
+		p->newln = 0;
+		break;
+	case NODE_INLINEEQUATION:
+		fputc('$', stdout);
+		p->newln = 0;
+		break;
+	case NODE_ITEMIZEDLIST:
+		assert(p->newln);
+		pnode_printlist(p, pn);
 		pnode_unlinksub(pn);
 		break;
-	case (NODE_FUNCTION):
-		fputs(".Fn ", stdout);
-		pnode_printmacroline(p, pn);
+	case NODE_GROUP:
+		pnode_printgroup(p, pn);
 		pnode_unlinksub(pn);
 		break;
-	case (NODE_FUNCPROTOTYPE):
-		pnode_printfuncprototype(p, pn);
+	case NODE_LEGALNOTICE:
+		assert(p->newln);
+		puts(".Sh LEGAL NOTICE");
+		break;
+	case NODE_LINK:
+		ccp = pnode_getattr_raw(pn, ATTRKEY_LINKEND, NULL);
+		if (NULL == ccp)
+			break;
+		pnode_printmopen(p);
+		printf("Sx %s\n", ccp);
+		p->newln = 1;
+		return;
+	case NODE_LITERAL:
+		pnode_printmopen(p);
+		fputs("Li", stdout);
+		break;
+	case NODE_LITERALLAYOUT:
+		assert(p->newln);
+		puts(".Bd -literal");
+		break;
+	case NODE_MML_MFENCED:
+		pnode_printmathfenced(p, pn);
 		pnode_unlinksub(pn);
 		break;
-	case (NODE_FUNCSYNOPSISINFO):
-		fputs(".Fd ", stdout);
-		pnode_printmacroline(p, pn);
+	case NODE_MML_MROW:
+	case NODE_MML_MI:
+	case NODE_MML_MN:
+	case NODE_MML_MO:
+		if (TAILQ_EMPTY(&pn->childq))
+			break;
+		fputs(" { ", stdout);
+		break;
+	case NODE_MML_MFRAC:
+	case NODE_MML_MSUB:
+	case NODE_MML_MSUP:
+		pnode_printmath(p, pn);
 		pnode_unlinksub(pn);
 		break;
-	case (NODE_PARA):
-		/* FIXME: not always. */
-		puts(".Pp");
+	case NODE_OPTION:
+		pnode_printmopen(p);
+		fputs("Fl", stdout);
 		break;
-	case (NODE_PARAMETER):
-		fputs(".Fa \"", stdout);
-		pnode_printmacrolinepart(p, pn);
-		puts("\"");
+	case NODE_ORDEREDLIST:
+		assert(p->newln);
+		pnode_printlist(p, pn);
 		pnode_unlinksub(pn);
 		break;
-	case (NODE_PROGRAMLISTING):
-		puts(".Bd -literal");
+	case NODE_PARA:
+		pnode_printpara(p, pn);
 		break;
-	case (NODE_REFMETA):
-		pnode_printrefmeta(p, pn);
+	case NODE_PARAMETER:
+		/* Suppress non-text children... */
+		pnode_printmopen(p);
+		fputs("Fa \"", stdout);
+		pnode_printmacrolinetext(p, pn, MACROLINE_NOWS);
+		fputs("\"", stdout);
 		pnode_unlinksub(pn);
 		break;
-	case (NODE_REFNAME):
-		fputs(".Nm ", stdout);
-		pnode_printmacroline(p, pn);
+	case NODE_QUOTE:
+		pnode_printmopen(p);
+		fputs("Qo", stdout);
+		break;
+	case NODE_PROGRAMLISTING:
+	case NODE_SCREEN:
+		assert(p->newln);
+		printf(".Bd %s\n", ATTRVAL_MONOSPACED ==
+		    pnode_getattr(pn, ATTRKEY_CLASS) ?
+		    "-literal" : "-unfilled");
+		break;
+	case NODE_REFENTRYINFO:
+		/* Suppress. */
 		pnode_unlinksub(pn);
-		return;
-	case (NODE_REFNAMEDIV):
-		puts(".Sh NAME");
 		break;
-	case (NODE_REFPURPOSE):
-		fputs(".Nd ", stdout);
-		pnode_printmacroline(p, pn);
+	case NODE_REFMETA:
+		abort();
+		break;
+	case NODE_REFNAME:
+		/* Suppress non-text children... */
+		pnode_printmopen(p);
+		fputs("Nm", stdout);
+		p->newln = 0;
+		pnode_printmacrolinepart(p, pn);
 		pnode_unlinksub(pn);
-		return;
-	case (NODE_REFSYNOPSISDIV):
+		break;
+	case NODE_REFNAMEDIV:
+		assert(p->newln);
+		puts(".Sh NAME");
+		break;
+	case NODE_REFPURPOSE:
+		assert(p->newln);
+		pnode_printmopen(p);
+		fputs("Nd", stdout);
+		break;
+	case NODE_REFSYNOPSISDIV:
+		assert(p->newln);
+		pnode_printrefsynopsisdiv(p, pn);
 		puts(".Sh SYNOPSIS");
 		break;
-	case (NODE_REFSECT1):
+	case NODE_PREFACE:
+	case NODE_SECTION:
+	case NODE_NOTE:
+	case NODE_TIP:
+	case NODE_CAUTION:
+	case NODE_WARNING:
+		assert(p->newln);
 		pnode_printrefsect(p, pn);
 		break;
-	case (NODE_TEXT):
+	case NODE_REPLACEABLE:
+		pnode_printmopen(p);
+		fputs("Ar", stdout);
+		break;
+	case NODE_SBR:
+		assert(p->newln);
+		puts(".br");
+		break;
+	case NODE_SGMLTAG:
+		pnode_printmopen(p);
+		fputs("Li", stdout);
+		break;
+	case NODE_STRUCTNAME:
+		pnode_printmopen(p);
+		fputs("Vt", stdout);
+		break;
+	case NODE_TABLE:
+	case NODE_INFORMALTABLE:
+		assert(p->newln);
+		pnode_printtable(p, pn);
+		pnode_unlinksub(pn);
+		break;
+	case NODE_TEXT:
+		if (0 == p->newln)
+			putchar(' ');
+
 		bufclear(p);
 		bufappend(p, pn);
+
+		if (0 == p->bsz) {
+			assert(pn->real != pn->b);
+			break;
+		}
+
 		/*
 		 * Output all characters, squeezing out whitespace
-		 * between newlines. 
+		 * between newlines.
 		 * XXX: all whitespace, including tabs (?).
 		 * Remember to escape control characters and escapes.
 		 */
-		for (last = '\n', cp = p->b; '\0' != *cp; ) {
+		assert(p->bsz);
+		cp = p->b;
+
+		/*
+		 * There's often a superfluous "-" in its <option> tags
+		 * before the actual flags themselves.
+		 * "Fl" does this for us, so remove it.
+		 */
+		if (NULL != pn->parent &&
+			NODE_OPTION == pn->parent->node &&
+			'-' == *cp)
+			cp++;
+		for (last = '\n'; '\0' != *cp; ) {
 			if ('\n' == last) {
 				/* Consume all whitespace. */
-				if (isspace((int)*cp)) {
-					while (isspace((int)*cp))
+				if (isspace((unsigned char)*cp)) {
+					while (isspace((unsigned char)*cp))
 						cp++;
 					continue;
 				} else if ('\'' == *cp || '.' == *cp)
@@ -916,9 +1551,35 @@ pnode_print(struct parse *p, struct pnode *pn)
 			if ('\\' == last)
 				putchar('e');
 		}
-		if ('\n' != last)
-			putchar('\n');
+		p->newln = 0;
 		break;
+	case NODE_TITLE:
+		if (pn->parent->node == NODE_BOOKINFO) {
+			pnode_printmopen(p);
+			fputs("Nd", stdout);
+		}
+		break;
+	case NODE_TYPE:
+		pnode_printmopen(p);
+		fputs("Vt", stdout);
+		break;
+	case NODE_USERINPUT:
+		pnode_printmopen(p);
+		fputs("Li", stdout);
+		break;
+	case NODE_VARIABLELIST:
+		assert(p->newln);
+		pnode_printvariablelist(p, pn);
+		pnode_unlinksub(pn);
+		break;
+	case NODE_VARLISTENTRY:
+		assert(p->newln);
+		pnode_printvarlistentry(p, pn);
+		break;
+	case NODE_VARNAME:
+		pnode_printmopen(p);
+		fputs("Va", stdout);
+		break;
 	default:
 		break;
 	}
@@ -927,9 +1588,92 @@ pnode_print(struct parse *p, struct pnode *pn)
 		pnode_print(p, pp);
 
 	switch (pn->node) {
-	case (NODE_PROGRAMLISTING):
+	case NODE_INFORMALEQUATION:
+		if ( ! p->newln)
+			putchar('\n');
+		puts(".EN");
+		p->newln = 1;
+		break;
+	case NODE_INLINEEQUATION:
+		fputs("$ ", stdout);
+		p->newln = sv;
+		break;
+	case NODE_MML_MROW:
+	case NODE_MML_MI:
+	case NODE_MML_MN:
+	case NODE_MML_MO:
+		if (TAILQ_EMPTY(&pn->childq))
+			break;
+		fputs(" } ", stdout);
+		break;
+	case NODE_APPLICATION:
+	case NODE_ARG:
+	case NODE_AUTHOR:
+	case NODE_CITEREFENTRY:
+	case NODE_CODE:
+	case NODE_COMMAND:
+	case NODE_CONSTANT:
+	case NODE_EDITOR:
+	case NODE_EMPHASIS:
+	case NODE_ENVAR:
+	case NODE_FILENAME:
+	case NODE_FIRSTTERM:
+	case NODE_FUNCTION:
+	case NODE_FUNCSYNOPSISINFO:
+	case NODE_LITERAL:
+	case NODE_OPTION:
+	case NODE_PARAMETER:
+	case NODE_REPLACEABLE:
+	case NODE_REFPURPOSE:
+	case NODE_SGMLTAG:
+	case NODE_STRUCTNAME:
+	case NODE_TEXT:
+	case NODE_TYPE:
+	case NODE_USERINPUT:
+	case NODE_VARNAME:
+		pnode_printmclosepunct(p, pn, sv);
+		break;
+	case NODE_QUOTE:
+		pnode_printmclose(p, sv);
+		sv = p->newln;
+		pnode_printmopen(p);
+		fputs("Qc", stdout);
+		pnode_printmclose(p, sv);
+		break;
+	case NODE_REFNAME:
+		/*
+		 * If we're in the NAME macro and we have multiple
+		 * <refname> macros in sequence, then print out a
+		 * trailing comma before the newline.
+		 */
+		if (NULL != pn->parent &&
+			NODE_REFNAMEDIV == pn->parent->node &&
+			NULL != TAILQ_NEXT(pn, child) &&
+			NODE_REFNAME == TAILQ_NEXT(pn, child)->node)
+			fputs(" ,", stdout);
+		pnode_printmclose(p, sv);
+		break;
+	case NODE_PREFACE:
+	case NODE_SECTION:
+	case NODE_NOTE:
+	case NODE_TIP:
+	case NODE_CAUTION:
+	case NODE_WARNING:
+		p->level--;
+		break;
+	case NODE_LITERALLAYOUT:
+	case NODE_PROGRAMLISTING:
+	case NODE_SCREEN:
+		assert(p->newln);
 		puts(".Ed");
+		p->newln = 1;
 		break;
+	case NODE_TITLE:
+		if (pn->parent->node == NODE_BOOKINFO) {
+			pnode_printmclose(p, 1);
+			puts(".Sh AUTHORS");
+		}
+		break;
 	default:
 		break;
 	}
@@ -940,7 +1684,7 @@ pnode_print(struct parse *p, struct pnode *pn)
  * Invoke the parser context with each buffer fill.
  */
 static int
-readfile(XML_Parser xp, int fd, 
+readfile(XML_Parser xp, int fd,
 	char *b, size_t bsz, const char *fn)
 {
 	struct parse	 p;
@@ -950,6 +1694,8 @@ readfile(XML_Parser xp, int fd, 
 	memset(&p, 0, sizeof(struct parse));
 
 	p.b = malloc(p.bsz = p.mbsz = 1024);
+	p.fname = fn;
+	p.xml = xp;
 
 	XML_SetCharacterDataHandler(xp, xml_char);
 	XML_SetElementHandler(xp, xml_elem_start, xml_elem_end);
@@ -957,15 +1703,19 @@ readfile(XML_Parser xp, int fd, 
 
 	while ((ssz = read(fd, b, bsz)) >= 0) {
 		if (0 == (rc = XML_Parse(xp, b, ssz, 0 == ssz)))
-			fprintf(stderr, "%s: %s\n", fn,
+			fprintf(stderr, "%s:%zu:%zu: %s\n", fn,
+				XML_GetCurrentLineNumber(xp),
+				XML_GetCurrentColumnNumber(xp),
 				XML_ErrorString
 				(XML_GetErrorCode(xp)));
 		else if ( ! p.stop && ssz > 0)
 			continue;
-		/* 
+		/*
 		 * Exit when we've read all or errors have occured
 		 * during the parse sequence.
 		 */
+		p.newln = 1;
+		pnode_printprologue(&p, p.root);
 		pnode_print(&p, p.root);
 		pnode_free(p.root);
 		free(p.b);
@@ -985,26 +1735,40 @@ main(int argc, char *argv[])
 	XML_Parser	 xp;
 	const char	*fname;
 	char		*buf;
-	int		 fd, rc;
+	int		 fd, rc, ch;
+	const char	*progname;
 
+	progname = strrchr(argv[0], '/');
+	if (progname == NULL)
+		progname = argv[0];
+	else
+		++progname;
+
 	fname = "-";
 	xp = NULL;
 	buf = NULL;
 	rc = 0;
 
-	if (-1 != getopt(argc, argv, ""))
-		return(EXIT_FAILURE);
+	while (-1 != (ch = getopt(argc, argv, "W")))
+		switch (ch) {
+		case 'W':
+			warn = 1;
+			break;
+		default:
+			goto usage;
+		}
 
 	argc -= optind;
 	argv += optind;
 
-	if (argc > 1)
-		return(EXIT_FAILURE);
-	else if (argc > 0)
+	if (argc > 1) {
+		fprintf(stderr, "%s: Too many arguments\n", argv[1]);
+		goto usage;
+	} else if (argc > 0)
 		fname = argv[0];
 
 	/* Read from stdin or a file. */
-	fd = 0 == strcmp(fname, "-") ? 
+	fd = 0 == strcmp(fname, "-") ?
 		STDIN_FILENO : open(fname, O_RDONLY, 0);
 
 	/*
@@ -1027,4 +1791,8 @@ main(int argc, char *argv[])
 	if (STDIN_FILENO != fd)
 		close(fd);
 	return(rc ? EXIT_SUCCESS : EXIT_FAILURE);
+
+usage:
+	fprintf(stderr, "usage: %s [-W] [input_filename]\n", progname);
+	return(EXIT_FAILURE);
 }