version 1.29, 2009/09/16 09:41:24 |
version 1.140, 2011/05/17 10:48:06 |
|
|
/* $Id$ */ |
/* $Id$ */ |
/* |
/* |
* Copyright (c) 2008, 2009 Kristaps Dzonsons <kristaps@kth.se> |
* Copyright (c) 2008, 2009, 2010, 2011 Kristaps Dzonsons <kristaps@bsd.lv> |
|
* Copyright (c) 2011 Ingo Schwarze <schwarze@openbsd.org> |
* |
* |
* Permission to use, copy, modify, and distribute this software for any |
* Permission to use, copy, modify, and distribute this software for any |
* purpose with or without fee is hereby granted, provided that the above |
* purpose with or without fee is hereby granted, provided that the above |
|
|
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF |
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF |
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
*/ |
*/ |
|
#ifdef HAVE_CONFIG_H |
|
#include "config.h" |
|
#endif |
|
|
|
#include <sys/types.h> |
|
|
#include <assert.h> |
#include <assert.h> |
#include <err.h> |
#include <ctype.h> |
|
#include <stdarg.h> |
#include <stdio.h> |
#include <stdio.h> |
|
#include <stdint.h> |
#include <stdlib.h> |
#include <stdlib.h> |
|
#include <string.h> |
|
#include <unistd.h> |
|
|
#include "mdoc.h" |
#include "mandoc.h" |
#include "man.h" |
#include "libmandoc.h" |
|
#include "out.h" |
|
#include "html.h" |
|
#include "main.h" |
|
|
#define DOCTYPE "-//W3C//DTD HTML 4.01//EN" |
|
#define DTD "http://www.w3.org/TR/html4/strict.dtd" |
|
|
|
/*
 * Identifiers for the HTML elements this back-end can emit.
 * The values are consecutive from zero and are used to dimension the
 * htmltags[] table; TAG_MAX is the element count, not an element.
 */
enum	htmltag {
	TAG_HTML = 0,	/* <html> */
	TAG_HEAD,	/* <head> */
	TAG_BODY,	/* <body> */
	TAG_META,	/* <meta> */
	TAG_TITLE,	/* <title> */
	TAG_DIV,	/* <div> */
	TAG_H1,		/* <h1> */
	TAG_H2,		/* <h2> */
	TAG_P,		/* <p> */
	TAG_SPAN,	/* <span> */
	TAG_LINK,	/* <link> */
	TAG_MAX		/* number of tags above */
};
|
|
|
/*
 * Identifiers for the HTML attributes this back-end can emit.
 * The values are consecutive from zero and are used to dimension the
 * htmlattrs[] name table; ATTR_MAX is the attribute count.
 */
enum	htmlattr {
	ATTR_HTTPEQUIV = 0,	/* http-equiv */
	ATTR_CONTENT,		/* content */
	ATTR_NAME,		/* name */
	ATTR_REL,		/* rel */
	ATTR_HREF,		/* href */
	ATTR_TYPE,		/* type */
	ATTR_MEDIA,		/* media */
	ATTR_CLASS,		/* class */
	ATTR_MAX		/* number of attributes above */
};
|
|
|
struct htmldata { |
struct htmldata { |
char *name; |
const char *name; |
int flags; |
int flags; |
#define HTML_BLOCK (1 << 0) |
#define HTML_CLRLINE (1 << 0) |
|
#define HTML_NOSTACK (1 << 1) |
|
#define HTML_AUTOCLOSE (1 << 2) /* Tag has auto-closure. */ |
}; |
}; |
|
|
static const struct htmldata htmltags[TAG_MAX] = { |
static const struct htmldata htmltags[TAG_MAX] = { |
{"html", HTML_BLOCK}, /* TAG_HTML */ |
{"html", HTML_CLRLINE}, /* TAG_HTML */ |
{"head", HTML_BLOCK}, /* TAG_HEAD */ |
{"head", HTML_CLRLINE}, /* TAG_HEAD */ |
{"body", HTML_BLOCK}, /* TAG_BODY */ |
{"body", HTML_CLRLINE}, /* TAG_BODY */ |
{"meta", HTML_BLOCK}, /* TAG_META */ |
{"meta", HTML_CLRLINE | HTML_NOSTACK | HTML_AUTOCLOSE}, /* TAG_META */ |
{"title", HTML_BLOCK}, /* TAG_TITLE */ |
{"title", HTML_CLRLINE}, /* TAG_TITLE */ |
{"div", HTML_BLOCK}, /* TAG_DIV */ |
{"div", HTML_CLRLINE}, /* TAG_DIV */ |
{"h1", 0}, /* TAG_H1 */ |
{"h1", 0}, /* TAG_H1 */ |
{"h2", 0}, /* TAG_H2 */ |
{"h2", 0}, /* TAG_H2 */ |
{"p", HTML_BLOCK}, /* TAG_P */ |
|
{"span", 0}, /* TAG_SPAN */ |
{"span", 0}, /* TAG_SPAN */ |
{"link", HTML_BLOCK}, /* TAG_LINK */ |
{"link", HTML_CLRLINE | HTML_NOSTACK | HTML_AUTOCLOSE}, /* TAG_LINK */ |
|
{"br", HTML_CLRLINE | HTML_NOSTACK | HTML_AUTOCLOSE}, /* TAG_BR */ |
|
{"a", 0}, /* TAG_A */ |
|
{"table", HTML_CLRLINE}, /* TAG_TABLE */ |
|
{"tbody", HTML_CLRLINE}, /* TAG_TBODY */ |
|
{"col", HTML_CLRLINE | HTML_NOSTACK | HTML_AUTOCLOSE}, /* TAG_COL */ |
|
{"tr", HTML_CLRLINE}, /* TAG_TR */ |
|
{"td", HTML_CLRLINE}, /* TAG_TD */ |
|
{"li", HTML_CLRLINE}, /* TAG_LI */ |
|
{"ul", HTML_CLRLINE}, /* TAG_UL */ |
|
{"ol", HTML_CLRLINE}, /* TAG_OL */ |
|
{"dl", HTML_CLRLINE}, /* TAG_DL */ |
|
{"dt", HTML_CLRLINE}, /* TAG_DT */ |
|
{"dd", HTML_CLRLINE}, /* TAG_DD */ |
|
{"blockquote", HTML_CLRLINE}, /* TAG_BLOCKQUOTE */ |
|
{"p", HTML_CLRLINE | HTML_NOSTACK | HTML_AUTOCLOSE}, /* TAG_P */ |
|
{"pre", HTML_CLRLINE }, /* TAG_PRE */ |
|
{"b", 0 }, /* TAG_B */ |
|
{"i", 0 }, /* TAG_I */ |
|
{"code", 0 }, /* TAG_CODE */ |
|
{"small", 0 }, /* TAG_SMALL */ |
}; |
}; |
|
|
static const char *const htmlattrs[ATTR_MAX] = { |
static const char *const htmlattrs[ATTR_MAX] = { |
"http-equiv", |
"http-equiv", /* ATTR_HTTPEQUIV */ |
"content", |
"content", /* ATTR_CONTENT */ |
"name", |
"name", /* ATTR_NAME */ |
"rel", |
"rel", /* ATTR_REL */ |
"href", |
"href", /* ATTR_HREF */ |
"type", |
"type", /* ATTR_TYPE */ |
"media", |
"media", /* ATTR_MEDIA */ |
"class" |
"class", /* ATTR_CLASS */ |
|
"style", /* ATTR_STYLE */ |
|
"width", /* ATTR_WIDTH */ |
|
"id", /* ATTR_ID */ |
|
"summary", /* ATTR_SUMMARY */ |
|
"align", /* ATTR_ALIGN */ |
|
"colspan", /* ATTR_COLSPAN */ |
}; |
}; |
|
|
struct htmlpair { |
static const char *const roffscales[SCALE_MAX] = { |
enum htmlattr key; |
"cm", /* SCALE_CM */ |
char *val; |
"in", /* SCALE_IN */ |
|
"pc", /* SCALE_PC */ |
|
"pt", /* SCALE_PT */ |
|
"em", /* SCALE_EM */ |
|
"em", /* SCALE_MM */ |
|
"ex", /* SCALE_EN */ |
|
"ex", /* SCALE_BU */ |
|
"em", /* SCALE_VS */ |
|
"ex", /* SCALE_FS */ |
}; |
}; |
|
|
struct html { |
static void print_num(struct html *, const char *, size_t); |
int flags; |
static void print_spec(struct html *, const char *, size_t); |
#define HTML_NOSPACE (1 << 0) |
static void print_res(struct html *, const char *, size_t); |
}; |
|
|
|
/*
 * Parameter lists shared by the mdoc and man output handlers: the
 * document meta-data, the node being processed, and the HTML output
 * state.  The continuation lines must be contiguous: a backslash
 * followed by a blank line ends the macro after its first parameter
 * and leaves the remaining parameters as stray file-scope tokens.
 */
#define	MDOC_ARGS	  const struct mdoc_meta *m, \
			  const struct mdoc_node *n, \
			  struct html *h
#define	MAN_ARGS	  const struct man_meta *m, \
			  const struct man_node *n, \
			  struct html *h
|
/*
 * Handler pair for one mdoc macro; the mdocs[] table holds one of
 * these per macro token.  Either member may be NULL.
 */
struct	htmlmdoc {
	/* Called before the node's children; the result is used by the
	 * caller as the "process children" flag. */
	int		(*pre)(MDOC_ARGS);
	/* Called after the node's children have been handled. */
	void		(*post)(MDOC_ARGS);
};
|
|
|
static void print_gen_doctype(struct html *); |
|
static void print_gen_head(struct html *); |
|
static void print_mdoc(MDOC_ARGS); |
|
static void print_mdoc_head(MDOC_ARGS); |
|
static void print_mdoc_node(MDOC_ARGS); |
|
static void print_man(MAN_ARGS); |
|
static void print_man_head(MAN_ARGS); |
|
static void print_man_body(MAN_ARGS); |
|
static void print_otag(struct html *, enum htmltag, |
|
int, const struct htmlpair *); |
|
static void print_ctag(struct html *, enum htmltag); |
static void print_ctag(struct html *, enum htmltag); |
static void print_encode(const char *); |
static void print_doctype(struct html *); |
static void print_text(struct html *, const char *); |
static void print_xmltype(struct html *); |
static int mdoc_root_pre(MDOC_ARGS); |
static int print_encode(struct html *, const char *, int); |
static void mdoc_root_post(MDOC_ARGS); |
static void print_metaf(struct html *, enum mandoc_esc); |
|
static void print_attr(struct html *, |
|
const char *, const char *); |
|
static void *ml_alloc(char *, enum htmltype); |
|
|
static int mdoc_nd_pre(MDOC_ARGS); |
|
static int mdoc_nm_pre(MDOC_ARGS); |
|
static void mdoc_nm_post(MDOC_ARGS); |
|
static int mdoc_pp_pre(MDOC_ARGS); |
|
static int mdoc_sh_pre(MDOC_ARGS); |
|
static void mdoc_sh_post(MDOC_ARGS); |
|
static int mdoc_ss_pre(MDOC_ARGS); |
|
static void mdoc_ss_post(MDOC_ARGS); |
|
|
|
static const struct htmlmdoc mdocs[MDOC_MAX] = { |
static void * |
{NULL, NULL}, /* Ap */ |
ml_alloc(char *outopts, enum htmltype type) |
{NULL, NULL}, /* Dd */ |
{ |
{NULL, NULL}, /* Dt */ |
struct html *h; |
{NULL, NULL}, /* Os */ |
const char *toks[4]; |
{mdoc_sh_pre, mdoc_sh_post }, /* Sh */ |
char *v; |
{mdoc_ss_pre, mdoc_ss_post }, /* Ss */ |
|
{mdoc_pp_pre, NULL}, /* Pp */ |
|
{NULL, NULL}, /* D1 */ |
|
{NULL, NULL}, /* Dl */ |
|
{NULL, NULL}, /* Bd */ |
|
{NULL, NULL}, /* Ed */ |
|
{NULL, NULL}, /* Bl */ |
|
{NULL, NULL}, /* El */ |
|
{NULL, NULL}, /* It */ |
|
{NULL, NULL}, /* Ad */ |
|
{NULL, NULL}, /* An */ |
|
{NULL, NULL}, /* Ar */ |
|
{NULL, NULL}, /* Cd */ |
|
{NULL, NULL}, /* Cm */ |
|
{NULL, NULL}, /* Dv */ |
|
{NULL, NULL}, /* Er */ |
|
{NULL, NULL}, /* Ev */ |
|
{NULL, NULL}, /* Ex */ |
|
{NULL, NULL}, /* Fa */ |
|
{NULL, NULL}, /* Fd */ |
|
{NULL, NULL}, /* Fl */ |
|
{NULL, NULL}, /* Fn */ |
|
{NULL, NULL}, /* Ft */ |
|
{NULL, NULL}, /* Ic */ |
|
{NULL, NULL}, /* In */ |
|
{NULL, NULL}, /* Li */ |
|
{mdoc_nd_pre, NULL}, /* Nd */ |
|
{mdoc_nm_pre, mdoc_nm_post}, /* Nm */ |
|
{NULL, NULL}, /* Op */ |
|
{NULL, NULL}, /* Ot */ |
|
{NULL, NULL}, /* Pa */ |
|
{NULL, NULL}, /* Rv */ |
|
{NULL, NULL}, /* St */ |
|
{NULL, NULL}, /* Va */ |
|
{NULL, NULL}, /* Vt */ |
|
{NULL, NULL}, /* Xr */ |
|
{NULL, NULL}, /* %A */ |
|
{NULL, NULL}, /* %B */ |
|
{NULL, NULL}, /* %D */ |
|
{NULL, NULL}, /* %I */ |
|
{NULL, NULL}, /* %J */ |
|
{NULL, NULL}, /* %N */ |
|
{NULL, NULL}, /* %O */ |
|
{NULL, NULL}, /* %P */ |
|
{NULL, NULL}, /* %R */ |
|
{NULL, NULL}, /* %T */ |
|
{NULL, NULL}, /* %V */ |
|
{NULL, NULL}, /* Ac */ |
|
{NULL, NULL}, /* Ao */ |
|
{NULL, NULL}, /* Aq */ |
|
{NULL, NULL}, /* At */ |
|
{NULL, NULL}, /* Bc */ |
|
{NULL, NULL}, /* Bf */ |
|
{NULL, NULL}, /* Bo */ |
|
{NULL, NULL}, /* Bq */ |
|
{NULL, NULL}, /* Bsx */ |
|
{NULL, NULL}, /* Bx */ |
|
{NULL, NULL}, /* Db */ |
|
{NULL, NULL}, /* Dc */ |
|
{NULL, NULL}, /* Do */ |
|
{NULL, NULL}, /* Dq */ |
|
{NULL, NULL}, /* Ec */ |
|
{NULL, NULL}, /* Ef */ |
|
{NULL, NULL}, /* Em */ |
|
{NULL, NULL}, /* Eo */ |
|
{NULL, NULL}, /* Fx */ |
|
{NULL, NULL}, /* Ms */ |
|
{NULL, NULL}, /* No */ |
|
{NULL, NULL}, /* Ns */ |
|
{NULL, NULL}, /* Nx */ |
|
{NULL, NULL}, /* Ox */ |
|
{NULL, NULL}, /* Pc */ |
|
{NULL, NULL}, /* Pf */ |
|
{NULL, NULL}, /* Po */ |
|
{NULL, NULL}, /* Pq */ |
|
{NULL, NULL}, /* Qc */ |
|
{NULL, NULL}, /* Ql */ |
|
{NULL, NULL}, /* Qo */ |
|
{NULL, NULL}, /* Qq */ |
|
{NULL, NULL}, /* Re */ |
|
{NULL, NULL}, /* Rs */ |
|
{NULL, NULL}, /* Sc */ |
|
{NULL, NULL}, /* So */ |
|
{NULL, NULL}, /* Sq */ |
|
{NULL, NULL}, /* Sm */ |
|
{NULL, NULL}, /* Sx */ |
|
{NULL, NULL}, /* Sy */ |
|
{NULL, NULL}, /* Tn */ |
|
{NULL, NULL}, /* Ux */ |
|
{NULL, NULL}, /* Xc */ |
|
{NULL, NULL}, /* Xo */ |
|
{NULL, NULL}, /* Fo */ |
|
{NULL, NULL}, /* Fc */ |
|
{NULL, NULL}, /* Oo */ |
|
{NULL, NULL}, /* Oc */ |
|
{NULL, NULL}, /* Bk */ |
|
{NULL, NULL}, /* Ek */ |
|
{NULL, NULL}, /* Bt */ |
|
{NULL, NULL}, /* Hf */ |
|
{NULL, NULL}, /* Fr */ |
|
{NULL, NULL}, /* Ud */ |
|
{NULL, NULL}, /* Lb */ |
|
{NULL, NULL}, /* Lp */ |
|
{NULL, NULL}, /* Lk */ |
|
{NULL, NULL}, /* Mt */ |
|
{NULL, NULL}, /* Brq */ |
|
{NULL, NULL}, /* Bro */ |
|
{NULL, NULL}, /* Brc */ |
|
{NULL, NULL}, /* %C */ |
|
{NULL, NULL}, /* Es */ |
|
{NULL, NULL}, /* En */ |
|
{NULL, NULL}, /* Dx */ |
|
{NULL, NULL}, /* %Q */ |
|
{NULL, NULL}, /* br */ |
|
{NULL, NULL}, /* sp */ |
|
}; |
|
|
|
|
toks[0] = "style"; |
|
toks[1] = "man"; |
|
toks[2] = "includes"; |
|
toks[3] = NULL; |
|
|
int |
h = mandoc_calloc(1, sizeof(struct html)); |
html_mdoc(void *arg, const struct mdoc *m) |
|
{ |
|
struct html *h; |
|
|
|
h = (struct html *)arg; |
h->type = type; |
|
h->tags.head = NULL; |
|
h->symtab = mchars_alloc(); |
|
|
print_gen_doctype(h); |
while (outopts && *outopts) |
print_otag(h, TAG_HTML, 0, NULL); |
switch (getsubopt(&outopts, UNCONST(toks), &v)) { |
print_mdoc(mdoc_meta(m), mdoc_node(m), h); |
case (0): |
print_ctag(h, TAG_HTML); |
h->style = v; |
printf("\n"); |
break; |
return(1); |
case (1): |
|
h->base_man = v; |
|
break; |
|
case (2): |
|
h->base_includes = v; |
|
break; |
|
default: |
|
break; |
|
} |
|
|
|
return(h); |
} |
} |
|
|
|
void * |
int |
html_alloc(char *outopts) |
html_man(void *arg, const struct man *m) |
|
{ |
{ |
struct html *h; |
|
|
|
h = (struct html *)arg; |
return(ml_alloc(outopts, HTML_HTML_4_01_STRICT)); |
|
|
print_gen_doctype(h); |
|
print_otag(h, TAG_HTML, 0, NULL); |
|
print_man(man_meta(m), man_node(m), h); |
|
print_ctag(h, TAG_HTML); |
|
printf("\n"); |
|
return(1); |
|
} |
} |
|
|
|
|
void * |
void * |
html_alloc(void) |
xhtml_alloc(char *outopts) |
{ |
{ |
|
|
return(calloc(1, sizeof(struct html))); |
return(ml_alloc(outopts, HTML_XHTML_1_0_STRICT)); |
} |
} |
|
|
|
|
void |
void |
html_free(void *p) |
html_free(void *p) |
{ |
{ |
|
struct tag *tag; |
|
struct html *h; |
|
|
free(p); |
h = (struct html *)p; |
} |
|
|
|
|
while ((tag = h->tags.head) != NULL) { |
|
h->tags.head = tag->next; |
|
free(tag); |
|
} |
|
|
|
if (h->symtab) |
|
mchars_free(h->symtab); |
|
|
static void |
free(h); |
print_mdoc(MDOC_ARGS) |
|
{ |
|
|
|
print_otag(h, TAG_HEAD, 0, NULL); |
|
print_mdoc_head(m, n, h); |
|
print_ctag(h, TAG_HEAD); |
|
print_otag(h, TAG_BODY, 0, NULL); |
|
print_mdoc_node(m, n, h); |
|
print_ctag(h, TAG_BODY); |
|
} |
} |
|
|
|
|
static void |
void |
print_gen_head(struct html *h) |
print_gen_head(struct html *h) |
{ |
{ |
struct htmlpair meta0[2]; |
struct htmlpair tag[4]; |
struct htmlpair meta1[2]; |
|
struct htmlpair link[4]; |
|
|
|
meta0[0].key = ATTR_HTTPEQUIV; |
tag[0].key = ATTR_HTTPEQUIV; |
meta0[0].val = "Content-Type"; |
tag[0].val = "Content-Type"; |
meta0[1].key = ATTR_CONTENT; |
tag[1].key = ATTR_CONTENT; |
meta0[1].val = "text/html; charest-utf-8"; |
tag[1].val = "text/html; charset=utf-8"; |
|
print_otag(h, TAG_META, 2, tag); |
|
|
meta1[0].key = ATTR_NAME; |
tag[0].key = ATTR_NAME; |
meta1[0].val = "resource-type"; |
tag[0].val = "resource-type"; |
meta1[1].key = ATTR_CONTENT; |
tag[1].key = ATTR_CONTENT; |
meta1[1].val = "document"; |
tag[1].val = "document"; |
|
print_otag(h, TAG_META, 2, tag); |
|
|
link[0].key = ATTR_REL; |
if (h->style) { |
link[0].val = "stylesheet"; |
tag[0].key = ATTR_REL; |
link[1].key = ATTR_HREF; |
tag[0].val = "stylesheet"; |
link[1].val = "style.css"; |
tag[1].key = ATTR_HREF; |
link[2].key = ATTR_TYPE; |
tag[1].val = h->style; |
link[2].val = "text/css"; |
tag[2].key = ATTR_TYPE; |
link[3].key = ATTR_MEDIA; |
tag[2].val = "text/css"; |
link[3].val = "all"; |
tag[3].key = ATTR_MEDIA; |
|
tag[3].val = "all"; |
print_otag(h, TAG_META, 2, meta0); |
print_otag(h, TAG_LINK, 4, tag); |
print_otag(h, TAG_META, 2, meta1); |
} |
print_otag(h, TAG_LINK, 4, link); |
|
} |
} |
|
|
|
/*
 * Write the character denoted by a numbered escape to standard output.
 * The sequence p of length len is translated with mchars_num2char();
 * a NUL result means there is nothing to print.  The html state is
 * accepted for signature symmetry with the other escape printers and
 * is not used.
 */
/* ARGSUSED */
static void
print_num(struct html *h, const char *p, size_t len)
{
	const char	 ch = mchars_num2char(p, len);

	if ('\0' == ch)
		return;

	putchar((int)ch);
}
|
|
static void |
static void |
print_mdoc_head(MDOC_ARGS) |
print_spec(struct html *h, const char *p, size_t len) |
{ |
{ |
|
int cp; |
|
const char *rhs; |
|
size_t sz; |
|
|
print_gen_head(h); |
if ((cp = mchars_spec2cp(h->symtab, p, len)) > 0) { |
print_otag(h, TAG_TITLE, 0, NULL); |
printf("&#%d;", cp); |
print_encode(m->title); |
return; |
print_ctag(h, TAG_TITLE); |
} else if (-1 == cp && 1 == len) { |
|
fwrite(p, 1, len, stdout); |
|
return; |
|
} else if (-1 == cp) |
|
return; |
|
|
|
if (NULL != (rhs = mchars_spec2str(h->symtab, p, len, &sz))) |
|
fwrite(rhs, 1, sz, stdout); |
} |
} |
|
|
|
|
static int |
static void |
mdoc_root_pre(MDOC_ARGS) |
print_res(struct html *h, const char *p, size_t len) |
{ |
{ |
struct htmlpair div; |
int cp; |
|
const char *rhs; |
|
size_t sz; |
|
|
div.key = ATTR_CLASS; |
if ((cp = mchars_res2cp(h->symtab, p, len)) > 0) { |
div.val = "body"; |
printf("&#%d;", cp); |
|
return; |
|
} else if (-1 == cp) |
|
return; |
|
|
print_otag(h, TAG_DIV, 1, &div); |
if (NULL != (rhs = mchars_res2str(h->symtab, p, len, &sz))) |
return(1); |
fwrite(rhs, 1, sz, stdout); |
} |
} |
|
|
|
|
static void |
static void |
mdoc_root_post(MDOC_ARGS) |
print_metaf(struct html *h, enum mandoc_esc deco) |
{ |
{ |
|
enum htmlfont font; |
|
|
print_ctag(h, TAG_DIV); |
switch (deco) { |
|
case (ESCAPE_FONTPREV): |
|
font = h->metal; |
|
break; |
|
case (ESCAPE_FONTITALIC): |
|
font = HTMLFONT_ITALIC; |
|
break; |
|
case (ESCAPE_FONTBOLD): |
|
font = HTMLFONT_BOLD; |
|
break; |
|
case (ESCAPE_FONTROMAN): |
|
font = HTMLFONT_NONE; |
|
break; |
|
default: |
|
abort(); |
|
/* NOTREACHED */ |
|
} |
|
|
|
if (h->metaf) { |
|
print_tagq(h, h->metaf); |
|
h->metaf = NULL; |
|
} |
|
|
|
h->metal = h->metac; |
|
h->metac = font; |
|
|
|
if (HTMLFONT_NONE != font) |
|
h->metaf = HTMLFONT_BOLD == font ? |
|
print_otag(h, TAG_B, 0, NULL) : |
|
print_otag(h, TAG_I, 0, NULL); |
} |
} |
|
|
|
int |
|
html_strlen(const char *cp) |
|
{ |
|
int ssz, sz; |
|
const char *seq, *p; |
|
|
|
/* |
|
* Account for escaped sequences within string length |
|
* calculations. This follows the logic in term_strlen() as we |
|
* must calculate the width of produced strings. |
|
* Assume that characters are always width of "1". This is |
|
* hacky, but it gets the job done for approximation of widths. |
|
*/ |
|
|
|
sz = 0; |
|
while (NULL != (p = strchr(cp, '\\'))) { |
|
sz += (int)(p - cp); |
|
++cp; |
|
switch (mandoc_escape(&cp, &seq, &ssz)) { |
|
case (ESCAPE_ERROR): |
|
return(sz); |
|
case (ESCAPE_NUMBERED): |
|
/* FALLTHROUGH */ |
|
case (ESCAPE_PREDEF): |
|
/* FALLTHROUGH */ |
|
case (ESCAPE_SPECIAL): |
|
sz++; |
|
break; |
|
default: |
|
break; |
|
} |
|
} |
|
|
|
assert(sz >= 0); |
|
return(sz + strlen(cp)); |
|
} |
|
|
static int |
static int |
mdoc_ss_pre(MDOC_ARGS) |
print_encode(struct html *h, const char *p, int norecurse) |
{ |
{ |
|
size_t sz; |
|
int len, nospace; |
|
const char *seq; |
|
enum mandoc_esc esc; |
|
static const char rejs[6] = { '\\', '<', '>', '&', ASCII_HYPH, '\0' }; |
|
|
if (MDOC_BODY == n->type) |
nospace = 0; |
print_otag(h, TAG_P, 0, NULL); |
|
if (MDOC_HEAD == n->type) |
while ('\0' != *p) { |
print_otag(h, TAG_H2, 0, NULL); |
sz = strcspn(p, rejs); |
return(1); |
|
|
fwrite(p, 1, sz, stdout); |
|
p += (int)sz; |
|
|
|
if ('\0' == *p) |
|
break; |
|
|
|
switch (*p++) { |
|
case ('<'): |
|
printf("<"); |
|
continue; |
|
case ('>'): |
|
printf(">"); |
|
continue; |
|
case ('&'): |
|
printf("&"); |
|
continue; |
|
case (ASCII_HYPH): |
|
putchar('-'); |
|
continue; |
|
default: |
|
break; |
|
} |
|
|
|
esc = mandoc_escape(&p, &seq, &len); |
|
if (ESCAPE_ERROR == esc) |
|
break; |
|
|
|
switch (esc) { |
|
case (ESCAPE_NUMBERED): |
|
print_num(h, seq, len); |
|
break; |
|
case (ESCAPE_PREDEF): |
|
print_res(h, seq, len); |
|
break; |
|
case (ESCAPE_SPECIAL): |
|
print_spec(h, seq, len); |
|
break; |
|
case (ESCAPE_FONTPREV): |
|
/* FALLTHROUGH */ |
|
case (ESCAPE_FONTBOLD): |
|
/* FALLTHROUGH */ |
|
case (ESCAPE_FONTITALIC): |
|
/* FALLTHROUGH */ |
|
case (ESCAPE_FONTROMAN): |
|
if (norecurse) |
|
break; |
|
print_metaf(h, esc); |
|
break; |
|
case (ESCAPE_NOSPACE): |
|
if ('\0' == *p) |
|
nospace = 1; |
|
break; |
|
default: |
|
break; |
|
} |
|
} |
|
|
|
return(nospace); |
} |
} |
|
|
|
|
static void |
static void |
mdoc_ss_post(MDOC_ARGS) |
print_attr(struct html *h, const char *key, const char *val) |
{ |
{ |
|
printf(" %s=\"", key); |
if (MDOC_BODY == n->type) |
(void)print_encode(h, val, 1); |
print_ctag(h, TAG_P); |
putchar('\"'); |
if (MDOC_HEAD == n->type) |
|
print_ctag(h, TAG_H2); |
|
} |
} |
|
|
|
|
static int |
struct tag * |
mdoc_pp_pre(MDOC_ARGS) |
print_otag(struct html *h, enum htmltag tag, |
|
int sz, const struct htmlpair *p) |
{ |
{ |
|
int i; |
|
struct tag *t; |
|
|
print_otag(h, TAG_P, 0, NULL); |
/* Push this tags onto the stack of open scopes. */ |
return(0); |
|
} |
|
|
|
|
if ( ! (HTML_NOSTACK & htmltags[tag].flags)) { |
|
t = mandoc_malloc(sizeof(struct tag)); |
|
t->tag = tag; |
|
t->next = h->tags.head; |
|
h->tags.head = t; |
|
} else |
|
t = NULL; |
|
|
static int |
if ( ! (HTML_NOSPACE & h->flags)) |
mdoc_nd_pre(MDOC_ARGS) |
if ( ! (HTML_CLRLINE & htmltags[tag].flags)) { |
{ |
/* Manage keeps! */ |
|
if ( ! (HTML_KEEP & h->flags)) { |
|
if (HTML_PREKEEP & h->flags) |
|
h->flags |= HTML_KEEP; |
|
putchar(' '); |
|
} else |
|
printf(" "); |
|
} |
|
|
if (MDOC_BODY == n->type) |
if ( ! (h->flags & HTML_NONOSPACE)) |
print_text(h, "--"); |
h->flags &= ~HTML_NOSPACE; |
return(1); |
else |
} |
h->flags |= HTML_NOSPACE; |
|
|
|
/* Print out the tag name and attributes. */ |
|
|
static int |
printf("<%s", htmltags[tag].name); |
mdoc_nm_pre(MDOC_ARGS) |
for (i = 0; i < sz; i++) |
{ |
print_attr(h, htmlattrs[p[i].key], p[i].val); |
struct htmlpair class; |
|
|
|
class.key = ATTR_CLASS; |
/* Add non-overridable attributes. */ |
class.val = "name"; |
|
|
|
print_otag(h, TAG_SPAN, 1, &class); |
if (TAG_HTML == tag && HTML_XHTML_1_0_STRICT == h->type) { |
if (NULL == n->child) |
print_attr(h, "xmlns", "http://www.w3.org/1999/xhtml"); |
print_text(h, m->name); |
print_attr(h, "xml:lang", "en"); |
|
print_attr(h, "lang", "en"); |
|
} |
|
|
return(1); |
/* Accommodate for XML "well-formed" singleton escaping. */ |
|
|
|
if (HTML_AUTOCLOSE & htmltags[tag].flags) |
|
switch (h->type) { |
|
case (HTML_XHTML_1_0_STRICT): |
|
putchar('/'); |
|
break; |
|
default: |
|
break; |
|
} |
|
|
|
putchar('>'); |
|
|
|
h->flags |= HTML_NOSPACE; |
|
|
|
if ((HTML_AUTOCLOSE | HTML_CLRLINE) & htmltags[tag].flags) |
|
putchar('\n'); |
|
|
|
return(t); |
} |
} |
|
|
|
|
static void |
static void |
mdoc_nm_post(MDOC_ARGS) |
print_ctag(struct html *h, enum htmltag tag) |
{ |
{ |
|
|
print_ctag(h, TAG_SPAN); |
printf("</%s>", htmltags[tag].name); |
|
if (HTML_CLRLINE & htmltags[tag].flags) { |
|
h->flags |= HTML_NOSPACE; |
|
putchar('\n'); |
|
} |
} |
} |
|
|
|
|
static int |
void |
mdoc_sh_pre(MDOC_ARGS) |
print_gen_decls(struct html *h) |
{ |
{ |
|
|
if (MDOC_BODY == n->type) |
print_xmltype(h); |
print_otag(h, TAG_P, 0, NULL); |
print_doctype(h); |
if (MDOC_HEAD == n->type) |
|
print_otag(h, TAG_H1, 0, NULL); |
|
return(1); |
|
} |
} |
|
|
|
|
static void |
static void |
mdoc_sh_post(MDOC_ARGS) |
print_xmltype(struct html *h) |
{ |
{ |
|
|
if (MDOC_BODY == n->type) |
if (HTML_XHTML_1_0_STRICT == h->type) |
print_ctag(h, TAG_P); |
puts("<?xml version=\"1.0\" encoding=\"UTF-8\"?>"); |
if (MDOC_HEAD == n->type) |
|
print_ctag(h, TAG_H1); |
|
} |
} |
|
|
|
|
static void |
static void |
print_mdoc_node(MDOC_ARGS) |
print_doctype(struct html *h) |
{ |
{ |
int child; |
const char *doctype; |
|
const char *dtd; |
|
const char *name; |
|
|
child = 1; |
switch (h->type) { |
|
case (HTML_HTML_4_01_STRICT): |
switch (n->type) { |
name = "HTML"; |
case (MDOC_ROOT): |
doctype = "-//W3C//DTD HTML 4.01//EN"; |
child = mdoc_root_pre(m, n, h); |
dtd = "http://www.w3.org/TR/html4/strict.dtd"; |
break; |
break; |
case (MDOC_TEXT): |
|
print_text(h, n->string); |
|
break; |
|
default: |
default: |
if (mdocs[n->tok].pre) |
name = "html"; |
child = (*mdocs[n->tok].pre)(m, n, h); |
doctype = "-//W3C//DTD XHTML 1.0 Strict//EN"; |
|
dtd = "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"; |
break; |
break; |
} |
} |
|
|
if (child && n->child) |
printf("<!DOCTYPE %s PUBLIC \"%s\" \"%s\">\n", |
print_mdoc_node(m, n->child, h); |
name, doctype, dtd); |
|
} |
|
|
switch (n->type) { |
void |
case (MDOC_ROOT): |
print_text(struct html *h, const char *word) |
mdoc_root_post(m, n, h); |
{ |
break; |
|
case (MDOC_TEXT): |
if ( ! (HTML_NOSPACE & h->flags)) { |
break; |
/* Manage keeps! */ |
default: |
if ( ! (HTML_KEEP & h->flags)) { |
if (mdocs[n->tok].post) |
if (HTML_PREKEEP & h->flags) |
(*mdocs[n->tok].post)(m, n, h); |
h->flags |= HTML_KEEP; |
break; |
putchar(' '); |
|
} else |
|
printf(" "); |
} |
} |
|
|
if (n->next) |
assert(NULL == h->metaf); |
print_mdoc_node(m, n->next, h); |
if (HTMLFONT_NONE != h->metac) |
} |
h->metaf = HTMLFONT_BOLD == h->metac ? |
|
print_otag(h, TAG_B, 0, NULL) : |
|
print_otag(h, TAG_I, 0, NULL); |
|
|
|
assert(word); |
|
if ( ! print_encode(h, word, 0)) |
|
if ( ! (h->flags & HTML_NONOSPACE)) |
|
h->flags &= ~HTML_NOSPACE; |
|
|
static void |
if (h->metaf) { |
print_man(MAN_ARGS) |
print_tagq(h, h->metaf); |
{ |
h->metaf = NULL; |
|
} |
|
|
print_otag(h, TAG_HEAD, 0, NULL); |
h->flags &= ~HTML_IGNDELIM; |
print_man_head(m, n, h); |
|
print_ctag(h, TAG_HEAD); |
|
print_otag(h, TAG_BODY, 0, NULL); |
|
print_man_body(m, n, h); |
|
print_ctag(h, TAG_BODY); |
|
} |
} |
|
|
|
|
static void |
void |
print_man_head(MAN_ARGS) |
print_tagq(struct html *h, const struct tag *until) |
{ |
{ |
|
struct tag *tag; |
|
|
print_gen_head(h); |
while ((tag = h->tags.head) != NULL) { |
print_otag(h, TAG_TITLE, 0, NULL); |
/* |
print_encode(m->title); |
* Remember to close out and nullify the current |
print_ctag(h, TAG_TITLE); |
* meta-font and table, if applicable. |
|
*/ |
|
if (tag == h->metaf) |
|
h->metaf = NULL; |
|
if (tag == h->tblt) |
|
h->tblt = NULL; |
|
print_ctag(h, tag->tag); |
|
h->tags.head = tag->next; |
|
free(tag); |
|
if (until && tag == until) |
|
return; |
|
} |
} |
} |
|
|
|
|
static void |
void |
print_man_body(MAN_ARGS) |
print_stagq(struct html *h, const struct tag *suntil) |
{ |
{ |
|
struct tag *tag; |
|
|
|
while ((tag = h->tags.head) != NULL) { |
|
if (suntil && tag == suntil) |
|
return; |
|
/* |
|
* Remember to close out and nullify the current |
|
* meta-font and table, if applicable. |
|
*/ |
|
if (tag == h->metaf) |
|
h->metaf = NULL; |
|
if (tag == h->tblt) |
|
h->tblt = NULL; |
|
print_ctag(h, tag->tag); |
|
h->tags.head = tag->next; |
|
free(tag); |
|
} |
} |
} |
|
|
|
|
static void |
void |
print_encode(const char *p) |
bufinit(struct html *h) |
{ |
{ |
|
|
printf("%s", p); /* XXX */ |
h->buf[0] = '\0'; |
|
h->buflen = 0; |
} |
} |
|
|
|
|
static void |
void |
print_otag(struct html *h, enum htmltag tag, |
bufcat_style(struct html *h, const char *key, const char *val) |
int sz, const struct htmlpair *p) |
|
{ |
{ |
int i; |
|
|
|
if ( ! (HTML_NOSPACE & h->flags)) |
bufcat(h, key); |
if ( ! (HTML_BLOCK & htmltags[tag].flags)) |
bufncat(h, ":", 1); |
printf(" "); |
bufcat(h, val); |
|
bufncat(h, ";", 1); |
|
} |
|
|
printf("<%s", htmltags[tag].name); |
|
for (i = 0; i < sz; i++) { |
|
printf(" %s=\"", htmlattrs[p[i].key]); |
|
assert(p->val); |
|
print_encode(p[i].val); |
|
printf("\""); |
|
} |
|
printf(">"); |
|
|
|
h->flags |= HTML_NOSPACE; |
void |
|
bufcat(struct html *h, const char *p) |
|
{ |
|
|
|
bufncat(h, p, strlen(p)); |
} |
} |
|
|
|
|
/* ARGSUSED */ |
void |
static void |
buffmt(struct html *h, const char *fmt, ...) |
print_ctag(struct html *h, enum htmltag tag) |
|
{ |
{ |
|
va_list ap; |
printf("</%s>", htmltags[tag].name); |
|
if (HTML_BLOCK & htmltags[tag].flags) |
va_start(ap, fmt); |
h->flags |= HTML_NOSPACE; |
(void)vsnprintf(h->buf + (int)h->buflen, |
|
BUFSIZ - h->buflen - 1, fmt, ap); |
|
va_end(ap); |
|
h->buflen = strlen(h->buf); |
} |
} |
|
|
|
|
/* ARGSUSED */ |
void |
static void |
bufncat(struct html *h, const char *p, size_t sz) |
print_gen_doctype(struct html *h) |
|
{ |
{ |
|
|
printf("<!DOCTYPE HTML PUBLIC \"%s\" \"%s\">\n", DOCTYPE, DTD); |
if (h->buflen + sz > BUFSIZ - 1) |
|
sz = BUFSIZ - 1 - h->buflen; |
|
|
|
(void)strncat(h->buf, p, sz); |
|
h->buflen += sz; |
} |
} |
|
|
|
|
static void |
void |
print_text(struct html *h, const char *p) |
buffmt_includes(struct html *h, const char *name) |
{ |
{ |
|
const char *p, *pp; |
|
|
if (*p && 0 == *(p + 1)) |
pp = h->base_includes; |
switch (*p) { |
|
case('.'): |
while (NULL != (p = strchr(pp, '%'))) { |
/* FALLTHROUGH */ |
bufncat(h, pp, (size_t)(p - pp)); |
case(','): |
switch (*(p + 1)) { |
/* FALLTHROUGH */ |
case('I'): |
case(';'): |
bufcat(h, name); |
/* FALLTHROUGH */ |
break; |
case(':'): |
|
/* FALLTHROUGH */ |
|
case('?'): |
|
/* FALLTHROUGH */ |
|
case('!'): |
|
/* FALLTHROUGH */ |
|
case(')'): |
|
/* FALLTHROUGH */ |
|
case(']'): |
|
/* FALLTHROUGH */ |
|
case('}'): |
|
h->flags |= HTML_NOSPACE; |
|
default: |
default: |
|
bufncat(h, p, 2); |
break; |
break; |
} |
} |
|
pp = p + 2; |
|
} |
|
if (pp) |
|
bufcat(h, pp); |
|
} |
|
|
if ( ! (h->flags & HTML_NOSPACE)) |
|
printf(" "); |
|
h->flags &= ~HTML_NOSPACE; |
|
|
|
if (p) |
void |
print_encode(p); |
buffmt_man(struct html *h, |
|
const char *name, const char *sec) |
|
{ |
|
const char *p, *pp; |
|
|
if (*p && 0 == *(p + 1)) |
pp = h->base_man; |
switch (*p) { |
|
case('('): |
/* LINTED */ |
/* FALLTHROUGH */ |
while (NULL != (p = strchr(pp, '%'))) { |
case('['): |
bufncat(h, pp, (size_t)(p - pp)); |
/* FALLTHROUGH */ |
switch (*(p + 1)) { |
case('{'): |
case('S'): |
h->flags |= HTML_NOSPACE; |
bufcat(h, sec ? sec : "1"); |
|
break; |
|
case('N'): |
|
buffmt(h, name); |
|
break; |
default: |
default: |
|
bufncat(h, p, 2); |
break; |
break; |
} |
} |
|
pp = p + 2; |
|
} |
|
if (pp) |
|
bufcat(h, pp); |
|
} |
|
|
|
|
|
void |
|
bufcat_su(struct html *h, const char *p, const struct roffsu *su) |
|
{ |
|
double v; |
|
|
|
v = su->scale; |
|
if (SCALE_MM == su->unit && 0.0 == (v /= 100.0)) |
|
v = 1.0; |
|
|
|
buffmt(h, "%s: %.2f%s;", p, v, roffscales[su->unit]); |
|
} |
|
|
|
|
|
/*
 * Append an identifier-safe encoding of src to the string in dst.
 *
 * dst must hold a NUL-terminated string and sz is the total size of
 * the dst buffer in bytes (more than 2).  A leading '#' in dst is
 * stepped over; if nothing follows it (or dst is empty), the
 * identifier is seeded with 'x' so that it does not begin with a
 * digit.  Every byte of src is then appended as two lower-case hex
 * digits for as long as space remains.  The result is always
 * NUL-terminated; when space runs out the output is truncated.
 */
void
html_idcat(char *dst, const char *src, int sz)
{
	int		 ssz;

	assert(sz > 2);

	/* Cf. <http://www.w3.org/TR/html4/types.html#h-6.2>. */

	/* We can't start with a number (bah). */

	if ('#' == *dst) {
		dst++;
		sz--;
	}
	if ('\0' == *dst) {
		*dst++ = 'x';
		*dst = '\0';
		sz--;
	}

	/* Jump to the end of what is already there. */
	for ( ; *dst != '\0' && sz; dst++, sz--)
		continue;

	for ( ; *src != '\0' && sz > 1; src++) {
		/*
		 * Go through unsigned char: a plain char holding a
		 * byte >= 0x80 would otherwise sign-extend and print
		 * as eight hex digits where char is signed.
		 */
		ssz = snprintf(dst, (size_t)sz, "%.2x",
		    (unsigned int)(unsigned char)*src);

		/*
		 * snprintf() reports the length it wanted to write.
		 * On error or truncation the buffer is full (and
		 * already terminated), so stop rather than advance
		 * dst and sz by more than was actually stored.
		 */
		if (ssz < 0 || ssz >= sz)
			break;

		sz -= ssz;
		dst += ssz;
	}
}
} |