version 1.157, 2014/04/23 16:08:33 |
version 1.178, 2014/10/27 13:31:04 |
|
|
/* $Id$ */ |
/* $Id$ */ |
/* |
/* |
* Copyright (c) 2008, 2009, 2010, 2011 Kristaps Dzonsons <kristaps@bsd.lv> |
* Copyright (c) 2008-2011, 2014 Kristaps Dzonsons <kristaps@bsd.lv> |
* Copyright (c) 2011, 2012, 2013, 2014 Ingo Schwarze <schwarze@openbsd.org> |
* Copyright (c) 2011, 2012, 2013, 2014 Ingo Schwarze <schwarze@openbsd.org> |
* |
* |
* Permission to use, copy, modify, and distribute this software for any |
* Permission to use, copy, modify, and distribute this software for any |
|
|
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF |
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF |
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
*/ |
*/ |
#ifdef HAVE_CONFIG_H |
|
#include "config.h" |
#include "config.h" |
#endif |
|
|
|
#include <sys/types.h> |
#include <sys/types.h> |
|
|
Line 70 static const struct htmldata htmltags[TAG_MAX] = { |
|
Line 68 static const struct htmldata htmltags[TAG_MAX] = { |
|
{"dt", HTML_CLRLINE}, /* TAG_DT */ |
{"dt", HTML_CLRLINE}, /* TAG_DT */ |
{"dd", HTML_CLRLINE}, /* TAG_DD */ |
{"dd", HTML_CLRLINE}, /* TAG_DD */ |
{"blockquote", HTML_CLRLINE}, /* TAG_BLOCKQUOTE */ |
{"blockquote", HTML_CLRLINE}, /* TAG_BLOCKQUOTE */ |
{"p", HTML_CLRLINE | HTML_NOSTACK | HTML_AUTOCLOSE}, /* TAG_P */ |
|
{"pre", HTML_CLRLINE }, /* TAG_PRE */ |
{"pre", HTML_CLRLINE }, /* TAG_PRE */ |
{"b", 0 }, /* TAG_B */ |
{"b", 0 }, /* TAG_B */ |
{"i", 0 }, /* TAG_I */ |
{"i", 0 }, /* TAG_I */ |
{"code", 0 }, /* TAG_CODE */ |
{"code", 0 }, /* TAG_CODE */ |
{"small", 0 }, /* TAG_SMALL */ |
{"small", 0 }, /* TAG_SMALL */ |
|
{"style", HTML_CLRLINE}, /* TAG_STYLE */ |
|
{"math", HTML_CLRLINE}, /* TAG_MATH */ |
|
{"mrow", 0}, /* TAG_MROW */ |
|
{"mi", 0}, /* TAG_MI */ |
|
{"mo", 0}, /* TAG_MO */ |
|
{"msup", 0}, /* TAG_MSUP */ |
|
{"msub", 0}, /* TAG_MSUB */ |
|
{"msubsup", 0}, /* TAG_MSUBSUP */ |
|
{"mfrac", 0}, /* TAG_MFRAC */ |
|
{"msqrt", 0}, /* TAG_MSQRT */ |
|
{"mfenced", 0}, /* TAG_MFENCED */ |
|
{"mtable", 0}, /* TAG_MTABLE */ |
|
{"mtr", 0}, /* TAG_MTR */ |
|
{"mtd", 0}, /* TAG_MTD */ |
|
{"munderover", 0}, /* TAG_MUNDEROVER */ |
|
{"munder", 0}, /* TAG_MUNDER*/ |
|
{"mover", 0}, /* TAG_MOVER*/ |
}; |
}; |
|
|
static const char *const htmlattrs[ATTR_MAX] = { |
static const char *const htmlattrs[ATTR_MAX] = { |
"http-equiv", /* ATTR_HTTPEQUIV */ |
|
"content", /* ATTR_CONTENT */ |
|
"name", /* ATTR_NAME */ |
"name", /* ATTR_NAME */ |
"rel", /* ATTR_REL */ |
"rel", /* ATTR_REL */ |
"href", /* ATTR_HREF */ |
"href", /* ATTR_HREF */ |
Line 88 static const char *const htmlattrs[ATTR_MAX] = { |
|
Line 100 static const char *const htmlattrs[ATTR_MAX] = { |
|
"media", /* ATTR_MEDIA */ |
"media", /* ATTR_MEDIA */ |
"class", /* ATTR_CLASS */ |
"class", /* ATTR_CLASS */ |
"style", /* ATTR_STYLE */ |
"style", /* ATTR_STYLE */ |
"width", /* ATTR_WIDTH */ |
|
"id", /* ATTR_ID */ |
"id", /* ATTR_ID */ |
"summary", /* ATTR_SUMMARY */ |
|
"align", /* ATTR_ALIGN */ |
|
"colspan", /* ATTR_COLSPAN */ |
"colspan", /* ATTR_COLSPAN */ |
|
"charset", /* ATTR_CHARSET */ |
|
"open", /* ATTR_OPEN */ |
|
"close", /* ATTR_CLOSE */ |
|
"mathvariant", /* ATTR_MATHVARIANT */ |
}; |
}; |
|
|
static const char *const roffscales[SCALE_MAX] = { |
static const char *const roffscales[SCALE_MAX] = { |
Line 110 static const char *const roffscales[SCALE_MAX] = { |
|
Line 123 static const char *const roffscales[SCALE_MAX] = { |
|
|
|
static void bufncat(struct html *, const char *, size_t); |
static void bufncat(struct html *, const char *, size_t); |
static void print_ctag(struct html *, enum htmltag); |
static void print_ctag(struct html *, enum htmltag); |
|
static int print_escape(char); |
static int print_encode(struct html *, const char *, int); |
static int print_encode(struct html *, const char *, int); |
static void print_metaf(struct html *, enum mandoc_esc); |
static void print_metaf(struct html *, enum mandoc_esc); |
static void print_attr(struct html *, const char *, const char *); |
static void print_attr(struct html *, const char *, const char *); |
static void *ml_alloc(char *, enum htmltype); |
static void *ml_alloc(char *); |
|
|
|
|
static void * |
static void * |
ml_alloc(char *outopts, enum htmltype type) |
ml_alloc(char *outopts) |
{ |
{ |
struct html *h; |
struct html *h; |
const char *toks[5]; |
const char *toks[5]; |
Line 131 ml_alloc(char *outopts, enum htmltype type) |
|
Line 145 ml_alloc(char *outopts, enum htmltype type) |
|
|
|
h = mandoc_calloc(1, sizeof(struct html)); |
h = mandoc_calloc(1, sizeof(struct html)); |
|
|
h->type = type; |
|
h->tags.head = NULL; |
h->tags.head = NULL; |
h->symtab = mchars_alloc(); |
h->symtab = mchars_alloc(); |
|
|
|
|
html_alloc(char *outopts) |
html_alloc(char *outopts) |
{ |
{ |
|
|
return(ml_alloc(outopts, HTML_HTML_4_01_STRICT)); |
return(ml_alloc(outopts)); |
} |
} |
|
|
void * |
void * |
xhtml_alloc(char *outopts) |
xhtml_alloc(char *outopts) |
{ |
{ |
|
|
return(ml_alloc(outopts, HTML_XHTML_1_0_STRICT)); |
return(ml_alloc(outopts)); |
} |
} |
|
|
void |
void |
|
|
print_gen_head(struct html *h) |
print_gen_head(struct html *h) |
{ |
{ |
struct htmlpair tag[4]; |
struct htmlpair tag[4]; |
|
struct tag *t; |
|
|
tag[0].key = ATTR_HTTPEQUIV; |
tag[0].key = ATTR_CHARSET; |
tag[0].val = "Content-Type"; |
tag[0].val = "utf-8"; |
tag[1].key = ATTR_CONTENT; |
print_otag(h, TAG_META, 1, tag); |
tag[1].val = "text/html; charset=utf-8"; |
|
print_otag(h, TAG_META, 2, tag); |
|
|
|
tag[0].key = ATTR_NAME; |
/* |
tag[0].val = "resource-type"; |
* Print a default style-sheet. |
tag[1].key = ATTR_CONTENT; |
*/ |
tag[1].val = "document"; |
t = print_otag(h, TAG_STYLE, 0, NULL); |
print_otag(h, TAG_META, 2, tag); |
print_text(h, "table.head, table.foot { width: 100%; }\n" |
|
"td.head-rtitle, td.foot-os { text-align: right; }\n" |
|
"td.head-vol { text-align: center; }\n" |
|
"table.foot td { width: 50%; }\n" |
|
"table.head td { width: 33%; }\n" |
|
"div.spacer { margin: 1em 0; }\n"); |
|
print_tagq(h, t); |
|
|
if (h->style) { |
if (h->style) { |
tag[0].key = ATTR_REL; |
tag[0].key = ATTR_REL; |
Line 324 html_strlen(const char *cp) |
|
Line 342 html_strlen(const char *cp) |
|
} |
} |
|
|
static int |
static int |
|
print_escape(char c) |
|
{ |
|
|
|
switch (c) { |
|
case '<': |
|
printf("<"); |
|
break; |
|
case '>': |
|
printf(">"); |
|
break; |
|
case '&': |
|
printf("&"); |
|
break; |
|
case '"': |
|
printf("""); |
|
break; |
|
case ASCII_NBRSP: |
|
putchar('-'); |
|
break; |
|
case ASCII_HYPH: |
|
putchar('-'); |
|
/* FALLTHROUGH */ |
|
case ASCII_BREAK: |
|
break; |
|
default: |
|
return(0); |
|
} |
|
return(1); |
|
} |
|
|
|
static int |
print_encode(struct html *h, const char *p, int norecurse) |
print_encode(struct html *h, const char *p, int norecurse) |
{ |
{ |
size_t sz; |
size_t sz; |
int c, len, nospace; |
int c, len, nospace; |
const char *seq; |
const char *seq; |
enum mandoc_esc esc; |
enum mandoc_esc esc; |
static const char rejs[8] = { '\\', '<', '>', '&', |
static const char rejs[9] = { '\\', '<', '>', '&', '"', |
ASCII_NBRSP, ASCII_HYPH, ASCII_BREAK, '\0' }; |
ASCII_NBRSP, ASCII_HYPH, ASCII_BREAK, '\0' }; |
|
|
nospace = 0; |
nospace = 0; |
Line 350 print_encode(struct html *h, const char *p, int norecu |
|
Line 399 print_encode(struct html *h, const char *p, int norecu |
|
if ('\0' == *p) |
if ('\0' == *p) |
break; |
break; |
|
|
switch (*p++) { |
if (print_escape(*p++)) |
case '<': |
|
printf("<"); |
|
continue; |
continue; |
case '>': |
|
printf(">"); |
|
continue; |
|
case '&': |
|
printf("&"); |
|
continue; |
|
case ASCII_NBRSP: |
|
putchar('-'); |
|
continue; |
|
case ASCII_HYPH: |
|
putchar('-'); |
|
/* FALLTHROUGH */ |
|
case ASCII_BREAK: |
|
continue; |
|
default: |
|
break; |
|
} |
|
|
|
esc = mandoc_escape(&p, &seq, &len); |
esc = mandoc_escape(&p, &seq, &len); |
if (ESCAPE_ERROR == esc) |
if (ESCAPE_ERROR == esc) |
Line 405 print_encode(struct html *h, const char *p, int norecu |
|
Line 435 print_encode(struct html *h, const char *p, int norecu |
|
|
|
switch (esc) { |
switch (esc) { |
case ESCAPE_UNICODE: |
case ESCAPE_UNICODE: |
/* Skip passed "u" header. */ |
/* Skip past "u" header. */ |
c = mchars_num2uc(seq + 1, len - 1); |
c = mchars_num2uc(seq + 1, len - 1); |
if ('\0' != c) |
|
printf("&#x%x;", c); |
/* |
|
* XXX Security warning: |
|
* For now, forbid Unicode obfuscation of ASCII |
|
* characters. An audit of the callers is |
|
* required before this can be removed. |
|
*/ |
|
|
|
if (c < 0x80) |
|
c = 0xFFFD; |
|
|
|
printf("&#x%x;", c); |
break; |
break; |
case ESCAPE_NUMBERED: |
case ESCAPE_NUMBERED: |
c = mchars_num2char(seq, len); |
c = mchars_num2char(seq, len); |
if ('\0' != c) |
if ( ! ('\0' == c || print_escape(c))) |
putchar(c); |
putchar(c); |
break; |
break; |
case ESCAPE_SPECIAL: |
case ESCAPE_SPECIAL: |
c = mchars_spec2cp(h->symtab, seq, len); |
c = mchars_spec2cp(h->symtab, seq, len); |
if (c > 0) |
if (c <= 0) |
|
break; |
|
if (c < 0x20 || c > 0x7e) |
printf("&#%d;", c); |
printf("&#%d;", c); |
else if (-1 == c && 1 == len) |
else if ( ! print_escape(c)) |
putchar((int)*seq); |
putchar(c); |
break; |
break; |
case ESCAPE_NOSPACE: |
case ESCAPE_NOSPACE: |
if ('\0' == *p) |
if ('\0' == *p) |
Line 481 print_otag(struct html *h, enum htmltag tag, |
|
Line 523 print_otag(struct html *h, enum htmltag tag, |
|
for (i = 0; i < sz; i++) |
for (i = 0; i < sz; i++) |
print_attr(h, htmlattrs[p[i].key], p[i].val); |
print_attr(h, htmlattrs[p[i].key], p[i].val); |
|
|
/* Add non-overridable attributes. */ |
/* Accommodate for "well-formed" singleton escaping. */ |
|
|
if (TAG_HTML == tag && HTML_XHTML_1_0_STRICT == h->type) { |
|
print_attr(h, "xmlns", "http://www.w3.org/1999/xhtml"); |
|
print_attr(h, "xml:lang", "en"); |
|
print_attr(h, "lang", "en"); |
|
} |
|
|
|
/* Accommodate for XML "well-formed" singleton escaping. */ |
|
|
|
if (HTML_AUTOCLOSE & htmltags[tag].flags) |
if (HTML_AUTOCLOSE & htmltags[tag].flags) |
switch (h->type) { |
putchar('/'); |
case HTML_XHTML_1_0_STRICT: |
|
putchar('/'); |
|
break; |
|
default: |
|
break; |
|
} |
|
|
|
putchar('>'); |
putchar('>'); |
|
|
Line 524 print_ctag(struct html *h, enum htmltag tag) |
|
Line 552 print_ctag(struct html *h, enum htmltag tag) |
|
void |
void |
print_gen_decls(struct html *h) |
print_gen_decls(struct html *h) |
{ |
{ |
const char *doctype; |
|
const char *dtd; |
|
const char *name; |
|
|
|
switch (h->type) { |
puts("<!DOCTYPE html>"); |
case HTML_HTML_4_01_STRICT: |
|
name = "HTML"; |
|
doctype = "-//W3C//DTD HTML 4.01//EN"; |
|
dtd = "http://www.w3.org/TR/html4/strict.dtd"; |
|
break; |
|
default: |
|
puts("<?xml version=\"1.0\" encoding=\"UTF-8\"?>"); |
|
name = "html"; |
|
doctype = "-//W3C//DTD XHTML 1.0 Strict//EN"; |
|
dtd = "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"; |
|
break; |
|
} |
|
|
|
printf("<!DOCTYPE %s PUBLIC \"%s\" \"%s\">\n", |
|
name, doctype, dtd); |
|
} |
} |
|
|
void |
void |
Line 636 print_stagq(struct html *h, const struct tag *suntil) |
|
Line 646 print_stagq(struct html *h, const struct tag *suntil) |
|
} |
} |
|
|
void |
void |
|
print_paragraph(struct html *h) |
|
{ |
|
struct tag *t; |
|
struct htmlpair tag; |
|
|
|
PAIR_CLASS_INIT(&tag, "spacer"); |
|
t = print_otag(h, TAG_DIV, 1, &tag); |
|
print_tagq(h, t); |
|
} |
|
|
|
|
|
void |
bufinit(struct html *h) |
bufinit(struct html *h) |
{ |
{ |
|
|
Line 747 bufcat_su(struct html *h, const char *p, const struct |
|
Line 769 bufcat_su(struct html *h, const char *p, const struct |
|
v = su->scale; |
v = su->scale; |
if (SCALE_MM == su->unit && 0.0 == (v /= 100.0)) |
if (SCALE_MM == su->unit && 0.0 == (v /= 100.0)) |
v = 1.0; |
v = 1.0; |
|
else if (SCALE_BU == su->unit) |
|
v /= 24.0; |
|
|
bufcat_fmt(h, "%s: %.2f%s;", p, v, roffscales[su->unit]); |
bufcat_fmt(h, "%s: %.2f%s;", p, v, roffscales[su->unit]); |
} |
} |