version 1.106, 2010/07/13 23:53:20 |
version 1.131, 2011/03/22 14:05:45 |
|
|
/* $Id$ */ |
/* $Id$ */ |
/* |
/* |
* Copyright (c) 2008, 2009, 2010 Kristaps Dzonsons <kristaps@bsd.lv> |
* Copyright (c) 2008, 2009, 2010, 2011 Kristaps Dzonsons <kristaps@bsd.lv> |
|
* Copyright (c) 2011 Ingo Schwarze <schwarze@openbsd.org> |
* |
* |
* Permission to use, copy, modify, and distribute this software for any |
* Permission to use, copy, modify, and distribute this software for any |
* purpose with or without fee is hereby granted, provided that the above |
* purpose with or without fee is hereby granted, provided that the above |
|
|
|
|
#include "mandoc.h" |
#include "mandoc.h" |
#include "out.h" |
#include "out.h" |
#include "chars.h" |
|
#include "html.h" |
#include "html.h" |
#include "main.h" |
#include "main.h" |
|
|
Line 57 static const struct htmldata htmltags[TAG_MAX] = { |
|
Line 57 static const struct htmldata htmltags[TAG_MAX] = { |
|
{"br", HTML_CLRLINE | HTML_NOSTACK | HTML_AUTOCLOSE}, /* TAG_BR */ |
{"br", HTML_CLRLINE | HTML_NOSTACK | HTML_AUTOCLOSE}, /* TAG_BR */ |
{"a", 0}, /* TAG_A */ |
{"a", 0}, /* TAG_A */ |
{"table", HTML_CLRLINE}, /* TAG_TABLE */ |
{"table", HTML_CLRLINE}, /* TAG_TABLE */ |
|
{"tbody", HTML_CLRLINE}, /* TAG_TBODY */ |
{"col", HTML_CLRLINE | HTML_NOSTACK | HTML_AUTOCLOSE}, /* TAG_COL */ |
{"col", HTML_CLRLINE | HTML_NOSTACK | HTML_AUTOCLOSE}, /* TAG_COL */ |
{"tr", HTML_CLRLINE}, /* TAG_TR */ |
{"tr", HTML_CLRLINE}, /* TAG_TR */ |
{"td", HTML_CLRLINE}, /* TAG_TD */ |
{"td", HTML_CLRLINE}, /* TAG_TD */ |
{"li", HTML_CLRLINE}, /* TAG_LI */ |
{"li", HTML_CLRLINE}, /* TAG_LI */ |
{"ul", HTML_CLRLINE}, /* TAG_UL */ |
{"ul", HTML_CLRLINE}, /* TAG_UL */ |
{"ol", HTML_CLRLINE}, /* TAG_OL */ |
{"ol", HTML_CLRLINE}, /* TAG_OL */ |
|
{"dl", HTML_CLRLINE}, /* TAG_DL */ |
|
{"dt", HTML_CLRLINE}, /* TAG_DT */ |
|
{"dd", HTML_CLRLINE}, /* TAG_DD */ |
|
{"blockquote", HTML_CLRLINE}, /* TAG_BLOCKQUOTE */ |
|
{"p", HTML_CLRLINE | HTML_NOSTACK | HTML_AUTOCLOSE}, /* TAG_P */ |
|
{"pre", HTML_CLRLINE }, /* TAG_PRE */ |
|
{"b", 0 }, /* TAG_B */ |
|
{"i", 0 }, /* TAG_I */ |
|
{"code", 0 }, /* TAG_CODE */ |
|
{"small", 0 }, /* TAG_SMALL */ |
}; |
}; |
|
|
static const char *const htmlfonts[HTMLFONT_MAX] = { |
|
"roman", |
|
"bold", |
|
"italic" |
|
}; |
|
|
|
static const char *const htmlattrs[ATTR_MAX] = { |
static const char *const htmlattrs[ATTR_MAX] = { |
"http-equiv", |
"http-equiv", /* ATTR_HTTPEQUIV */ |
"content", |
"content", /* ATTR_CONTENT */ |
"name", |
"name", /* ATTR_NAME */ |
"rel", |
"rel", /* ATTR_REL */ |
"href", |
"href", /* ATTR_HREF */ |
"type", |
"type", /* ATTR_TYPE */ |
"media", |
"media", /* ATTR_MEDIA */ |
"class", |
"class", /* ATTR_CLASS */ |
"style", |
"style", /* ATTR_STYLE */ |
"width", |
"width", /* ATTR_WIDTH */ |
"valign", |
"id", /* ATTR_ID */ |
"target", |
"summary", /* ATTR_SUMMARY */ |
"id", |
"align", /* ATTR_ALIGN */ |
"summary", |
"colspan", /* ATTR_COLSPAN */ |
}; |
}; |
|
|
static void print_spec(struct html *, const char *, size_t); |
static void print_num(struct html *, const char *, size_t); |
|
static void print_spec(struct html *, enum roffdeco, |
|
const char *, size_t); |
static void print_res(struct html *, const char *, size_t); |
static void print_res(struct html *, const char *, size_t); |
static void print_ctag(struct html *, enum htmltag); |
static void print_ctag(struct html *, enum htmltag); |
static void print_doctype(struct html *); |
static void print_doctype(struct html *); |
Line 112 ml_alloc(char *outopts, enum htmltype type) |
|
Line 119 ml_alloc(char *outopts, enum htmltype type) |
|
toks[2] = "includes"; |
toks[2] = "includes"; |
toks[3] = NULL; |
toks[3] = NULL; |
|
|
h = calloc(1, sizeof(struct html)); |
h = mandoc_calloc(1, sizeof(struct html)); |
if (NULL == h) { |
|
perror(NULL); |
|
exit(EXIT_FAILURE); |
|
} |
|
|
|
h->type = type; |
h->type = type; |
h->tags.head = NULL; |
h->tags.head = NULL; |
h->ords.head = NULL; |
|
h->symtab = chars_init(CHARS_HTML); |
h->symtab = chars_init(CHARS_HTML); |
|
|
while (outopts && *outopts) |
while (outopts && *outopts) |
|
|
html_free(void *p) |
html_free(void *p) |
{ |
{ |
struct tag *tag; |
struct tag *tag; |
struct ord *ord; |
|
struct html *h; |
struct html *h; |
|
|
h = (struct html *)p; |
h = (struct html *)p; |
|
|
while ((ord = h->ords.head) != NULL) { |
|
h->ords.head = ord->next; |
|
free(ord); |
|
} |
|
|
|
while ((tag = h->tags.head) != NULL) { |
while ((tag = h->tags.head) != NULL) { |
h->tags.head = tag->next; |
h->tags.head = tag->next; |
free(tag); |
free(tag); |
Line 213 print_gen_head(struct html *h) |
|
Line 209 print_gen_head(struct html *h) |
|
} |
} |
} |
} |
|
|
|
/* ARGSUSED */ |
|
static void |
|
print_num(struct html *h, const char *p, size_t len) |
|
{ |
|
const char *rhs; |
|
|
|
rhs = chars_num2char(p, len); |
|
if (rhs) |
|
putchar((int)*rhs); |
|
} |
|
|
static void |
static void |
print_spec(struct html *h, const char *p, size_t len) |
print_spec(struct html *h, enum roffdeco d, const char *p, size_t len) |
{ |
{ |
|
int cp; |
const char *rhs; |
const char *rhs; |
size_t sz; |
size_t sz; |
|
|
rhs = chars_a2ascii(h->symtab, p, len, &sz); |
if ((cp = chars_spec2cp(h->symtab, p, len)) > 0) { |
|
printf("&#%d;", cp); |
if (NULL == rhs) |
|
return; |
return; |
fwrite(rhs, 1, sz, stdout); |
} else if (-1 == cp && DECO_SSPECIAL == d) { |
|
fwrite(p, 1, len, stdout); |
|
return; |
|
} else if (-1 == cp) |
|
return; |
|
|
|
if (NULL != (rhs = chars_spec2str(h->symtab, p, len, &sz))) |
|
fwrite(rhs, 1, sz, stdout); |
} |
} |
|
|
|
|
static void |
static void |
print_res(struct html *h, const char *p, size_t len) |
print_res(struct html *h, const char *p, size_t len) |
{ |
{ |
|
int cp; |
const char *rhs; |
const char *rhs; |
size_t sz; |
size_t sz; |
|
|
rhs = chars_a2res(h->symtab, p, len, &sz); |
if ((cp = chars_res2cp(h->symtab, p, len)) > 0) { |
|
printf("&#%d;", cp); |
if (NULL == rhs) |
|
return; |
return; |
fwrite(rhs, 1, sz, stdout); |
} else if (-1 == cp) |
} |
return; |
|
|
|
if (NULL != (rhs = chars_res2str(h->symtab, p, len, &sz))) |
struct tag * |
fwrite(rhs, 1, sz, stdout); |
print_ofont(struct html *h, enum htmlfont font) |
|
{ |
|
struct htmlpair tag; |
|
|
|
h->metal = h->metac; |
|
h->metac = font; |
|
|
|
/* FIXME: DECO_ROMAN should just close out preexisting. */ |
|
|
|
if (h->metaf && h->tags.head == h->metaf) |
|
print_tagq(h, h->metaf); |
|
|
|
PAIR_CLASS_INIT(&tag, htmlfonts[font]); |
|
h->metaf = print_otag(h, TAG_SPAN, 1, &tag); |
|
return(h->metaf); |
|
} |
} |
|
|
|
|
Line 284 print_metaf(struct html *h, enum roffdeco deco) |
|
Line 282 print_metaf(struct html *h, enum roffdeco deco) |
|
/* NOTREACHED */ |
/* NOTREACHED */ |
} |
} |
|
|
(void)print_ofont(h, font); |
if (h->metaf) { |
|
print_tagq(h, h->metaf); |
|
h->metaf = NULL; |
|
} |
|
|
|
h->metal = h->metac; |
|
h->metac = font; |
|
|
|
if (HTMLFONT_NONE != font) |
|
h->metaf = HTMLFONT_BOLD == font ? |
|
print_otag(h, TAG_B, 0, NULL) : |
|
print_otag(h, TAG_I, 0, NULL); |
} |
} |
|
|
|
|
Line 331 print_encode(struct html *h, const char *p, int norecu |
|
Line 340 print_encode(struct html *h, const char *p, int norecu |
|
len = a2roffdeco(&deco, &seq, &sz); |
len = a2roffdeco(&deco, &seq, &sz); |
|
|
switch (deco) { |
switch (deco) { |
|
case (DECO_NUMBERED): |
|
print_num(h, seq, sz); |
|
break; |
case (DECO_RESERVED): |
case (DECO_RESERVED): |
print_res(h, seq, sz); |
print_res(h, seq, sz); |
break; |
break; |
|
case (DECO_SSPECIAL): |
|
/* FALLTHROUGH */ |
case (DECO_SPECIAL): |
case (DECO_SPECIAL): |
print_spec(h, seq, sz); |
print_spec(h, deco, seq, sz); |
break; |
break; |
case (DECO_PREVIOUS): |
case (DECO_PREVIOUS): |
/* FALLTHROUGH */ |
/* FALLTHROUGH */ |
Line 381 print_otag(struct html *h, enum htmltag tag, |
|
Line 395 print_otag(struct html *h, enum htmltag tag, |
|
/* Push this tags onto the stack of open scopes. */ |
/* Push this tags onto the stack of open scopes. */ |
|
|
if ( ! (HTML_NOSTACK & htmltags[tag].flags)) { |
if ( ! (HTML_NOSTACK & htmltags[tag].flags)) { |
t = malloc(sizeof(struct tag)); |
t = mandoc_malloc(sizeof(struct tag)); |
if (NULL == t) { |
|
perror(NULL); |
|
exit(EXIT_FAILURE); |
|
} |
|
t->tag = tag; |
t->tag = tag; |
t->next = h->tags.head; |
t->next = h->tags.head; |
h->tags.head = t; |
h->tags.head = t; |
Line 403 print_otag(struct html *h, enum htmltag tag, |
|
Line 413 print_otag(struct html *h, enum htmltag tag, |
|
printf(" "); |
printf(" "); |
} |
} |
|
|
|
if ( ! (h->flags & HTML_NONOSPACE)) |
|
h->flags &= ~HTML_NOSPACE; |
|
else |
|
h->flags |= HTML_NOSPACE; |
|
|
/* Print out the tag name and attributes. */ |
/* Print out the tag name and attributes. */ |
|
|
printf("<%s", htmltags[tag].name); |
printf("<%s", htmltags[tag].name); |
Line 431 print_otag(struct html *h, enum htmltag tag, |
|
Line 446 print_otag(struct html *h, enum htmltag tag, |
|
putchar('>'); |
putchar('>'); |
|
|
h->flags |= HTML_NOSPACE; |
h->flags |= HTML_NOSPACE; |
|
|
|
if ((HTML_AUTOCLOSE | HTML_CLRLINE) & htmltags[tag].flags) |
|
putchar('\n'); |
|
|
return(t); |
return(t); |
} |
} |
|
|
Line 461 print_xmltype(struct html *h) |
|
Line 480 print_xmltype(struct html *h) |
|
{ |
{ |
|
|
if (HTML_XHTML_1_0_STRICT == h->type) |
if (HTML_XHTML_1_0_STRICT == h->type) |
printf("<?xml version=\"1.0\" encoding=\"UTF-8\"?>"); |
puts("<?xml version=\"1.0\" encoding=\"UTF-8\"?>"); |
} |
} |
|
|
|
|
Line 489 print_doctype(struct html *h) |
|
Line 508 print_doctype(struct html *h) |
|
name, doctype, dtd); |
name, doctype, dtd); |
} |
} |
|
|
|
|
void |
void |
print_text(struct html *h, const char *word) |
print_text(struct html *h, const char *word) |
{ |
{ |
|
|
if (word[0] && '\0' == word[1]) |
|
switch (word[0]) { |
|
case('.'): |
|
/* FALLTHROUGH */ |
|
case(','): |
|
/* FALLTHROUGH */ |
|
case(';'): |
|
/* FALLTHROUGH */ |
|
case(':'): |
|
/* FALLTHROUGH */ |
|
case('?'): |
|
/* FALLTHROUGH */ |
|
case('!'): |
|
/* FALLTHROUGH */ |
|
case(')'): |
|
/* FALLTHROUGH */ |
|
case(']'): |
|
if ( ! (HTML_IGNDELIM & h->flags)) |
|
h->flags |= HTML_NOSPACE; |
|
break; |
|
default: |
|
break; |
|
} |
|
|
|
if ( ! (HTML_NOSPACE & h->flags)) { |
if ( ! (HTML_NOSPACE & h->flags)) { |
/* Manage keeps! */ |
/* Manage keeps! */ |
if ( ! (HTML_KEEP & h->flags)) { |
if ( ! (HTML_KEEP & h->flags)) { |
Line 528 print_text(struct html *h, const char *word) |
|
Line 522 print_text(struct html *h, const char *word) |
|
printf(" "); |
printf(" "); |
} |
} |
|
|
|
assert(NULL == h->metaf); |
|
if (HTMLFONT_NONE != h->metac) |
|
h->metaf = HTMLFONT_BOLD == h->metac ? |
|
print_otag(h, TAG_B, 0, NULL) : |
|
print_otag(h, TAG_I, 0, NULL); |
|
|
assert(word); |
assert(word); |
if ( ! print_encode(h, word, 0)) |
if ( ! print_encode(h, word, 0)) |
h->flags &= ~HTML_NOSPACE; |
if ( ! (h->flags & HTML_NONOSPACE)) |
|
h->flags &= ~HTML_NOSPACE; |
|
|
/* |
if (h->metaf) { |
* Note that we don't process the pipe: the parser sees it as |
print_tagq(h, h->metaf); |
* punctuation, but we don't in terms of typography. |
h->metaf = NULL; |
*/ |
} |
if (word[0] && '\0' == word[1]) |
|
switch (word[0]) { |
h->flags &= ~HTML_IGNDELIM; |
case('('): |
|
/* FALLTHROUGH */ |
|
case('['): |
|
h->flags |= HTML_NOSPACE; |
|
break; |
|
default: |
|
break; |
|
} |
|
} |
} |
|
|
|
|
Line 555 print_tagq(struct html *h, const struct tag *until) |
|
Line 548 print_tagq(struct html *h, const struct tag *until) |
|
struct tag *tag; |
struct tag *tag; |
|
|
while ((tag = h->tags.head) != NULL) { |
while ((tag = h->tags.head) != NULL) { |
|
/* |
|
* Remember to close out and nullify the current |
|
* meta-font and table, if applicable. |
|
*/ |
if (tag == h->metaf) |
if (tag == h->metaf) |
h->metaf = NULL; |
h->metaf = NULL; |
|
if (tag == h->tblt) |
|
h->tblt = NULL; |
print_ctag(h, tag->tag); |
print_ctag(h, tag->tag); |
h->tags.head = tag->next; |
h->tags.head = tag->next; |
free(tag); |
free(tag); |
Line 574 print_stagq(struct html *h, const struct tag *suntil) |
|
Line 573 print_stagq(struct html *h, const struct tag *suntil) |
|
while ((tag = h->tags.head) != NULL) { |
while ((tag = h->tags.head) != NULL) { |
if (suntil && tag == suntil) |
if (suntil && tag == suntil) |
return; |
return; |
|
/* |
|
* Remember to close out and nullify the current |
|
* meta-font and table, if applicable. |
|
*/ |
if (tag == h->metaf) |
if (tag == h->metaf) |
h->metaf = NULL; |
h->metaf = NULL; |
|
if (tag == h->tblt) |
|
h->tblt = NULL; |
print_ctag(h, tag->tag); |
print_ctag(h, tag->tag); |
h->tags.head = tag->next; |
h->tags.head = tag->next; |
free(tag); |
free(tag); |
Line 745 html_idcat(char *dst, const char *src, int sz) |
|
Line 750 html_idcat(char *dst, const char *src, int sz) |
|
{ |
{ |
int ssz; |
int ssz; |
|
|
assert(sz); |
assert(sz > 2); |
|
|
/* Cf. <http://www.w3.org/TR/html4/types.html#h-6.2>. */ |
/* Cf. <http://www.w3.org/TR/html4/types.html#h-6.2>. */ |
|
|
for ( ; *dst != '\0' && sz; dst++, sz--) |
|
/* Jump to end. */ ; |
|
|
|
assert(sz > 2); |
|
|
|
/* We can't start with a number (bah). */ |
/* We can't start with a number (bah). */ |
|
|
*dst++ = 'x'; |
if ('#' == *dst) { |
*dst = '\0'; |
dst++; |
sz--; |
sz--; |
|
} |
|
if ('\0' == *dst) { |
|
*dst++ = 'x'; |
|
*dst = '\0'; |
|
sz--; |
|
} |
|
|
|
for ( ; *dst != '\0' && sz; dst++, sz--) |
|
/* Jump to end. */ ; |
|
|
for ( ; *src != '\0' && sz > 1; src++) { |
for ( ; *src != '\0' && sz > 1; src++) { |
ssz = snprintf(dst, (size_t)sz, "%.2x", *src); |
ssz = snprintf(dst, (size_t)sz, "%.2x", *src); |