version 1.82, 2009/11/09 05:11:46 |
version 1.207, 2017/02/05 20:22:04 |
|
|
/* $Id$ */ |
/* $Id$ */ |
/* |
/* |
* Copyright (c) 2008, 2009 Kristaps Dzonsons <kristaps@kth.se> |
* Copyright (c) 2008-2011, 2014 Kristaps Dzonsons <kristaps@bsd.lv> |
|
* Copyright (c) 2011-2015, 2017 Ingo Schwarze <schwarze@openbsd.org> |
* |
* |
* Permission to use, copy, modify, and distribute this software for any |
* Permission to use, copy, modify, and distribute this software for any |
* purpose with or without fee is hereby granted, provided that the above |
* purpose with or without fee is hereby granted, provided that the above |
* copyright notice and this permission notice appear in all copies. |
* copyright notice and this permission notice appear in all copies. |
* |
* |
* THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES |
* THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHORS DISCLAIM ALL WARRANTIES |
* WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF |
* WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF |
* MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR |
* MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR |
* ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES |
* ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES |
* WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN |
* WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN |
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF |
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF |
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
*/ |
*/ |
|
#include "config.h" |
|
|
#include <sys/types.h> |
#include <sys/types.h> |
|
|
#include <assert.h> |
#include <assert.h> |
|
|
#include <string.h> |
#include <string.h> |
#include <unistd.h> |
#include <unistd.h> |
|
|
|
#include "mandoc.h" |
|
#include "mandoc_aux.h" |
#include "out.h" |
#include "out.h" |
#include "chars.h" |
|
#include "html.h" |
#include "html.h" |
|
#include "manconf.h" |
#include "main.h" |
#include "main.h" |
|
|
#define UNCONST(a) ((void *)(uintptr_t)(const void *)(a)) |
|
|
|
#define DOCTYPE "-//W3C//DTD HTML 4.01//EN" |
|
#define DTD "http://www.w3.org/TR/html4/strict.dtd" |
|
|
|
struct htmldata { |
struct htmldata { |
const char *name; |
const char *name; |
int flags; |
int flags; |
#define HTML_CLRLINE (1 << 0) |
#define HTML_NOSTACK (1 << 0) |
#define HTML_NOSTACK (1 << 1) |
#define HTML_AUTOCLOSE (1 << 1) |
|
#define HTML_NLBEFORE (1 << 2) |
|
#define HTML_NLBEGIN (1 << 3) |
|
#define HTML_NLEND (1 << 4) |
|
#define HTML_NLAFTER (1 << 5) |
|
#define HTML_NLAROUND (HTML_NLBEFORE | HTML_NLAFTER) |
|
#define HTML_NLINSIDE (HTML_NLBEGIN | HTML_NLEND) |
|
#define HTML_NLALL (HTML_NLAROUND | HTML_NLINSIDE) |
|
#define HTML_INDENT (1 << 6) |
|
#define HTML_NOINDENT (1 << 7) |
}; |
}; |
|
|
static const struct htmldata htmltags[TAG_MAX] = { |
static const struct htmldata htmltags[TAG_MAX] = { |
{"html", HTML_CLRLINE}, /* TAG_HTML */ |
{"html", HTML_NLALL}, |
{"head", HTML_CLRLINE}, /* TAG_HEAD */ |
{"head", HTML_NLALL | HTML_INDENT}, |
{"body", HTML_CLRLINE}, /* TAG_BODY */ |
{"body", HTML_NLALL}, |
{"meta", HTML_CLRLINE | HTML_NOSTACK}, /* TAG_META */ |
{"meta", HTML_NOSTACK | HTML_AUTOCLOSE | HTML_NLALL}, |
{"title", HTML_CLRLINE}, /* TAG_TITLE */ |
{"title", HTML_NLAROUND}, |
{"div", HTML_CLRLINE}, /* TAG_DIV */ |
{"div", HTML_NLAROUND}, |
{"h1", 0}, /* TAG_H1 */ |
{"h1", HTML_NLAROUND}, |
{"h2", 0}, /* TAG_H2 */ |
{"h2", HTML_NLAROUND}, |
{"p", HTML_CLRLINE}, /* TAG_P */ |
{"span", 0}, |
{"span", 0}, /* TAG_SPAN */ |
{"link", HTML_NOSTACK | HTML_AUTOCLOSE | HTML_NLALL}, |
{"link", HTML_CLRLINE | HTML_NOSTACK}, /* TAG_LINK */ |
{"br", HTML_NOSTACK | HTML_AUTOCLOSE | HTML_NLALL}, |
{"br", HTML_CLRLINE | HTML_NOSTACK}, /* TAG_LINK */ |
{"a", 0}, |
{"a", 0}, /* TAG_A */ |
{"table", HTML_NLALL | HTML_INDENT}, |
{"table", HTML_CLRLINE}, /* TAG_TABLE */ |
{"colgroup", HTML_NLALL | HTML_INDENT}, |
{"col", HTML_CLRLINE | HTML_NOSTACK}, /* TAG_COL */ |
{"col", HTML_NOSTACK | HTML_AUTOCLOSE | HTML_NLALL}, |
{"tr", HTML_CLRLINE}, /* TAG_TR */ |
{"tr", HTML_NLALL | HTML_INDENT}, |
{"td", HTML_CLRLINE}, /* TAG_TD */ |
{"td", HTML_NLAROUND}, |
{"li", HTML_CLRLINE}, /* TAG_LI */ |
{"li", HTML_NLAROUND | HTML_INDENT}, |
{"ul", HTML_CLRLINE}, /* TAG_UL */ |
{"ul", HTML_NLALL | HTML_INDENT}, |
{"ol", HTML_CLRLINE}, /* TAG_OL */ |
{"ol", HTML_NLALL | HTML_INDENT}, |
{"base", HTML_CLRLINE | HTML_NOSTACK}, /* TAG_BASE */ |
{"dl", HTML_NLALL | HTML_INDENT}, |
|
{"dt", HTML_NLAROUND}, |
|
{"dd", HTML_NLAROUND | HTML_INDENT}, |
|
{"pre", HTML_NLALL | HTML_NOINDENT}, |
|
{"var", 0}, |
|
{"cite", 0}, |
|
{"b", 0}, |
|
{"i", 0}, |
|
{"code", 0}, |
|
{"small", 0}, |
|
{"style", HTML_NLALL | HTML_INDENT}, |
|
{"math", HTML_NLALL | HTML_INDENT}, |
|
{"mrow", 0}, |
|
{"mi", 0}, |
|
{"mo", 0}, |
|
{"msup", 0}, |
|
{"msub", 0}, |
|
{"msubsup", 0}, |
|
{"mfrac", 0}, |
|
{"msqrt", 0}, |
|
{"mfenced", 0}, |
|
{"mtable", 0}, |
|
{"mtr", 0}, |
|
{"mtd", 0}, |
|
{"munderover", 0}, |
|
{"munder", 0}, |
|
{"mover", 0}, |
}; |
}; |
|
|
static const char *const htmlattrs[ATTR_MAX] = { |
static const char *const roffscales[SCALE_MAX] = { |
"http-equiv", |
"cm", /* SCALE_CM */ |
"content", |
"in", /* SCALE_IN */ |
"name", |
"pc", /* SCALE_PC */ |
"rel", |
"pt", /* SCALE_PT */ |
"href", |
"em", /* SCALE_EM */ |
"type", |
"em", /* SCALE_MM */ |
"media", |
"ex", /* SCALE_EN */ |
"class", |
"ex", /* SCALE_BU */ |
"style", |
"em", /* SCALE_VS */ |
"width", |
"ex", /* SCALE_FS */ |
"valign", |
|
"target", |
|
"id", |
|
"summary", |
|
}; |
}; |
|
|
#ifdef __linux__ |
static void a2width(const char *, struct roffsu *); |
extern int getsubopt(char **, char * const *, char **); |
static void print_byte(struct html *, char); |
#endif |
static void print_endword(struct html *); |
|
static void print_indent(struct html *); |
|
static void print_word(struct html *, const char *); |
|
|
|
static void print_ctag(struct html *, struct tag *); |
|
static int print_escape(struct html *, char); |
|
static int print_encode(struct html *, const char *, const char *, int); |
|
static void print_href(struct html *, const char *, const char *, int); |
|
static void print_metaf(struct html *, enum mandoc_esc); |
|
|
static void print_spec(struct html *, const char *, int); |
|
static void print_res(struct html *, const char *, int); |
|
static void print_ctag(struct html *, enum htmltag); |
|
static void print_encode(struct html *, const char *); |
|
|
|
|
|
void * |
void * |
html_alloc(char *outopts) |
html_alloc(const struct manoutput *outopts) |
{ |
{ |
struct html *h; |
struct html *h; |
const char *toks[4]; |
|
char *v; |
|
|
|
toks[0] = "style"; |
h = mandoc_calloc(1, sizeof(struct html)); |
toks[1] = "man"; |
|
toks[2] = "includes"; |
|
toks[3] = NULL; |
|
|
|
h = calloc(1, sizeof(struct html)); |
h->tag = NULL; |
if (NULL == h) { |
h->style = outopts->style; |
perror(NULL); |
h->base_man = outopts->man; |
exit(EXIT_FAILURE); |
h->base_includes = outopts->includes; |
} |
if (outopts->fragment) |
|
h->oflags |= HTML_FRAGMENT; |
|
|
h->tags.head = NULL; |
return h; |
h->ords.head = NULL; |
|
h->symtab = chars_init(CHARS_HTML); |
|
|
|
while (outopts && *outopts) |
|
switch (getsubopt(&outopts, UNCONST(toks), &v)) { |
|
case (0): |
|
h->style = v; |
|
break; |
|
case (1): |
|
h->base_man = v; |
|
break; |
|
case (2): |
|
h->base_includes = v; |
|
break; |
|
default: |
|
break; |
|
} |
|
|
|
return(h); |
|
} |
} |
|
|
|
|
void |
void |
html_free(void *p) |
html_free(void *p) |
{ |
{ |
struct tag *tag; |
struct tag *tag; |
struct ord *ord; |
|
struct html *h; |
struct html *h; |
|
|
h = (struct html *)p; |
h = (struct html *)p; |
|
|
while ((ord = h->ords.head) != NULL) { |
while ((tag = h->tag) != NULL) { |
h->ords.head = ord->next; |
h->tag = tag->next; |
free(ord); |
|
} |
|
|
|
while ((tag = h->tags.head) != NULL) { |
|
h->tags.head = tag->next; |
|
free(tag); |
free(tag); |
} |
} |
|
|
if (h->symtab) |
|
chars_free(h->symtab); |
|
|
|
free(h); |
free(h); |
} |
} |
|
|
|
|
void |
void |
print_gen_head(struct html *h) |
print_gen_head(struct html *h) |
{ |
{ |
struct htmlpair tag[4]; |
struct tag *t; |
|
|
tag[0].key = ATTR_HTTPEQUIV; |
print_otag(h, TAG_META, "?", "charset", "utf-8"); |
tag[0].val = "Content-Type"; |
|
tag[1].key = ATTR_CONTENT; |
|
tag[1].val = "text/html; charset=utf-8"; |
|
print_otag(h, TAG_META, 2, tag); |
|
|
|
tag[0].key = ATTR_NAME; |
/* |
tag[0].val = "resource-type"; |
* Print a default style-sheet. |
tag[1].key = ATTR_CONTENT; |
*/ |
tag[1].val = "document"; |
|
print_otag(h, TAG_META, 2, tag); |
|
|
|
if (h->style) { |
t = print_otag(h, TAG_STYLE, ""); |
tag[0].key = ATTR_REL; |
print_text(h, "table.head, table.foot { width: 100%; }"); |
tag[0].val = "stylesheet"; |
print_endline(h); |
tag[1].key = ATTR_HREF; |
print_text(h, "td.head-rtitle, td.foot-os { text-align: right; }"); |
tag[1].val = h->style; |
print_endline(h); |
tag[2].key = ATTR_TYPE; |
print_text(h, "td.head-vol { text-align: center; }"); |
tag[2].val = "text/css"; |
print_endline(h); |
tag[3].key = ATTR_MEDIA; |
print_text(h, "div.Pp { margin: 1ex 0ex; }"); |
tag[3].val = "all"; |
print_tagq(h, t); |
print_otag(h, TAG_LINK, 4, tag); |
|
} |
if (h->style) |
|
print_otag(h, TAG_LINK, "?h??", "rel", "stylesheet", |
|
h->style, "type", "text/css", "media", "all"); |
} |
} |
|
|
|
|
static void |
static void |
print_spec(struct html *h, const char *p, int len) |
print_metaf(struct html *h, enum mandoc_esc deco) |
{ |
{ |
const char *rhs; |
enum htmlfont font; |
size_t sz; |
|
|
|
rhs = chars_a2ascii(h->symtab, p, (size_t)len, &sz); |
switch (deco) { |
|
case ESCAPE_FONTPREV: |
|
font = h->metal; |
|
break; |
|
case ESCAPE_FONTITALIC: |
|
font = HTMLFONT_ITALIC; |
|
break; |
|
case ESCAPE_FONTBOLD: |
|
font = HTMLFONT_BOLD; |
|
break; |
|
case ESCAPE_FONTBI: |
|
font = HTMLFONT_BI; |
|
break; |
|
case ESCAPE_FONT: |
|
case ESCAPE_FONTROMAN: |
|
font = HTMLFONT_NONE; |
|
break; |
|
default: |
|
abort(); |
|
} |
|
|
if (NULL == rhs) |
if (h->metaf) { |
return; |
print_tagq(h, h->metaf); |
fwrite(rhs, 1, sz, stdout); |
h->metaf = NULL; |
} |
} |
|
|
|
h->metal = h->metac; |
|
h->metac = font; |
|
|
static void |
switch (font) { |
print_res(struct html *h, const char *p, int len) |
case HTMLFONT_ITALIC: |
|
h->metaf = print_otag(h, TAG_I, ""); |
|
break; |
|
case HTMLFONT_BOLD: |
|
h->metaf = print_otag(h, TAG_B, ""); |
|
break; |
|
case HTMLFONT_BI: |
|
h->metaf = print_otag(h, TAG_B, ""); |
|
print_otag(h, TAG_I, ""); |
|
break; |
|
default: |
|
break; |
|
} |
|
} |
|
|
|
int |
|
html_strlen(const char *cp) |
{ |
{ |
const char *rhs; |
size_t rsz; |
size_t sz; |
int skip, sz; |
|
|
rhs = chars_a2res(h->symtab, p, (size_t)len, &sz); |
/* |
|
* Account for escaped sequences within string length |
|
* calculations. This follows the logic in term_strlen() as we |
|
* must calculate the width of produced strings. |
|
* Assume that characters are always width of "1". This is |
|
* hacky, but it gets the job done for approximation of widths. |
|
*/ |
|
|
if (NULL == rhs) |
sz = 0; |
return; |
skip = 0; |
fwrite(rhs, 1, sz, stdout); |
while (1) { |
|
rsz = strcspn(cp, "\\"); |
|
if (rsz) { |
|
cp += rsz; |
|
if (skip) { |
|
skip = 0; |
|
rsz--; |
|
} |
|
sz += rsz; |
|
} |
|
if ('\0' == *cp) |
|
break; |
|
cp++; |
|
switch (mandoc_escape(&cp, NULL, NULL)) { |
|
case ESCAPE_ERROR: |
|
return sz; |
|
case ESCAPE_UNICODE: |
|
case ESCAPE_NUMBERED: |
|
case ESCAPE_SPECIAL: |
|
case ESCAPE_OVERSTRIKE: |
|
if (skip) |
|
skip = 0; |
|
else |
|
sz++; |
|
break; |
|
case ESCAPE_SKIPCHAR: |
|
skip = 1; |
|
break; |
|
default: |
|
break; |
|
} |
|
} |
|
return sz; |
} |
} |
|
|
|
static int |
|
print_escape(struct html *h, char c) |
|
{ |
|
|
static void |
switch (c) { |
print_encode(struct html *h, const char *p) |
case '<': |
|
print_word(h, "<"); |
|
break; |
|
case '>': |
|
print_word(h, ">"); |
|
break; |
|
case '&': |
|
print_word(h, "&"); |
|
break; |
|
case '"': |
|
print_word(h, """); |
|
break; |
|
case ASCII_NBRSP: |
|
print_word(h, " "); |
|
break; |
|
case ASCII_HYPH: |
|
print_byte(h, '-'); |
|
break; |
|
case ASCII_BREAK: |
|
break; |
|
default: |
|
return 0; |
|
} |
|
return 1; |
|
} |
|
|
|
static int |
|
print_encode(struct html *h, const char *p, const char *pend, int norecurse) |
{ |
{ |
|
char numbuf[16]; |
size_t sz; |
size_t sz; |
int len; |
int c, len, nospace; |
const char *seq; |
const char *seq; |
enum roffdeco deco; |
enum mandoc_esc esc; |
|
static const char rejs[9] = { '\\', '<', '>', '&', '"', |
|
ASCII_NBRSP, ASCII_HYPH, ASCII_BREAK, '\0' }; |
|
|
for (; *p; p++) { |
if (pend == NULL) |
sz = strcspn(p, "\\<>&"); |
pend = strchr(p, '\0'); |
|
|
fwrite(p, 1, sz, stdout); |
nospace = 0; |
p += /* LINTED */ |
|
sz; |
|
|
|
if ('<' == *p) { |
while (p < pend) { |
printf("<"); |
if (HTML_SKIPCHAR & h->flags && '\\' != *p) { |
|
h->flags &= ~HTML_SKIPCHAR; |
|
p++; |
continue; |
continue; |
} else if ('>' == *p) { |
} |
printf(">"); |
|
|
for (sz = strcspn(p, rejs); sz-- && p < pend; p++) |
|
if (*p == ' ') |
|
print_endword(h); |
|
else |
|
print_byte(h, *p); |
|
|
|
if (p >= pend) |
|
break; |
|
|
|
if (print_escape(h, *p++)) |
continue; |
continue; |
} else if ('&' == *p) { |
|
printf("&"); |
esc = mandoc_escape(&p, &seq, &len); |
|
if (ESCAPE_ERROR == esc) |
|
break; |
|
|
|
switch (esc) { |
|
case ESCAPE_FONT: |
|
case ESCAPE_FONTPREV: |
|
case ESCAPE_FONTBOLD: |
|
case ESCAPE_FONTITALIC: |
|
case ESCAPE_FONTBI: |
|
case ESCAPE_FONTROMAN: |
|
if (0 == norecurse) |
|
print_metaf(h, esc); |
continue; |
continue; |
} else if ('\0' == *p) |
case ESCAPE_SKIPCHAR: |
|
h->flags |= HTML_SKIPCHAR; |
|
continue; |
|
default: |
break; |
break; |
|
} |
|
|
seq = ++p; |
if (h->flags & HTML_SKIPCHAR) { |
len = a2roffdeco(&deco, &seq, &sz); |
h->flags &= ~HTML_SKIPCHAR; |
|
continue; |
|
} |
|
|
switch (deco) { |
switch (esc) { |
case (DECO_RESERVED): |
case ESCAPE_UNICODE: |
print_res(h, seq, sz); |
/* Skip past "u" header. */ |
|
c = mchars_num2uc(seq + 1, len - 1); |
break; |
break; |
case (DECO_SPECIAL): |
case ESCAPE_NUMBERED: |
print_spec(h, seq, sz); |
c = mchars_num2char(seq, len); |
|
if (c < 0) |
|
continue; |
break; |
break; |
default: |
case ESCAPE_SPECIAL: |
|
c = mchars_spec2cp(seq, len); |
|
if (c <= 0) |
|
continue; |
break; |
break; |
|
case ESCAPE_NOSPACE: |
|
if ('\0' == *p) |
|
nospace = 1; |
|
continue; |
|
case ESCAPE_OVERSTRIKE: |
|
if (len == 0) |
|
continue; |
|
c = seq[len - 1]; |
|
break; |
|
default: |
|
continue; |
} |
} |
|
if ((c < 0x20 && c != 0x09) || |
p += len - 1; |
(c > 0x7E && c < 0xA0)) |
|
c = 0xFFFD; |
|
if (c > 0x7E) { |
|
(void)snprintf(numbuf, sizeof(numbuf), "&#%d;", c); |
|
print_word(h, numbuf); |
|
} else if (print_escape(h, c) == 0) |
|
print_byte(h, c); |
} |
} |
|
|
|
return nospace; |
} |
} |
|
|
|
static void |
|
print_href(struct html *h, const char *name, const char *sec, int man) |
|
{ |
|
const char *p, *pp; |
|
|
|
pp = man ? h->base_man : h->base_includes; |
|
while ((p = strchr(pp, '%')) != NULL) { |
|
print_encode(h, pp, p, 1); |
|
if (man && p[1] == 'S') { |
|
if (sec == NULL) |
|
print_byte(h, '1'); |
|
else |
|
print_encode(h, sec, NULL, 1); |
|
} else if ((man && p[1] == 'N') || |
|
(man == 0 && p[1] == 'I')) |
|
print_encode(h, name, NULL, 1); |
|
else |
|
print_encode(h, p, p + 2, 1); |
|
pp = p + 2; |
|
} |
|
if (*pp != '\0') |
|
print_encode(h, pp, NULL, 1); |
|
} |
|
|
struct tag * |
struct tag * |
print_otag(struct html *h, enum htmltag tag, |
print_otag(struct html *h, enum htmltag tag, const char *fmt, ...) |
int sz, const struct htmlpair *p) |
|
{ |
{ |
int i; |
va_list ap; |
|
struct roffsu mysu, *su; |
|
char numbuf[16]; |
struct tag *t; |
struct tag *t; |
|
const char *attr; |
|
char *arg1, *arg2; |
|
double v; |
|
int i, have_style, tflags; |
|
|
if ( ! (HTML_NOSTACK & htmltags[tag].flags)) { |
tflags = htmltags[tag].flags; |
t = malloc(sizeof(struct tag)); |
|
if (NULL == t) { |
/* Push this tag onto the stack of open scopes. */ |
perror(NULL); |
|
exit(EXIT_FAILURE); |
if ((tflags & HTML_NOSTACK) == 0) { |
} |
t = mandoc_malloc(sizeof(struct tag)); |
t->tag = tag; |
t->tag = tag; |
t->next = h->tags.head; |
t->next = h->tag; |
h->tags.head = t; |
h->tag = t; |
} else |
} else |
t = NULL; |
t = NULL; |
|
|
if ( ! (HTML_NOSPACE & h->flags)) |
if (tflags & HTML_NLBEFORE) |
if ( ! (HTML_CLRLINE & htmltags[tag].flags)) |
print_endline(h); |
putchar(' '); |
if (h->col == 0) |
|
print_indent(h); |
printf("<%s", htmltags[tag].name); |
else if ((h->flags & HTML_NOSPACE) == 0) { |
for (i = 0; i < sz; i++) { |
if (h->flags & HTML_KEEP) |
printf(" %s=\"", htmlattrs[p[i].key]); |
print_word(h, " "); |
assert(p->val); |
else { |
print_encode(h, p[i].val); |
if (h->flags & HTML_PREKEEP) |
putchar('\"'); |
h->flags |= HTML_KEEP; |
|
print_endword(h); |
|
} |
} |
} |
putchar('>'); |
|
|
|
h->flags |= HTML_NOSPACE; |
if ( ! (h->flags & HTML_NONOSPACE)) |
if (HTML_CLRLINE & htmltags[tag].flags) |
h->flags &= ~HTML_NOSPACE; |
h->flags |= HTML_NEWLINE; |
|
else |
else |
h->flags &= ~HTML_NEWLINE; |
h->flags |= HTML_NOSPACE; |
|
|
return(t); |
/* Print out the tag name and attributes. */ |
} |
|
|
|
|
print_byte(h, '<'); |
|
print_word(h, htmltags[tag].name); |
|
|
/* ARGSUSED */ |
va_start(ap, fmt); |
static void |
|
print_ctag(struct html *h, enum htmltag tag) |
|
{ |
|
|
|
printf("</%s>", htmltags[tag].name); |
|
if (HTML_CLRLINE & htmltags[tag].flags) { |
|
h->flags |= HTML_NOSPACE; |
|
h->flags |= HTML_NEWLINE; |
|
putchar('\n'); |
|
} else |
|
h->flags &= ~HTML_NEWLINE; |
|
} |
|
|
|
|
have_style = 0; |
|
while (*fmt != '\0') { |
|
if (*fmt == 's') { |
|
have_style = 1; |
|
fmt++; |
|
break; |
|
} |
|
|
/* ARGSUSED */ |
/* Parse a non-style attribute and its arguments. */ |
void |
|
print_gen_doctype(struct html *h) |
|
{ |
|
|
|
printf("<!DOCTYPE HTML PUBLIC \"%s\" \"%s\">", DOCTYPE, DTD); |
|
} |
|
|
|
|
arg1 = va_arg(ap, char *); |
|
switch (*fmt++) { |
|
case 'c': |
|
attr = "class"; |
|
break; |
|
case 'h': |
|
attr = "href"; |
|
break; |
|
case 'i': |
|
attr = "id"; |
|
break; |
|
case '?': |
|
attr = arg1; |
|
arg1 = va_arg(ap, char *); |
|
break; |
|
default: |
|
abort(); |
|
} |
|
arg2 = NULL; |
|
if (*fmt == 'M') |
|
arg2 = va_arg(ap, char *); |
|
if (arg1 == NULL) |
|
continue; |
|
|
void |
/* Print the non-style attributes. */ |
print_text(struct html *h, const char *p) |
|
{ |
|
|
|
if (*p && 0 == *(p + 1)) |
print_byte(h, ' '); |
switch (*p) { |
print_word(h, attr); |
case('.'): |
print_byte(h, '='); |
/* FALLTHROUGH */ |
print_byte(h, '"'); |
case(','): |
switch (*fmt) { |
/* FALLTHROUGH */ |
case 'M': |
case(';'): |
print_href(h, arg1, arg2, 1); |
/* FALLTHROUGH */ |
fmt++; |
case(':'): |
|
/* FALLTHROUGH */ |
|
case('?'): |
|
/* FALLTHROUGH */ |
|
case('!'): |
|
/* FALLTHROUGH */ |
|
case(')'): |
|
/* FALLTHROUGH */ |
|
case(']'): |
|
/* FALLTHROUGH */ |
|
case('}'): |
|
if ( ! (HTML_IGNDELIM & h->flags)) |
|
h->flags |= HTML_NOSPACE; |
|
break; |
break; |
|
case 'I': |
|
print_href(h, arg1, NULL, 0); |
|
fmt++; |
|
break; |
|
case 'R': |
|
print_byte(h, '#'); |
|
fmt++; |
|
/* FALLTHROUGH */ |
default: |
default: |
|
print_encode(h, arg1, NULL, 1); |
break; |
break; |
} |
} |
|
print_byte(h, '"'); |
|
} |
|
|
if ( ! (h->flags & HTML_NOSPACE)) |
/* Print out styles. */ |
putchar(' '); |
|
|
|
h->flags &= ~HTML_NOSPACE; |
while (*fmt != '\0') { |
h->flags &= ~HTML_NEWLINE; |
arg1 = NULL; |
|
su = NULL; |
|
|
if (p) |
/* First letter: input argument type. */ |
print_encode(h, p); |
|
|
|
if (*p && 0 == *(p + 1)) |
switch (*fmt++) { |
switch (*p) { |
case 'h': |
case('('): |
i = va_arg(ap, int); |
/* FALLTHROUGH */ |
su = &mysu; |
case('['): |
SCALE_HS_INIT(su, i); |
/* FALLTHROUGH */ |
|
case('{'): |
|
h->flags |= HTML_NOSPACE; |
|
break; |
break; |
default: |
case 's': |
|
arg1 = va_arg(ap, char *); |
break; |
break; |
|
case 'u': |
|
su = va_arg(ap, struct roffsu *); |
|
break; |
|
case 'v': |
|
i = va_arg(ap, int); |
|
su = &mysu; |
|
SCALE_VS_INIT(su, i); |
|
break; |
|
case 'w': |
|
case 'W': |
|
if ((arg2 = va_arg(ap, char *)) == NULL) |
|
break; |
|
su = &mysu; |
|
a2width(arg2, su); |
|
if (fmt[-1] == 'W') |
|
su->scale *= -1.0; |
|
break; |
|
default: |
|
abort(); |
} |
} |
} |
|
|
|
|
/* Second letter: style name. */ |
|
|
void |
switch (*fmt++) { |
print_tagq(struct html *h, const struct tag *until) |
case 'b': |
{ |
attr = "margin-bottom"; |
struct tag *tag; |
break; |
|
case 'h': |
|
attr = "height"; |
|
break; |
|
case 'i': |
|
attr = "text-indent"; |
|
break; |
|
case 'l': |
|
attr = "margin-left"; |
|
break; |
|
case 't': |
|
attr = "margin-top"; |
|
break; |
|
case 'w': |
|
attr = "width"; |
|
break; |
|
case 'W': |
|
attr = "min-width"; |
|
break; |
|
case '?': |
|
attr = arg1; |
|
arg1 = va_arg(ap, char *); |
|
break; |
|
default: |
|
abort(); |
|
} |
|
if (su == NULL && arg1 == NULL) |
|
continue; |
|
|
while ((tag = h->tags.head) != NULL) { |
if (have_style == 1) |
print_ctag(h, tag->tag); |
print_word(h, " style=\""); |
h->tags.head = tag->next; |
else |
free(tag); |
print_byte(h, ' '); |
if (until && tag == until) |
print_word(h, attr); |
return; |
print_byte(h, ':'); |
|
print_byte(h, ' '); |
|
if (su != NULL) { |
|
v = su->scale; |
|
if (su->unit == SCALE_MM && (v /= 100.0) == 0.0) |
|
v = 1.0; |
|
else if (su->unit == SCALE_BU) |
|
v /= 24.0; |
|
(void)snprintf(numbuf, sizeof(numbuf), "%.2f", v); |
|
print_word(h, numbuf); |
|
print_word(h, roffscales[su->unit]); |
|
} else |
|
print_word(h, arg1); |
|
print_byte(h, ';'); |
|
have_style = 2; |
} |
} |
} |
if (have_style == 2) |
|
print_byte(h, '"'); |
|
|
|
va_end(ap); |
|
|
void |
/* Accommodate for "well-formed" singleton escaping. */ |
print_stagq(struct html *h, const struct tag *suntil) |
|
{ |
|
struct tag *tag; |
|
|
|
while ((tag = h->tags.head) != NULL) { |
if (HTML_AUTOCLOSE & htmltags[tag].flags) |
if (suntil && tag == suntil) |
print_byte(h, '/'); |
return; |
|
print_ctag(h, tag->tag); |
|
h->tags.head = tag->next; |
|
free(tag); |
|
} |
|
} |
|
|
|
|
print_byte(h, '>'); |
|
|
void |
if (tflags & HTML_NLBEGIN) |
bufinit(struct html *h) |
print_endline(h); |
{ |
else |
|
h->flags |= HTML_NOSPACE; |
|
|
h->buf[0] = '\0'; |
if (tflags & HTML_INDENT) |
h->buflen = 0; |
h->indent++; |
|
if (tflags & HTML_NOINDENT) |
|
h->noindent++; |
|
|
|
return t; |
} |
} |
|
|
|
static void |
void |
print_ctag(struct html *h, struct tag *tag) |
bufcat_style(struct html *h, const char *key, const char *val) |
|
{ |
{ |
|
int tflags; |
|
|
bufcat(h, key); |
/* |
bufncat(h, ":", 1); |
* Remember to close out and nullify the current |
bufcat(h, val); |
* meta-font and table, if applicable. |
bufncat(h, ";", 1); |
*/ |
} |
if (tag == h->metaf) |
|
h->metaf = NULL; |
|
if (tag == h->tblt) |
|
h->tblt = NULL; |
|
|
|
tflags = htmltags[tag->tag].flags; |
|
|
void |
if (tflags & HTML_INDENT) |
bufcat(struct html *h, const char *p) |
h->indent--; |
{ |
if (tflags & HTML_NOINDENT) |
|
h->noindent--; |
|
if (tflags & HTML_NLEND) |
|
print_endline(h); |
|
print_indent(h); |
|
print_byte(h, '<'); |
|
print_byte(h, '/'); |
|
print_word(h, htmltags[tag->tag].name); |
|
print_byte(h, '>'); |
|
if (tflags & HTML_NLAFTER) |
|
print_endline(h); |
|
|
bufncat(h, p, strlen(p)); |
h->tag = tag->next; |
|
free(tag); |
} |
} |
|
|
|
|
void |
void |
buffmt(struct html *h, const char *fmt, ...) |
print_gen_decls(struct html *h) |
{ |
{ |
va_list ap; |
print_word(h, "<!DOCTYPE html>"); |
|
print_endline(h); |
va_start(ap, fmt); |
|
(void)vsnprintf(h->buf + (int)h->buflen, |
|
BUFSIZ - h->buflen - 1, fmt, ap); |
|
va_end(ap); |
|
h->buflen = strlen(h->buf); |
|
} |
} |
|
|
|
|
void |
void |
bufncat(struct html *h, const char *p, size_t sz) |
print_text(struct html *h, const char *word) |
{ |
{ |
|
if (h->col && (h->flags & HTML_NOSPACE) == 0) { |
|
if ( ! (HTML_KEEP & h->flags)) { |
|
if (HTML_PREKEEP & h->flags) |
|
h->flags |= HTML_KEEP; |
|
print_endword(h); |
|
} else |
|
print_word(h, " "); |
|
} |
|
|
if (h->buflen + sz > BUFSIZ - 1) |
assert(NULL == h->metaf); |
sz = BUFSIZ - 1 - h->buflen; |
switch (h->metac) { |
|
case HTMLFONT_ITALIC: |
|
h->metaf = print_otag(h, TAG_I, ""); |
|
break; |
|
case HTMLFONT_BOLD: |
|
h->metaf = print_otag(h, TAG_B, ""); |
|
break; |
|
case HTMLFONT_BI: |
|
h->metaf = print_otag(h, TAG_B, ""); |
|
print_otag(h, TAG_I, ""); |
|
break; |
|
default: |
|
print_indent(h); |
|
break; |
|
} |
|
|
(void)strncat(h->buf, p, sz); |
assert(word); |
h->buflen += sz; |
if ( ! print_encode(h, word, NULL, 0)) { |
} |
if ( ! (h->flags & HTML_NONOSPACE)) |
|
h->flags &= ~HTML_NOSPACE; |
|
h->flags &= ~HTML_NONEWLINE; |
|
} else |
|
h->flags |= HTML_NOSPACE | HTML_NONEWLINE; |
|
|
|
if (h->metaf) { |
|
print_tagq(h, h->metaf); |
|
h->metaf = NULL; |
|
} |
|
|
|
h->flags &= ~HTML_IGNDELIM; |
|
} |
|
|
void |
void |
buffmt_includes(struct html *h, const char *name) |
print_tagq(struct html *h, const struct tag *until) |
{ |
{ |
const char *p, *pp; |
struct tag *tag; |
|
|
pp = h->base_includes; |
while ((tag = h->tag) != NULL) { |
|
print_ctag(h, tag); |
while (NULL != (p = strchr(pp, '%'))) { |
if (until && tag == until) |
bufncat(h, pp, (size_t)(p - pp)); |
return; |
switch (*(p + 1)) { |
|
case('I'): |
|
bufcat(h, name); |
|
break; |
|
default: |
|
bufncat(h, p, 2); |
|
break; |
|
} |
|
pp = p + 2; |
|
} |
} |
if (pp) |
|
bufcat(h, pp); |
|
} |
} |
|
|
|
|
void |
void |
buffmt_man(struct html *h, |
print_stagq(struct html *h, const struct tag *suntil) |
const char *name, const char *sec) |
|
{ |
{ |
const char *p, *pp; |
struct tag *tag; |
|
|
pp = h->base_man; |
while ((tag = h->tag) != NULL) { |
|
if (suntil && tag == suntil) |
/* LINTED */ |
return; |
while (NULL != (p = strchr(pp, '%'))) { |
print_ctag(h, tag); |
bufncat(h, pp, (size_t)(p - pp)); |
|
switch (*(p + 1)) { |
|
case('S'): |
|
bufcat(h, sec ? sec : "1"); |
|
break; |
|
case('N'): |
|
buffmt(h, name); |
|
break; |
|
default: |
|
bufncat(h, p, 2); |
|
break; |
|
} |
|
pp = p + 2; |
|
} |
} |
if (pp) |
|
bufcat(h, pp); |
|
} |
} |
|
|
|
|
void |
void |
bufcat_su(struct html *h, const char *p, const struct roffsu *su) |
print_paragraph(struct html *h) |
{ |
{ |
double v; |
struct tag *t; |
const char *u; |
|
|
|
v = su->scale; |
t = print_otag(h, TAG_DIV, "c", "Pp"); |
|
print_tagq(h, t); |
|
} |
|
|
switch (su->unit) { |
|
case (SCALE_CM): |
/*********************************************************************** |
u = "cm"; |
* Low level output functions. |
break; |
* They implement line breaking using a short static buffer. |
case (SCALE_IN): |
***********************************************************************/ |
u = "in"; |
|
break; |
/* |
case (SCALE_PC): |
* Buffer one HTML output byte. |
u = "pc"; |
* If the buffer is full, flush and deactivate it and start a new line. |
break; |
* If the buffer is inactive, print directly. |
case (SCALE_PT): |
*/ |
u = "pt"; |
static void |
break; |
print_byte(struct html *h, char c) |
case (SCALE_EM): |
{ |
u = "em"; |
if ((h->flags & HTML_BUFFER) == 0) { |
break; |
putchar(c); |
case (SCALE_MM): |
h->col++; |
if (0 == (v /= 100)) |
return; |
v = 1; |
|
u = "em"; |
|
break; |
|
case (SCALE_EN): |
|
u = "ex"; |
|
break; |
|
case (SCALE_BU): |
|
u = "ex"; |
|
break; |
|
case (SCALE_VS): |
|
u = "em"; |
|
break; |
|
default: |
|
u = "ex"; |
|
break; |
|
} |
} |
|
|
if (su->pt) |
if (h->col + h->bufcol < sizeof(h->buf)) { |
buffmt(h, "%s: %f%s;", p, v, u); |
h->buf[h->bufcol++] = c; |
else |
return; |
/* LINTED */ |
} |
buffmt(h, "%s: %d%s;", p, (int)v, u); |
|
|
putchar('\n'); |
|
h->col = 0; |
|
print_indent(h); |
|
putchar(' '); |
|
putchar(' '); |
|
fwrite(h->buf, h->bufcol, 1, stdout); |
|
putchar(c); |
|
h->col = (h->indent + 1) * 2 + h->bufcol + 1; |
|
h->bufcol = 0; |
|
h->flags &= ~HTML_BUFFER; |
} |
} |
|
|
|
/* |
|
* If something was printed on the current output line, end it. |
|
* Not to be called right after print_indent(). |
|
*/ |
void |
void |
html_idcat(char *dst, const char *src, int sz) |
print_endline(struct html *h) |
{ |
{ |
int ssz; |
if (h->col == 0) |
|
return; |
|
|
assert(sz); |
if (h->bufcol) { |
|
putchar(' '); |
|
fwrite(h->buf, h->bufcol, 1, stdout); |
|
h->bufcol = 0; |
|
} |
|
putchar('\n'); |
|
h->col = 0; |
|
h->flags |= HTML_NOSPACE; |
|
h->flags &= ~HTML_BUFFER; |
|
} |
|
|
/* Cf. <http://www.w3.org/TR/html4/types.html#h-6.2>. */ |
/* |
|
* Flush the HTML output buffer. |
|
* If it is inactive, activate it. |
|
*/ |
|
static void |
|
print_endword(struct html *h) |
|
{ |
|
if (h->noindent) { |
|
print_byte(h, ' '); |
|
return; |
|
} |
|
|
for ( ; *dst != '\0' && sz; dst++, sz--) |
if ((h->flags & HTML_BUFFER) == 0) { |
/* Jump to end. */ ; |
h->col++; |
|
h->flags |= HTML_BUFFER; |
|
} else if (h->bufcol) { |
|
putchar(' '); |
|
fwrite(h->buf, h->bufcol, 1, stdout); |
|
h->col += h->bufcol + 1; |
|
} |
|
h->bufcol = 0; |
|
} |
|
|
assert(sz > 2); |
/* |
|
* If at the beginning of a new output line, |
|
* perform indentation and mark the line as containing output. |
|
* Make sure to really produce some output right afterwards, |
|
* but do not use print_otag() for producing it. |
|
*/ |
|
static void |
|
print_indent(struct html *h) |
|
{ |
|
size_t i; |
|
|
/* We can't start with a number (bah). */ |
if (h->col) |
|
return; |
|
|
*dst++ = 'x'; |
if (h->noindent == 0) { |
*dst = '\0'; |
h->col = h->indent * 2; |
sz--; |
for (i = 0; i < h->col; i++) |
|
putchar(' '); |
for ( ; *src != '\0' && sz > 1; src++) { |
|
ssz = snprintf(dst, (size_t)sz, "%.2x", *src); |
|
sz -= ssz; |
|
dst += ssz; |
|
} |
} |
|
h->flags &= ~HTML_NOSPACE; |
|
} |
|
|
|
/* |
|
* Print or buffer some characters |
|
* depending on the current HTML output buffer state. |
|
*/ |
|
static void |
|
print_word(struct html *h, const char *cp) |
|
{ |
|
while (*cp != '\0') |
|
print_byte(h, *cp++); |
|
} |
|
|
|
/* |
|
* Calculate the scaling unit passed in a `-width' argument. This uses |
|
* either a native scaling unit (e.g., 1i, 2m) or the string length of |
|
* the value. |
|
*/ |
|
static void |
|
a2width(const char *p, struct roffsu *su) |
|
{ |
|
if (a2roffsu(p, su, SCALE_MAX) < 2) { |
|
su->unit = SCALE_EN; |
|
su->scale = html_strlen(p); |
|
} else if (su->scale < 0.0) |
|
su->scale = 0.0; |
} |
} |