version 1.51, 2009/09/21 14:56:56 |
version 1.82, 2009/11/09 05:11:46 |
|
|
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
*/ |
*/ |
#include <sys/types.h> |
#include <sys/types.h> |
#include <sys/queue.h> |
|
|
|
#include <assert.h> |
#include <assert.h> |
#include <err.h> |
#include <ctype.h> |
|
#include <stdarg.h> |
#include <stdio.h> |
#include <stdio.h> |
|
#include <stdint.h> |
#include <stdlib.h> |
#include <stdlib.h> |
#include <string.h> |
#include <string.h> |
#include <unistd.h> |
#include <unistd.h> |
|
|
|
#include "out.h" |
#include "chars.h" |
#include "chars.h" |
#include "html.h" |
#include "html.h" |
|
#include "main.h" |
|
|
|
#define UNCONST(a) ((void *)(uintptr_t)(const void *)(a)) |
|
|
#define DOCTYPE "-//W3C//DTD HTML 4.01//EN" |
#define DOCTYPE "-//W3C//DTD HTML 4.01//EN" |
#define DTD "http://www.w3.org/TR/html4/strict.dtd" |
#define DTD "http://www.w3.org/TR/html4/strict.dtd" |
|
|
struct htmldata { |
struct htmldata { |
char *name; |
const char *name; |
int flags; |
int flags; |
#define HTML_CLRLINE (1 << 0) |
#define HTML_CLRLINE (1 << 0) |
#define HTML_NOSTACK (1 << 1) |
#define HTML_NOSTACK (1 << 1) |
Line 61 static const struct htmldata htmltags[TAG_MAX] = { |
|
Line 66 static const struct htmldata htmltags[TAG_MAX] = { |
|
{"base", HTML_CLRLINE | HTML_NOSTACK}, /* TAG_BASE */ |
{"base", HTML_CLRLINE | HTML_NOSTACK}, /* TAG_BASE */ |
}; |
}; |
|
|
static const char *const htmlattrs[ATTR_MAX] = { |
static const char *const htmlattrs[ATTR_MAX] = { |
"http-equiv", |
"http-equiv", |
"content", |
"content", |
"name", |
"name", |
Line 73 static const char *const htmlattrs[ATTR_MAX] = { |
|
Line 78 static const char *const htmlattrs[ATTR_MAX] = { |
|
"style", |
"style", |
"width", |
"width", |
"valign", |
"valign", |
|
"target", |
|
"id", |
|
"summary", |
}; |
}; |
|
|
#ifdef __linux__ |
#ifdef __linux__ |
extern int getsubopt(char **, char * const *, char **); |
extern int getsubopt(char **, char * const *, char **); |
#endif |
#endif |
|
|
|
|
|
static void print_spec(struct html *, const char *, int); |
|
static void print_res(struct html *, const char *, int); |
|
static void print_ctag(struct html *, enum htmltag); |
|
static void print_encode(struct html *, const char *); |
|
|
|
|
void * |
void * |
html_alloc(char *outopts) |
html_alloc(char *outopts) |
{ |
{ |
struct html *h; |
struct html *h; |
char *toks[3], *v; |
const char *toks[4]; |
|
char *v; |
|
|
toks[0] = "style"; |
toks[0] = "style"; |
toks[1] = "base"; |
toks[1] = "man"; |
toks[2] = NULL; |
toks[2] = "includes"; |
|
toks[3] = NULL; |
|
|
if (NULL == (h = calloc(1, sizeof(struct html)))) |
h = calloc(1, sizeof(struct html)); |
return(NULL); |
if (NULL == h) { |
|
perror(NULL); |
SLIST_INIT(&h->tags); |
exit(EXIT_FAILURE); |
SLIST_INIT(&h->ords); |
|
|
|
if (NULL == (h->symtab = chars_init(CHARS_HTML))) { |
|
free(h); |
|
return(NULL); |
|
} |
} |
|
|
|
h->tags.head = NULL; |
|
h->ords.head = NULL; |
|
h->symtab = chars_init(CHARS_HTML); |
|
|
while (outopts && *outopts) |
while (outopts && *outopts) |
switch (getsubopt(&outopts, toks, &v)) { |
switch (getsubopt(&outopts, UNCONST(toks), &v)) { |
case (0): |
case (0): |
h->style = v; |
h->style = v; |
break; |
break; |
case (1): |
case (1): |
h->base = v; |
h->base_man = v; |
break; |
break; |
|
case (2): |
|
h->base_includes = v; |
|
break; |
default: |
default: |
break; |
break; |
} |
} |
Line 125 html_free(void *p) |
|
Line 144 html_free(void *p) |
|
|
|
h = (struct html *)p; |
h = (struct html *)p; |
|
|
while ( ! SLIST_EMPTY(&h->ords)) { |
while ((ord = h->ords.head) != NULL) { |
ord = SLIST_FIRST(&h->ords); |
h->ords.head = ord->next; |
SLIST_REMOVE_HEAD(&h->ords, entry); |
|
free(ord); |
free(ord); |
} |
} |
|
|
while ( ! SLIST_EMPTY(&h->tags)) { |
while ((tag = h->tags.head) != NULL) { |
tag = SLIST_FIRST(&h->tags); |
h->tags.head = tag->next; |
SLIST_REMOVE_HEAD(&h->tags, entry); |
|
free(tag); |
free(tag); |
} |
} |
|
|
if (h->symtab) |
if (h->symtab) |
chars_free(h->symtab); |
chars_free(h->symtab); |
|
|
free(h); |
free(h); |
} |
} |
|
|
Line 171 print_gen_head(struct html *h) |
|
Line 189 print_gen_head(struct html *h) |
|
tag[3].val = "all"; |
tag[3].val = "all"; |
print_otag(h, TAG_LINK, 4, tag); |
print_otag(h, TAG_LINK, 4, tag); |
} |
} |
|
|
if (h->base) { |
|
tag[0].key = ATTR_HREF; |
|
tag[1].val = h->base; |
|
print_otag(h, TAG_BASE, 1, tag); |
|
} |
|
} |
} |
|
|
|
|
|
|
print_spec(struct html *h, const char *p, int len) |
print_spec(struct html *h, const char *p, int len) |
{ |
{ |
const char *rhs; |
const char *rhs; |
int i; |
|
size_t sz; |
size_t sz; |
|
|
rhs = chars_a2ascii(h->symtab, p, (size_t)len, &sz); |
rhs = chars_a2ascii(h->symtab, p, (size_t)len, &sz); |
|
|
if (NULL == rhs) |
if (NULL == rhs) |
return; |
return; |
for (i = 0; i < (int)sz; i++) |
fwrite(rhs, 1, sz, stdout); |
putchar(rhs[i]); |
|
} |
} |
|
|
|
|
|
|
print_res(struct html *h, const char *p, int len) |
print_res(struct html *h, const char *p, int len) |
{ |
{ |
const char *rhs; |
const char *rhs; |
int i; |
|
size_t sz; |
size_t sz; |
|
|
rhs = chars_a2res(h->symtab, p, (size_t)len, &sz); |
rhs = chars_a2res(h->symtab, p, (size_t)len, &sz); |
|
|
if (NULL == rhs) |
if (NULL == rhs) |
return; |
return; |
for (i = 0; i < (int)sz; i++) |
fwrite(rhs, 1, sz, stdout); |
putchar(rhs[i]); |
|
} |
} |
|
|
|
|
static void |
static void |
print_escape(struct html *h, const char **p) |
print_encode(struct html *h, const char *p) |
{ |
{ |
int j, type; |
size_t sz; |
const char *wp; |
int len; |
|
const char *seq; |
|
enum roffdeco deco; |
|
|
wp = *p; |
for (; *p; p++) { |
type = 1; |
sz = strcspn(p, "\\<>&"); |
|
|
if (0 == *(++wp)) { |
fwrite(p, 1, sz, stdout); |
*p = wp; |
p += /* LINTED */ |
return; |
sz; |
} |
|
|
|
if ('(' == *wp) { |
if ('<' == *p) { |
wp++; |
printf("<"); |
if (0 == *wp || 0 == *(wp + 1)) { |
continue; |
*p = 0 == *wp ? wp : wp + 1; |
} else if ('>' == *p) { |
return; |
printf(">"); |
} |
continue; |
|
} else if ('&' == *p) { |
|
printf("&"); |
|
continue; |
|
} else if ('\0' == *p) |
|
break; |
|
|
print_spec(h, wp, 2); |
seq = ++p; |
*p = ++wp; |
len = a2roffdeco(&deco, &seq, &sz); |
return; |
|
|
|
} else if ('*' == *wp) { |
switch (deco) { |
if (0 == *(++wp)) { |
case (DECO_RESERVED): |
*p = wp; |
print_res(h, seq, sz); |
return; |
|
} |
|
|
|
switch (*wp) { |
|
case ('('): |
|
wp++; |
|
if (0 == *wp || 0 == *(wp + 1)) { |
|
*p = 0 == *wp ? wp : wp + 1; |
|
return; |
|
} |
|
|
|
print_res(h, wp, 2); |
|
*p = ++wp; |
|
return; |
|
case ('['): |
|
type = 0; |
|
break; |
break; |
default: |
case (DECO_SPECIAL): |
print_res(h, wp, 1); |
print_spec(h, seq, sz); |
*p = wp; |
|
return; |
|
} |
|
|
|
} else if ('f' == *wp) { |
|
if (0 == *(++wp)) { |
|
*p = wp; |
|
return; |
|
} |
|
|
|
switch (*wp) { |
|
case ('B'): |
|
/* TODO */ |
|
break; |
break; |
case ('I'): |
|
/* TODO */ |
|
break; |
|
case ('P'): |
|
/* FALLTHROUGH */ |
|
case ('R'): |
|
/* TODO */ |
|
break; |
|
default: |
default: |
break; |
break; |
} |
} |
|
|
*p = wp; |
p += len - 1; |
return; |
|
|
|
} else if ('[' != *wp) { |
|
print_spec(h, wp, 1); |
|
*p = wp; |
|
return; |
|
} |
} |
|
|
wp++; |
|
for (j = 0; *wp && ']' != *wp; wp++, j++) |
|
/* Loop... */ ; |
|
|
|
if (0 == *wp) { |
|
*p = wp; |
|
return; |
|
} |
|
|
|
if (type) |
|
print_spec(h, wp - j, j); |
|
else |
|
print_res(h, wp - j, j); |
|
|
|
*p = wp; |
|
} |
} |
|
|
|
|
static void |
|
print_encode(struct html *h, const char *p) |
|
{ |
|
|
|
for (; *p; p++) { |
|
if ('\\' == *p) { |
|
print_escape(h, &p); |
|
continue; |
|
} |
|
switch (*p) { |
|
case ('<'): |
|
printf("<"); |
|
break; |
|
case ('>'): |
|
printf(">"); |
|
break; |
|
case ('&'): |
|
printf("&"); |
|
break; |
|
default: |
|
putchar(*p); |
|
break; |
|
} |
|
} |
|
} |
|
|
|
|
|
struct tag * |
struct tag * |
print_otag(struct html *h, enum htmltag tag, |
print_otag(struct html *h, enum htmltag tag, |
int sz, const struct htmlpair *p) |
int sz, const struct htmlpair *p) |
Line 347 print_otag(struct html *h, enum htmltag tag, |
|
Line 274 print_otag(struct html *h, enum htmltag tag, |
|
struct tag *t; |
struct tag *t; |
|
|
if ( ! (HTML_NOSTACK & htmltags[tag].flags)) { |
if ( ! (HTML_NOSTACK & htmltags[tag].flags)) { |
if (NULL == (t = malloc(sizeof(struct tag)))) |
t = malloc(sizeof(struct tag)); |
err(EXIT_FAILURE, "malloc"); |
if (NULL == t) { |
|
perror(NULL); |
|
exit(EXIT_FAILURE); |
|
} |
t->tag = tag; |
t->tag = tag; |
SLIST_INSERT_HEAD(&h->tags, t, entry); |
t->next = h->tags.head; |
|
h->tags.head = t; |
} else |
} else |
t = NULL; |
t = NULL; |
|
|
if ( ! (HTML_NOSPACE & h->flags)) |
if ( ! (HTML_NOSPACE & h->flags)) |
if ( ! (HTML_CLRLINE & htmltags[tag].flags)) |
if ( ! (HTML_CLRLINE & htmltags[tag].flags)) |
printf(" "); |
putchar(' '); |
|
|
printf("<%s", htmltags[tag].name); |
printf("<%s", htmltags[tag].name); |
for (i = 0; i < sz; i++) { |
for (i = 0; i < sz; i++) { |
printf(" %s=\"", htmlattrs[p[i].key]); |
printf(" %s=\"", htmlattrs[p[i].key]); |
assert(p->val); |
assert(p->val); |
print_encode(h, p[i].val); |
print_encode(h, p[i].val); |
printf("\""); |
putchar('\"'); |
} |
} |
printf(">"); |
putchar('>'); |
|
|
h->flags |= HTML_NOSPACE; |
h->flags |= HTML_NOSPACE; |
if (HTML_CLRLINE & htmltags[tag].flags) |
if (HTML_CLRLINE & htmltags[tag].flags) |
Line 383 print_ctag(struct html *h, enum htmltag tag) |
|
Line 314 print_ctag(struct html *h, enum htmltag tag) |
|
{ |
{ |
|
|
printf("</%s>", htmltags[tag].name); |
printf("</%s>", htmltags[tag].name); |
if (HTML_CLRLINE & htmltags[tag].flags) |
if (HTML_CLRLINE & htmltags[tag].flags) { |
h->flags |= HTML_NOSPACE; |
h->flags |= HTML_NOSPACE; |
if (HTML_CLRLINE & htmltags[tag].flags) |
|
h->flags |= HTML_NEWLINE; |
h->flags |= HTML_NEWLINE; |
else |
putchar('\n'); |
|
} else |
h->flags &= ~HTML_NEWLINE; |
h->flags &= ~HTML_NEWLINE; |
} |
} |
|
|
Line 424 print_text(struct html *h, const char *p) |
|
Line 355 print_text(struct html *h, const char *p) |
|
case(']'): |
case(']'): |
/* FALLTHROUGH */ |
/* FALLTHROUGH */ |
case('}'): |
case('}'): |
h->flags |= HTML_NOSPACE; |
if ( ! (HTML_IGNDELIM & h->flags)) |
|
h->flags |= HTML_NOSPACE; |
break; |
break; |
default: |
default: |
break; |
break; |
} |
} |
|
|
if ( ! (h->flags & HTML_NOSPACE)) |
if ( ! (h->flags & HTML_NOSPACE)) |
printf(" "); |
putchar(' '); |
|
|
h->flags &= ~HTML_NOSPACE; |
h->flags &= ~HTML_NOSPACE; |
h->flags &= ~HTML_NEWLINE; |
h->flags &= ~HTML_NEWLINE; |
Line 459 print_tagq(struct html *h, const struct tag *until) |
|
Line 391 print_tagq(struct html *h, const struct tag *until) |
|
{ |
{ |
struct tag *tag; |
struct tag *tag; |
|
|
while ( ! SLIST_EMPTY(&h->tags)) { |
while ((tag = h->tags.head) != NULL) { |
tag = SLIST_FIRST(&h->tags); |
|
print_ctag(h, tag->tag); |
print_ctag(h, tag->tag); |
SLIST_REMOVE_HEAD(&h->tags, entry); |
h->tags.head = tag->next; |
free(tag); |
free(tag); |
if (until && tag == until) |
if (until && tag == until) |
return; |
return; |
Line 475 print_stagq(struct html *h, const struct tag *suntil) |
|
Line 406 print_stagq(struct html *h, const struct tag *suntil) |
|
{ |
{ |
struct tag *tag; |
struct tag *tag; |
|
|
while ( ! SLIST_EMPTY(&h->tags)) { |
while ((tag = h->tags.head) != NULL) { |
tag = SLIST_FIRST(&h->tags); |
|
if (suntil && tag == suntil) |
if (suntil && tag == suntil) |
return; |
return; |
print_ctag(h, tag->tag); |
print_ctag(h, tag->tag); |
SLIST_REMOVE_HEAD(&h->tags, entry); |
h->tags.head = tag->next; |
free(tag); |
free(tag); |
|
} |
|
} |
|
|
|
|
|
void |
|
bufinit(struct html *h) |
|
{ |
|
|
|
h->buf[0] = '\0'; |
|
h->buflen = 0; |
|
} |
|
|
|
|
|
/*
 * Append one "key:val;" declaration to the scratch buffer of `h'.
 * Both `key' and `val' are appended in full via bufcat(); the ':' and
 * ';' separators are appended as single characters.
 */
void
bufcat_style(struct html *h, const char *key, const char *val)
{

	/* "key:" */
	bufcat(h, key);
	bufncat(h, ":", 1);

	/* "val;" */
	bufcat(h, val);
	bufncat(h, ";", 1);
}
|
|
|
|
|
/*
 * Append the whole NUL-terminated string `p' to the scratch buffer of
 * `h' by handing its measured length to bufncat().
 */
void
bufcat(struct html *h, const char *p)
{
	size_t		 len;

	len = strlen(p);
	bufncat(h, p, len);
}
|
|
|
|
|
void |
|
buffmt(struct html *h, const char *fmt, ...) |
|
{ |
|
va_list ap; |
|
|
|
va_start(ap, fmt); |
|
(void)vsnprintf(h->buf + (int)h->buflen, |
|
BUFSIZ - h->buflen - 1, fmt, ap); |
|
va_end(ap); |
|
h->buflen = strlen(h->buf); |
|
} |
|
|
|
|
|
void |
|
bufncat(struct html *h, const char *p, size_t sz) |
|
{ |
|
|
|
if (h->buflen + sz > BUFSIZ - 1) |
|
sz = BUFSIZ - 1 - h->buflen; |
|
|
|
(void)strncat(h->buf, p, sz); |
|
h->buflen += sz; |
|
} |
|
|
|
|
|
void |
|
buffmt_includes(struct html *h, const char *name) |
|
{ |
|
const char *p, *pp; |
|
|
|
pp = h->base_includes; |
|
|
|
while (NULL != (p = strchr(pp, '%'))) { |
|
bufncat(h, pp, (size_t)(p - pp)); |
|
switch (*(p + 1)) { |
|
case('I'): |
|
bufcat(h, name); |
|
break; |
|
default: |
|
bufncat(h, p, 2); |
|
break; |
|
} |
|
pp = p + 2; |
|
} |
|
if (pp) |
|
bufcat(h, pp); |
|
} |
|
|
|
|
|
void |
|
buffmt_man(struct html *h, |
|
const char *name, const char *sec) |
|
{ |
|
const char *p, *pp; |
|
|
|
pp = h->base_man; |
|
|
|
/* LINTED */ |
|
while (NULL != (p = strchr(pp, '%'))) { |
|
bufncat(h, pp, (size_t)(p - pp)); |
|
switch (*(p + 1)) { |
|
case('S'): |
|
bufcat(h, sec ? sec : "1"); |
|
break; |
|
case('N'): |
|
buffmt(h, name); |
|
break; |
|
default: |
|
bufncat(h, p, 2); |
|
break; |
|
} |
|
pp = p + 2; |
|
} |
|
if (pp) |
|
bufcat(h, pp); |
|
} |
|
|
|
|
|
void |
|
bufcat_su(struct html *h, const char *p, const struct roffsu *su) |
|
{ |
|
double v; |
|
const char *u; |
|
|
|
v = su->scale; |
|
|
|
switch (su->unit) { |
|
case (SCALE_CM): |
|
u = "cm"; |
|
break; |
|
case (SCALE_IN): |
|
u = "in"; |
|
break; |
|
case (SCALE_PC): |
|
u = "pc"; |
|
break; |
|
case (SCALE_PT): |
|
u = "pt"; |
|
break; |
|
case (SCALE_EM): |
|
u = "em"; |
|
break; |
|
case (SCALE_MM): |
|
if (0 == (v /= 100)) |
|
v = 1; |
|
u = "em"; |
|
break; |
|
case (SCALE_EN): |
|
u = "ex"; |
|
break; |
|
case (SCALE_BU): |
|
u = "ex"; |
|
break; |
|
case (SCALE_VS): |
|
u = "em"; |
|
break; |
|
default: |
|
u = "ex"; |
|
break; |
|
} |
|
|
|
if (su->pt) |
|
buffmt(h, "%s: %f%s;", p, v, u); |
|
else |
|
/* LINTED */ |
|
buffmt(h, "%s: %d%s;", p, (int)v, u); |
|
} |
|
|
|
|
|
/*
 * Append an identifier-safe encoding of `src' to the NUL-terminated
 * string already held in `dst'.
 *
 * `sz' is the total size of the `dst' array in bytes.  Each call first
 * appends the letter 'x' (an identifier may not start with a digit)
 * and then every byte of `src' as two lowercase hexadecimal digits.
 * Encoding stops early, on a whole-byte boundary, once fewer than
 * three bytes (two digits plus the terminator) remain.  `dst' is
 * always left NUL-terminated.
 *
 * At least three bytes must be free after the existing contents;
 * this is enforced with assert().
 */
void
html_idcat(char *dst, const char *src, int sz)
{
	int		 ssz;

	assert(sz);

	/* Cf. <http://www.w3.org/TR/html4/types.html#h-6.2>. */

	for ( ; *dst != '\0' && sz; dst++, sz--)
		/* Jump to end. */ ;

	assert(sz > 2);

	/* We can't start with a number (bah). */

	*dst++ = 'x';
	*dst = '\0';
	sz--;

	/*
	 * Convert through unsigned char: a negative plain char would be
	 * sign-extended and print as eight hex digits instead of two.
	 * Requiring sz > 2 guarantees both digits and the terminator
	 * fit, so a byte is never half-encoded.
	 */
	for ( ; *src != '\0' && sz > 2; src++) {
		ssz = snprintf(dst, (size_t)sz, "%.2x",
		    (unsigned int)(unsigned char)*src);
		if (2 != ssz)
			break;
		sz -= ssz;
		dst += ssz;
	}
}