version 1.61, 2009/10/07 15:27:11 |
version 1.88, 2009/11/14 19:23:58 |
|
|
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
*/ |
*/ |
#include <sys/types.h> |
#include <sys/types.h> |
#include <sys/queue.h> |
|
|
|
#include <assert.h> |
#include <assert.h> |
#include <err.h> |
#include <ctype.h> |
#include <stdio.h> |
|
#include <stdarg.h> |
#include <stdarg.h> |
|
#include <stdio.h> |
|
#include <stdint.h> |
#include <stdlib.h> |
#include <stdlib.h> |
#include <string.h> |
#include <string.h> |
#include <unistd.h> |
#include <unistd.h> |
|
|
#include "out.h" |
#include "out.h" |
#include "chars.h" |
#include "chars.h" |
#include "html.h" |
#include "html.h" |
|
#include "main.h" |
|
|
|
#define UNCONST(a) ((void *)(uintptr_t)(const void *)(a)) |
|
|
#define DOCTYPE "-//W3C//DTD HTML 4.01//EN" |
#define DOCTYPE "-//W3C//DTD HTML 4.01//EN" |
#define DTD "http://www.w3.org/TR/html4/strict.dtd" |
#define DTD "http://www.w3.org/TR/html4/strict.dtd" |
|
|
struct htmldata { |
struct htmldata { |
char *name; |
const char *name; |
int flags; |
int flags; |
#define HTML_CLRLINE (1 << 0) |
#define HTML_CLRLINE (1 << 0) |
#define HTML_NOSTACK (1 << 1) |
#define HTML_NOSTACK (1 << 1) |
Line 63 static const struct htmldata htmltags[TAG_MAX] = { |
|
Line 66 static const struct htmldata htmltags[TAG_MAX] = { |
|
{"base", HTML_CLRLINE | HTML_NOSTACK}, /* TAG_BASE */ |
{"base", HTML_CLRLINE | HTML_NOSTACK}, /* TAG_BASE */ |
}; |
}; |
|
|
static const char *const htmlattrs[ATTR_MAX] = { |
static const char *const htmlattrs[ATTR_MAX] = { |
"http-equiv", |
"http-equiv", |
"content", |
"content", |
"name", |
"name", |
Line 77 static const char *const htmlattrs[ATTR_MAX] = { |
|
Line 80 static const char *const htmlattrs[ATTR_MAX] = { |
|
"valign", |
"valign", |
"target", |
"target", |
"id", |
"id", |
|
"summary", |
}; |
}; |
|
|
#ifdef __linux__ |
#ifdef __linux__ |
extern int getsubopt(char **, char * const *, char **); |
extern int getsubopt(char **, char * const *, char **); |
#endif |
#endif |
|
|
|
|
|
static void print_spec(struct html *, const char *, size_t); |
|
static void print_res(struct html *, const char *, size_t); |
|
static void print_ctag(struct html *, enum htmltag); |
|
static int print_encode(struct html *, const char *, int); |
|
static void print_metaf(struct html *, enum roffdeco); |
|
|
|
|
void * |
void * |
html_alloc(char *outopts) |
html_alloc(char *outopts) |
{ |
{ |
struct html *h; |
struct html *h; |
char *toks[4], *v; |
const char *toks[4]; |
|
char *v; |
|
|
toks[0] = "style"; |
toks[0] = "style"; |
toks[1] = "man"; |
toks[1] = "man"; |
toks[2] = "includes"; |
toks[2] = "includes"; |
toks[3] = NULL; |
toks[3] = NULL; |
|
|
if (NULL == (h = calloc(1, sizeof(struct html)))) |
h = calloc(1, sizeof(struct html)); |
return(NULL); |
if (NULL == h) { |
|
perror(NULL); |
SLIST_INIT(&h->tags); |
exit(EXIT_FAILURE); |
SLIST_INIT(&h->ords); |
|
|
|
if (NULL == (h->symtab = chars_init(CHARS_HTML))) { |
|
free(h); |
|
return(NULL); |
|
} |
} |
|
|
|
h->tags.head = NULL; |
|
h->ords.head = NULL; |
|
h->symtab = chars_init(CHARS_HTML); |
|
|
while (outopts && *outopts) |
while (outopts && *outopts) |
switch (getsubopt(&outopts, toks, &v)) { |
switch (getsubopt(&outopts, UNCONST(toks), &v)) { |
case (0): |
case (0): |
h->style = v; |
h->style = v; |
break; |
break; |
Line 133 html_free(void *p) |
|
Line 145 html_free(void *p) |
|
|
|
h = (struct html *)p; |
h = (struct html *)p; |
|
|
while ( ! SLIST_EMPTY(&h->ords)) { |
while ((ord = h->ords.head) != NULL) { |
ord = SLIST_FIRST(&h->ords); |
h->ords.head = ord->next; |
SLIST_REMOVE_HEAD(&h->ords, entry); |
|
free(ord); |
free(ord); |
} |
} |
|
|
while ( ! SLIST_EMPTY(&h->tags)) { |
while ((tag = h->tags.head) != NULL) { |
tag = SLIST_FIRST(&h->tags); |
h->tags.head = tag->next; |
SLIST_REMOVE_HEAD(&h->tags, entry); |
|
free(tag); |
free(tag); |
} |
} |
|
|
Line 184 print_gen_head(struct html *h) |
|
Line 194 print_gen_head(struct html *h) |
|
|
|
|
|
static void |
static void |
print_spec(struct html *h, const char *p, int len) |
print_spec(struct html *h, const char *p, size_t len) |
{ |
{ |
const char *rhs; |
const char *rhs; |
int i; |
|
size_t sz; |
size_t sz; |
|
|
rhs = chars_a2ascii(h->symtab, p, (size_t)len, &sz); |
rhs = chars_a2ascii(h->symtab, p, len, &sz); |
|
|
if (NULL == rhs) |
if (NULL == rhs) |
return; |
return; |
for (i = 0; i < (int)sz; i++) |
fwrite(rhs, 1, sz, stdout); |
putchar(rhs[i]); |
|
} |
} |
|
|
|
|
static void |
static void |
print_res(struct html *h, const char *p, int len) |
print_res(struct html *h, const char *p, size_t len) |
{ |
{ |
const char *rhs; |
const char *rhs; |
int i; |
|
size_t sz; |
size_t sz; |
|
|
rhs = chars_a2res(h->symtab, p, (size_t)len, &sz); |
rhs = chars_a2res(h->symtab, p, len, &sz); |
|
|
if (NULL == rhs) |
if (NULL == rhs) |
return; |
return; |
for (i = 0; i < (int)sz; i++) |
fwrite(rhs, 1, sz, stdout); |
putchar(rhs[i]); |
|
} |
} |
|
|
|
|
static void |
static void |
print_escape(struct html *h, const char **p) |
print_metaf(struct html *h, enum roffdeco deco) |
{ |
{ |
int j, type; |
const char *class; |
const char *wp; |
struct htmlpair tag; |
|
|
wp = *p; |
switch (deco) { |
type = 1; |
case (DECO_BOLD): |
|
class = "bold"; |
|
break; |
|
case (DECO_ITALIC): |
|
class = "italic"; |
|
break; |
|
case (DECO_ROMAN): |
|
class = "roman"; |
|
break; |
|
default: |
|
abort(); |
|
/* NOTREACHED */ |
|
} |
|
|
if (0 == *(++wp)) { |
if (h->metaf) { |
*p = wp; |
assert(h->tags.head); |
return; |
assert(h->metaf == h->tags.head); |
|
print_tagq(h, h->metaf); |
} |
} |
|
|
|
PAIR_CLASS_INIT(&tag, class); |
|
h->metaf = print_otag(h, TAG_SPAN, 1, &tag); |
|
} |
|
|
if ('(' == *wp) { |
|
wp++; |
|
if (0 == *wp || 0 == *(wp + 1)) { |
|
*p = 0 == *wp ? wp : wp + 1; |
|
return; |
|
} |
|
|
|
print_spec(h, wp, 2); |
static int |
*p = ++wp; |
print_encode(struct html *h, const char *p, int norecurse) |
return; |
{ |
|
size_t sz; |
|
int len, nospace; |
|
const char *seq; |
|
enum roffdeco deco; |
|
|
} else if ('*' == *wp) { |
nospace = 0; |
if (0 == *(++wp)) { |
|
*p = wp; |
|
return; |
|
} |
|
|
|
switch (*wp) { |
for (; *p; p++) { |
case ('('): |
sz = strcspn(p, "\\<>&"); |
wp++; |
|
if (0 == *wp || 0 == *(wp + 1)) { |
|
*p = 0 == *wp ? wp : wp + 1; |
|
return; |
|
} |
|
|
|
print_res(h, wp, 2); |
fwrite(p, 1, sz, stdout); |
*p = ++wp; |
p += /* LINTED */ |
return; |
sz; |
case ('['): |
|
type = 0; |
if ('<' == *p) { |
|
printf("<"); |
|
continue; |
|
} else if ('>' == *p) { |
|
printf(">"); |
|
continue; |
|
} else if ('&' == *p) { |
|
printf("&"); |
|
continue; |
|
} else if ('\0' == *p) |
break; |
break; |
default: |
|
print_res(h, wp, 1); |
|
*p = wp; |
|
return; |
|
} |
|
|
|
} else if ('f' == *wp) { |
|
if (0 == *(++wp)) { |
|
*p = wp; |
|
return; |
|
} |
|
|
|
switch (*wp) { |
seq = ++p; |
case ('B'): |
len = a2roffdeco(&deco, &seq, &sz); |
/* TODO */ |
|
|
switch (deco) { |
|
case (DECO_RESERVED): |
|
print_res(h, seq, sz); |
break; |
break; |
case ('I'): |
case (DECO_SPECIAL): |
/* TODO */ |
print_spec(h, seq, sz); |
break; |
break; |
case ('P'): |
case (DECO_BOLD): |
/* FALLTHROUGH */ |
/* FALLTHROUGH */ |
case ('R'): |
case (DECO_ITALIC): |
/* TODO */ |
/* FALLTHROUGH */ |
|
case (DECO_ROMAN): |
|
if (norecurse) |
|
break; |
|
print_metaf(h, deco); |
break; |
break; |
default: |
default: |
break; |
break; |
} |
} |
|
|
*p = wp; |
p += len - 1; |
return; |
|
|
|
} else if ('[' != *wp) { |
if (DECO_NOSPACE == deco && '\0' == *(p + 1)) |
print_spec(h, wp, 1); |
nospace = 1; |
*p = wp; |
|
return; |
|
} |
} |
|
|
wp++; |
return(nospace); |
for (j = 0; *wp && ']' != *wp; wp++, j++) |
|
/* Loop... */ ; |
|
|
|
if (0 == *wp) { |
|
*p = wp; |
|
return; |
|
} |
|
|
|
if (type) |
|
print_spec(h, wp - j, j); |
|
else |
|
print_res(h, wp - j, j); |
|
|
|
*p = wp; |
|
} |
} |
|
|
|
|
static void |
|
print_encode(struct html *h, const char *p) |
|
{ |
|
|
|
for (; *p; p++) { |
|
if ('\\' == *p) { |
|
print_escape(h, &p); |
|
continue; |
|
} |
|
switch (*p) { |
|
case ('<'): |
|
printf("<"); |
|
break; |
|
case ('>'): |
|
printf(">"); |
|
break; |
|
case ('&'): |
|
printf("&"); |
|
break; |
|
default: |
|
putchar(*p); |
|
break; |
|
} |
|
} |
|
} |
|
|
|
|
|
struct tag * |
struct tag * |
print_otag(struct html *h, enum htmltag tag, |
print_otag(struct html *h, enum htmltag tag, |
int sz, const struct htmlpair *p) |
int sz, const struct htmlpair *p) |
Line 350 print_otag(struct html *h, enum htmltag tag, |
|
Line 323 print_otag(struct html *h, enum htmltag tag, |
|
struct tag *t; |
struct tag *t; |
|
|
if ( ! (HTML_NOSTACK & htmltags[tag].flags)) { |
if ( ! (HTML_NOSTACK & htmltags[tag].flags)) { |
if (NULL == (t = malloc(sizeof(struct tag)))) |
t = malloc(sizeof(struct tag)); |
err(EXIT_FAILURE, "malloc"); |
if (NULL == t) { |
|
perror(NULL); |
|
exit(EXIT_FAILURE); |
|
} |
t->tag = tag; |
t->tag = tag; |
SLIST_INSERT_HEAD(&h->tags, t, entry); |
t->next = h->tags.head; |
|
h->tags.head = t; |
} else |
} else |
t = NULL; |
t = NULL; |
|
|
if ( ! (HTML_NOSPACE & h->flags)) |
if ( ! (HTML_NOSPACE & h->flags)) |
if ( ! (HTML_CLRLINE & htmltags[tag].flags)) |
if ( ! (HTML_CLRLINE & htmltags[tag].flags)) |
printf(" "); |
putchar(' '); |
|
|
printf("<%s", htmltags[tag].name); |
printf("<%s", htmltags[tag].name); |
for (i = 0; i < sz; i++) { |
for (i = 0; i < sz; i++) { |
printf(" %s=\"", htmlattrs[p[i].key]); |
printf(" %s=\"", htmlattrs[p[i].key]); |
assert(p->val); |
assert(p->val); |
print_encode(h, p[i].val); |
(void)print_encode(h, p[i].val, 1); |
printf("\""); |
putchar('\"'); |
} |
} |
printf(">"); |
putchar('>'); |
|
|
h->flags |= HTML_NOSPACE; |
h->flags |= HTML_NOSPACE; |
if (HTML_CLRLINE & htmltags[tag].flags) |
|
h->flags |= HTML_NEWLINE; |
|
else |
|
h->flags &= ~HTML_NEWLINE; |
|
|
|
return(t); |
return(t); |
} |
} |
|
|
Line 386 print_ctag(struct html *h, enum htmltag tag) |
|
Line 358 print_ctag(struct html *h, enum htmltag tag) |
|
{ |
{ |
|
|
printf("</%s>", htmltags[tag].name); |
printf("</%s>", htmltags[tag].name); |
if (HTML_CLRLINE & htmltags[tag].flags) |
if (HTML_CLRLINE & htmltags[tag].flags) { |
h->flags |= HTML_NOSPACE; |
h->flags |= HTML_NOSPACE; |
if (HTML_CLRLINE & htmltags[tag].flags) |
putchar('\n'); |
h->flags |= HTML_NEWLINE; |
} |
else |
|
h->flags &= ~HTML_NEWLINE; |
|
} |
} |
|
|
|
|
Line 435 print_text(struct html *h, const char *p) |
|
Line 405 print_text(struct html *h, const char *p) |
|
} |
} |
|
|
if ( ! (h->flags & HTML_NOSPACE)) |
if ( ! (h->flags & HTML_NOSPACE)) |
printf(" "); |
putchar(' '); |
|
|
h->flags &= ~HTML_NOSPACE; |
assert(p); |
h->flags &= ~HTML_NEWLINE; |
if ( ! print_encode(h, p, 0)) |
|
h->flags &= ~HTML_NOSPACE; |
|
|
if (p) |
|
print_encode(h, p); |
|
|
|
if (*p && 0 == *(p + 1)) |
if (*p && 0 == *(p + 1)) |
switch (*p) { |
switch (*p) { |
case('('): |
case('('): |
Line 463 print_tagq(struct html *h, const struct tag *until) |
|
Line 431 print_tagq(struct html *h, const struct tag *until) |
|
{ |
{ |
struct tag *tag; |
struct tag *tag; |
|
|
while ( ! SLIST_EMPTY(&h->tags)) { |
while ((tag = h->tags.head) != NULL) { |
tag = SLIST_FIRST(&h->tags); |
|
print_ctag(h, tag->tag); |
print_ctag(h, tag->tag); |
SLIST_REMOVE_HEAD(&h->tags, entry); |
h->tags.head = tag->next; |
free(tag); |
free(tag); |
if (until && tag == until) |
if (until && tag == until) |
return; |
return; |
Line 479 print_stagq(struct html *h, const struct tag *suntil) |
|
Line 446 print_stagq(struct html *h, const struct tag *suntil) |
|
{ |
{ |
struct tag *tag; |
struct tag *tag; |
|
|
while ( ! SLIST_EMPTY(&h->tags)) { |
while ((tag = h->tags.head) != NULL) { |
tag = SLIST_FIRST(&h->tags); |
|
if (suntil && tag == suntil) |
if (suntil && tag == suntil) |
return; |
return; |
print_ctag(h, tag->tag); |
print_ctag(h, tag->tag); |
SLIST_REMOVE_HEAD(&h->tags, entry); |
h->tags.head = tag->next; |
free(tag); |
free(tag); |
} |
} |
} |
} |
Line 599 buffmt_man(struct html *h, |
|
Line 565 buffmt_man(struct html *h, |
|
void |
void |
bufcat_su(struct html *h, const char *p, const struct roffsu *su) |
bufcat_su(struct html *h, const char *p, const struct roffsu *su) |
{ |
{ |
int v; |
double v; |
char *u; |
const char *u; |
|
|
v = su->scale; |
v = su->scale; |
|
|
Line 639 bufcat_su(struct html *h, const char *p, const struct |
|
Line 605 bufcat_su(struct html *h, const char *p, const struct |
|
break; |
break; |
} |
} |
|
|
buffmt(h, "%s: %d%s;", p, v, u); |
if (su->pt) |
|
buffmt(h, "%s: %f%s;", p, v, u); |
|
else |
|
/* LINTED */ |
|
buffmt(h, "%s: %d%s;", p, (int)v, u); |
|
} |
|
|
|
|
|
void |
|
html_idcat(char *dst, const char *src, int sz) |
|
{ |
|
int ssz; |
|
|
|
assert(sz); |
|
|
|
/* Cf. <http://www.w3.org/TR/html4/types.html#h-6.2>. */ |
|
|
|
for ( ; *dst != '\0' && sz; dst++, sz--) |
|
/* Jump to end. */ ; |
|
|
|
assert(sz > 2); |
|
|
|
/* We can't start with a number (bah). */ |
|
|
|
*dst++ = 'x'; |
|
*dst = '\0'; |
|
sz--; |
|
|
|
for ( ; *src != '\0' && sz > 1; src++) { |
|
ssz = snprintf(dst, (size_t)sz, "%.2x", *src); |
|
sz -= ssz; |
|
dst += ssz; |
|
} |
} |
} |