version 1.68, 2009/10/28 05:08:17 |
version 1.82, 2009/11/09 05:11:46 |
|
|
|
|
#include <assert.h> |
#include <assert.h> |
#include <ctype.h> |
#include <ctype.h> |
#include <err.h> |
|
#include <stdio.h> |
|
#include <stdarg.h> |
#include <stdarg.h> |
|
#include <stdio.h> |
#include <stdint.h> |
#include <stdint.h> |
#include <stdlib.h> |
#include <stdlib.h> |
#include <string.h> |
#include <string.h> |
Line 67 static const struct htmldata htmltags[TAG_MAX] = { |
|
Line 66 static const struct htmldata htmltags[TAG_MAX] = { |
|
{"base", HTML_CLRLINE | HTML_NOSTACK}, /* TAG_BASE */ |
{"base", HTML_CLRLINE | HTML_NOSTACK}, /* TAG_BASE */ |
}; |
}; |
|
|
static const char *const htmlattrs[ATTR_MAX] = { |
static const char *const htmlattrs[ATTR_MAX] = { |
"http-equiv", |
"http-equiv", |
"content", |
"content", |
"name", |
"name", |
Line 88 static const char *const htmlattrs[ATTR_MAX] = { |
|
Line 87 static const char *const htmlattrs[ATTR_MAX] = { |
|
extern int getsubopt(char **, char * const *, char **); |
extern int getsubopt(char **, char * const *, char **); |
#endif |
#endif |
|
|
|
|
|
static void print_spec(struct html *, const char *, int); |
|
static void print_res(struct html *, const char *, int); |
|
static void print_ctag(struct html *, enum htmltag); |
|
static void print_encode(struct html *, const char *); |
|
|
|
|
void * |
void * |
html_alloc(char *outopts) |
html_alloc(char *outopts) |
{ |
{ |
Line 100 html_alloc(char *outopts) |
|
Line 106 html_alloc(char *outopts) |
|
toks[2] = "includes"; |
toks[2] = "includes"; |
toks[3] = NULL; |
toks[3] = NULL; |
|
|
if (NULL == (h = calloc(1, sizeof(struct html)))) |
h = calloc(1, sizeof(struct html)); |
return(NULL); |
if (NULL == h) { |
|
perror(NULL); |
|
exit(EXIT_FAILURE); |
|
} |
|
|
h->tags.head = NULL; |
h->tags.head = NULL; |
h->ords.head = NULL; |
h->ords.head = NULL; |
|
h->symtab = chars_init(CHARS_HTML); |
|
|
if (NULL == (h->symtab = chars_init(CHARS_HTML))) { |
|
free(h); |
|
return(NULL); |
|
} |
|
|
|
while (outopts && *outopts) |
while (outopts && *outopts) |
switch (getsubopt(&outopts, UNCONST(toks), &v)) { |
switch (getsubopt(&outopts, UNCONST(toks), &v)) { |
case (0): |
case (0): |
|
|
print_spec(struct html *h, const char *p, int len) |
print_spec(struct html *h, const char *p, int len) |
{ |
{ |
const char *rhs; |
const char *rhs; |
int i; |
|
size_t sz; |
size_t sz; |
|
|
rhs = chars_a2ascii(h->symtab, p, (size_t)len, &sz); |
rhs = chars_a2ascii(h->symtab, p, (size_t)len, &sz); |
|
|
if (NULL == rhs) |
if (NULL == rhs) |
return; |
return; |
for (i = 0; i < (int)sz; i++) |
fwrite(rhs, 1, sz, stdout); |
putchar(rhs[i]); |
|
} |
} |
|
|
|
|
|
|
print_res(struct html *h, const char *p, int len) |
print_res(struct html *h, const char *p, int len) |
{ |
{ |
const char *rhs; |
const char *rhs; |
int i; |
|
size_t sz; |
size_t sz; |
|
|
rhs = chars_a2res(h->symtab, p, (size_t)len, &sz); |
rhs = chars_a2res(h->symtab, p, (size_t)len, &sz); |
|
|
if (NULL == rhs) |
if (NULL == rhs) |
return; |
return; |
for (i = 0; i < (int)sz; i++) |
fwrite(rhs, 1, sz, stdout); |
putchar(rhs[i]); |
|
} |
} |
|
|
|
|
static void |
static void |
print_escape(struct html *h, const char **p) |
print_encode(struct html *h, const char *p) |
{ |
{ |
int j, type; |
size_t sz; |
const char *wp; |
int len; |
|
const char *seq; |
|
enum roffdeco deco; |
|
|
wp = *p; |
for (; *p; p++) { |
type = 1; |
sz = strcspn(p, "\\<>&"); |
|
|
if (0 == *(++wp)) { |
fwrite(p, 1, sz, stdout); |
*p = wp; |
p += /* LINTED */ |
return; |
sz; |
} |
|
|
|
if ('(' == *wp) { |
if ('<' == *p) { |
wp++; |
printf("<"); |
if (0 == *wp || 0 == *(wp + 1)) { |
continue; |
*p = 0 == *wp ? wp : wp + 1; |
} else if ('>' == *p) { |
return; |
printf(">"); |
} |
continue; |
|
} else if ('&' == *p) { |
|
printf("&"); |
|
continue; |
|
} else if ('\0' == *p) |
|
break; |
|
|
print_spec(h, wp, 2); |
seq = ++p; |
*p = ++wp; |
len = a2roffdeco(&deco, &seq, &sz); |
return; |
|
|
|
} else if ('*' == *wp) { |
switch (deco) { |
if (0 == *(++wp)) { |
case (DECO_RESERVED): |
*p = wp; |
print_res(h, seq, sz); |
return; |
|
} |
|
|
|
switch (*wp) { |
|
case ('('): |
|
wp++; |
|
if (0 == *wp || 0 == *(wp + 1)) { |
|
*p = 0 == *wp ? wp : wp + 1; |
|
return; |
|
} |
|
|
|
print_res(h, wp, 2); |
|
*p = ++wp; |
|
return; |
|
case ('['): |
|
type = 0; |
|
break; |
break; |
default: |
case (DECO_SPECIAL): |
print_res(h, wp, 1); |
print_spec(h, seq, sz); |
*p = wp; |
|
return; |
|
} |
|
|
|
} else if ('f' == *wp) { |
|
if (0 == *(++wp)) { |
|
*p = wp; |
|
return; |
|
} |
|
|
|
switch (*wp) { |
|
case ('B'): |
|
/* TODO */ |
|
break; |
break; |
case ('I'): |
|
/* TODO */ |
|
break; |
|
case ('P'): |
|
/* FALLTHROUGH */ |
|
case ('R'): |
|
/* TODO */ |
|
break; |
|
default: |
default: |
break; |
break; |
} |
} |
|
|
*p = wp; |
p += len - 1; |
return; |
|
|
|
} else if ('[' != *wp) { |
|
print_spec(h, wp, 1); |
|
*p = wp; |
|
return; |
|
} |
} |
|
|
wp++; |
|
for (j = 0; *wp && ']' != *wp; wp++, j++) |
|
/* Loop... */ ; |
|
|
|
if (0 == *wp) { |
|
*p = wp; |
|
return; |
|
} |
|
|
|
if (type) |
|
print_spec(h, wp - j, j); |
|
else |
|
print_res(h, wp - j, j); |
|
|
|
*p = wp; |
|
} |
} |
|
|
|
|
static void |
|
print_encode(struct html *h, const char *p) |
|
{ |
|
|
|
for (; *p; p++) { |
|
if ('\\' == *p) { |
|
print_escape(h, &p); |
|
continue; |
|
} |
|
switch (*p) { |
|
case ('<'): |
|
printf("<"); |
|
break; |
|
case ('>'): |
|
printf(">"); |
|
break; |
|
case ('&'): |
|
printf("&"); |
|
break; |
|
default: |
|
putchar(*p); |
|
break; |
|
} |
|
} |
|
} |
|
|
|
|
|
struct tag * |
struct tag * |
print_otag(struct html *h, enum htmltag tag, |
print_otag(struct html *h, enum htmltag tag, |
int sz, const struct htmlpair *p) |
int sz, const struct htmlpair *p) |
Line 354 print_otag(struct html *h, enum htmltag tag, |
|
Line 274 print_otag(struct html *h, enum htmltag tag, |
|
struct tag *t; |
struct tag *t; |
|
|
if ( ! (HTML_NOSTACK & htmltags[tag].flags)) { |
if ( ! (HTML_NOSTACK & htmltags[tag].flags)) { |
if (NULL == (t = malloc(sizeof(struct tag)))) |
t = malloc(sizeof(struct tag)); |
err(EXIT_FAILURE, "malloc"); |
if (NULL == t) { |
|
perror(NULL); |
|
exit(EXIT_FAILURE); |
|
} |
t->tag = tag; |
t->tag = tag; |
t->next = h->tags.head; |
t->next = h->tags.head; |
h->tags.head = t; |
h->tags.head = t; |
Line 364 print_otag(struct html *h, enum htmltag tag, |
|
Line 287 print_otag(struct html *h, enum htmltag tag, |
|
|
|
if ( ! (HTML_NOSPACE & h->flags)) |
if ( ! (HTML_NOSPACE & h->flags)) |
if ( ! (HTML_CLRLINE & htmltags[tag].flags)) |
if ( ! (HTML_CLRLINE & htmltags[tag].flags)) |
printf(" "); |
putchar(' '); |
|
|
printf("<%s", htmltags[tag].name); |
printf("<%s", htmltags[tag].name); |
for (i = 0; i < sz; i++) { |
for (i = 0; i < sz; i++) { |
printf(" %s=\"", htmlattrs[p[i].key]); |
printf(" %s=\"", htmlattrs[p[i].key]); |
assert(p->val); |
assert(p->val); |
print_encode(h, p[i].val); |
print_encode(h, p[i].val); |
printf("\""); |
putchar('\"'); |
} |
} |
printf(">"); |
putchar('>'); |
|
|
h->flags |= HTML_NOSPACE; |
h->flags |= HTML_NOSPACE; |
if (HTML_CLRLINE & htmltags[tag].flags) |
if (HTML_CLRLINE & htmltags[tag].flags) |
Line 391 print_ctag(struct html *h, enum htmltag tag) |
|
Line 314 print_ctag(struct html *h, enum htmltag tag) |
|
{ |
{ |
|
|
printf("</%s>", htmltags[tag].name); |
printf("</%s>", htmltags[tag].name); |
if (HTML_CLRLINE & htmltags[tag].flags) |
if (HTML_CLRLINE & htmltags[tag].flags) { |
h->flags |= HTML_NOSPACE; |
h->flags |= HTML_NOSPACE; |
if (HTML_CLRLINE & htmltags[tag].flags) |
|
h->flags |= HTML_NEWLINE; |
h->flags |= HTML_NEWLINE; |
else |
putchar('\n'); |
|
} else |
h->flags &= ~HTML_NEWLINE; |
h->flags &= ~HTML_NEWLINE; |
} |
} |
|
|
Line 440 print_text(struct html *h, const char *p) |
|
Line 363 print_text(struct html *h, const char *p) |
|
} |
} |
|
|
if ( ! (h->flags & HTML_NOSPACE)) |
if ( ! (h->flags & HTML_NOSPACE)) |
printf(" "); |
putchar(' '); |
|
|
h->flags &= ~HTML_NOSPACE; |
h->flags &= ~HTML_NOSPACE; |
h->flags &= ~HTML_NEWLINE; |
h->flags &= ~HTML_NEWLINE; |
Line 651 bufcat_su(struct html *h, const char *p, const struct |
|
Line 574 bufcat_su(struct html *h, const char *p, const struct |
|
|
|
|
|
void |
void |
html_idcpy(char *dst, const char *src, int sz) |
html_idcat(char *dst, const char *src, int sz) |
{ |
{ |
|
int ssz; |
|
|
assert(sz); |
assert(sz); |
dst[0] = '\0'; |
|
html_idcat(dst, src, sz); |
|
} |
|
|
|
|
|
void |
|
html_idcat(char *dst, const char *src, int sz) |
|
{ |
|
int i; |
|
|
|
/* Cf. <http://www.w3.org/TR/html4/types.html#h-6.2>. */ |
/* Cf. <http://www.w3.org/TR/html4/types.html#h-6.2>. */ |
|
|
for (i = 0; *dst != '\0' && i < sz - 1; dst++, i++) |
for ( ; *dst != '\0' && sz; dst++, sz--) |
/* Jump to end. */ ; |
/* Jump to end. */ ; |
|
|
for ( ; *src != '\0' && i < sz - 1; src++, i++) { |
assert(sz > 2); |
if (isalnum((u_char)*src)) { |
|
*dst++ = *src; |
|
continue; |
|
} |
|
|
|
switch (*src) { |
/* We can't start with a number (bah). */ |
case (';'): |
|
*dst++ = ';'; |
|
break; |
|
case ('-'): |
|
*dst++ = '-'; |
|
break; |
|
case (':'): |
|
*dst++ = ':'; |
|
break; |
|
case ('_'): |
|
/* FALLTHROUGH */ |
|
default: |
|
*dst++ = '_'; |
|
break; |
|
} |
|
} |
|
|
|
|
*dst++ = 'x'; |
*dst = '\0'; |
*dst = '\0'; |
|
sz--; |
|
|
|
for ( ; *src != '\0' && sz > 1; src++) { |
|
ssz = snprintf(dst, (size_t)sz, "%.2x", *src); |
|
sz -= ssz; |
|
dst += ssz; |
|
} |
} |
} |