version 1.33, 2014/07/18 23:56:57 |
version 1.59, 2015/02/23 15:12:06 |
|
|
/* $Id$ */ |
/* $Id$ */ |
/* |
/* |
* Copyright (c) 2014 Kristaps Dzonsons <kristaps@bsd.lv> |
* Copyright (c) 2014 Kristaps Dzonsons <kristaps@bsd.lv> |
|
* Copyright (c) 2014, 2015 Ingo Schwarze <schwarze@openbsd.org> |
* |
* |
* Permission to use, copy, modify, and distribute this software for any |
* Permission to use, copy, modify, and distribute this software for any |
* purpose with or without fee is hereby granted, provided that the above |
* purpose with or without fee is hereby granted, provided that the above |
|
|
#include <string.h> |
#include <string.h> |
#include <unistd.h> |
#include <unistd.h> |
|
|
|
#include "dict.h" |
|
|
/* |
/* |
* In what section can we find Perl module manuals? |
* In what section can we find Perl module manuals? |
* Sometimes (Mac OS X) it's 3pm, sometimes (OpenBSD, etc.) 3p. |
* Sometimes (Mac OS X) it's 3pm, sometimes (OpenBSD, etc.) 3p. |
|
|
char *outbuf; /* text buffered for output */ |
char *outbuf; /* text buffered for output */ |
size_t outbufsz; /* allocated size of outbuf */ |
size_t outbufsz; /* allocated size of outbuf */ |
size_t outbuflen; /* current length of outbuf */ |
size_t outbuflen; /* current length of outbuf */ |
|
size_t outlnlen; /* chars so far on this output line */ |
}; |
}; |
|
|
enum fmt { |
enum fmt { |
|
|
CMD__MAX |
CMD__MAX |
}; |
}; |
|
|
|
static void command(struct state *, const char *, size_t, size_t); |
|
static void dofile(const struct args *, const char *, |
|
const struct tm *, char *, size_t); |
|
static void donamenm(struct state *, const char *, size_t *, size_t); |
|
static void dopar(struct state *, char *, size_t, size_t); |
|
static void dosynopsisfl(const char *, size_t *, size_t); |
|
static int dosynopsisop(struct state *, const char *, size_t *, |
|
size_t, size_t *); |
|
static int formatcode(struct state *, const char *, size_t *, |
|
size_t, int, int); |
|
static void formatcodeln(struct state *, const char *, const char *, |
|
size_t *, size_t, int); |
|
static void formatescape(struct state *, const char *, size_t *, size_t); |
|
static int hasmatch(const char *, size_t, size_t); |
|
static void ordinary(struct state *, const char *, size_t, size_t); |
|
static void outbuf_addchar(struct state *); |
|
static void outbuf_addstr(struct state *, const char *); |
|
static void outbuf_flush(struct state *); |
|
static void outbuf_grow(struct state *, size_t); |
|
static enum list listguess(const char *, size_t, size_t); |
|
static void mdoc_newln(struct state *); |
|
static int readfile(const struct args *, const char *); |
|
static void register_type(const char *); |
|
static int trylink(const char *, size_t *, size_t, size_t); |
|
static void verbatim(struct state *, char *, size_t, size_t); |
|
|
static const char *const cmds[CMD__MAX] = { |
static const char *const cmds[CMD__MAX] = { |
"pod", /* CMD_POD */ |
"pod", /* CMD_POD */ |
"head1", /* CMD_HEAD1 */ |
"head1", /* CMD_HEAD1 */ |
Line 132 static const char fmts[FMT__MAX] = { |
|
Line 162 static const char fmts[FMT__MAX] = { |
|
'Z' /* FMT_NULL */ |
'Z' /* FMT_NULL */ |
}; |
}; |
|
|
static int last; |
static unsigned char last; |
|
|
|
|
static void |
static void |
Line 157 outbuf_addchar(struct state *st) |
|
Line 187 outbuf_addchar(struct state *st) |
|
if ('\\' == last) |
if ('\\' == last) |
st->outbuf[st->outbuflen++] = 'e'; |
st->outbuf[st->outbuflen++] = 'e'; |
st->outbuf[st->outbuflen] = '\0'; |
st->outbuf[st->outbuflen] = '\0'; |
st->wantws = 0; |
|
} |
} |
|
|
static void |
static void |
Line 171 outbuf_addstr(struct state *st, const char *str) |
|
Line 200 outbuf_addstr(struct state *st, const char *str) |
|
memcpy(st->outbuf + st->outbuflen, str, slen+1); |
memcpy(st->outbuf + st->outbuflen, str, slen+1); |
st->outbuflen += slen; |
st->outbuflen += slen; |
last = str[slen - 1]; |
last = str[slen - 1]; |
st->wantws = 0; |
|
} |
} |
|
|
static void |
static void |
Line 181 outbuf_flush(struct state *st) |
|
Line 209 outbuf_flush(struct state *st) |
|
if (0 == st->outbuflen) |
if (0 == st->outbuflen) |
return; |
return; |
|
|
fputs(st->outbuf, stdout); |
st->outlnlen += st->outbuflen; |
|
if (OUST_TXT == st->oust && st->wantws) { |
|
if (++st->outlnlen > 72) { |
|
putchar('\n'); |
|
st->oust = OUST_NL; |
|
st->outlnlen = st->outbuflen; |
|
} |
|
} |
|
if (OUST_NL != st->oust && st->wantws) |
|
putchar(' '); |
|
|
|
if (OUST_MAC == st->oust && '"' == *st->outbuf) |
|
printf("\\(dq%s", st->outbuf + 1); |
|
else |
|
fputs(st->outbuf, stdout); |
|
|
*st->outbuf = '\0'; |
*st->outbuf = '\0'; |
st->outbuflen = 0; |
st->outbuflen = 0; |
|
|
Line 199 mdoc_newln(struct state *st) |
|
Line 242 mdoc_newln(struct state *st) |
|
putchar('\n'); |
putchar('\n'); |
last = '\n'; |
last = '\n'; |
st->oust = OUST_NL; |
st->oust = OUST_NL; |
|
st->outlnlen = 0; |
st->wantws = 1; |
st->wantws = 1; |
} |
} |
|
|
|
|
'?' != buf[*start + 1] && |
'?' != buf[*start + 1] && |
'-' != buf[*start + 1]) { |
'-' != buf[*start + 1]) { |
(*start)--; |
(*start)--; |
fputs("Ar ", stdout); |
fputs("Ar", stdout); |
return; |
return; |
} |
} |
|
|
|
|
assert(i < end); |
assert(i < end); |
|
|
if ( ! (' ' == buf[i] || '>' == buf[i])) { |
if ( ! (' ' == buf[i] || '>' == buf[i])) { |
printf("Ar "); |
fputs("Ar", stdout); |
return; |
return; |
} |
} |
|
|
|
|
(end - *start == 2 || |
(end - *start == 2 || |
' ' == buf[*start + 2])) |
' ' == buf[*start + 2])) |
printf("\\&"); |
printf("\\&"); |
printf("%.*s ", (int)(i - *start), &buf[*start]); |
printf("%.*s", (int)(i - *start), &buf[*start]); |
*start = i; |
*start = i; |
|
|
if (' ' == buf[i]) { |
if (' ' == buf[i]) { |
|
|
*start = i; |
*start = i; |
goto again; |
goto again; |
} |
} |
printf("Ar "); |
fputs("Ar", stdout); |
*start = i; |
*start = i; |
} |
} |
} |
} |
|
|
formatcode(struct state *st, const char *buf, size_t *start, |
formatcode(struct state *st, const char *buf, size_t *start, |
size_t end, int nomacro, int pos) |
size_t end, int nomacro, int pos) |
{ |
{ |
enum fmt fmt; |
|
size_t i, j, dsz; |
size_t i, j, dsz; |
|
enum fmt fmt; |
|
unsigned char uc; |
|
int gotmacro, wantws; |
|
|
assert(*start + 1 < end); |
assert(*start + 1 < end); |
assert('<' == buf[*start + 1]); |
assert('<' == buf[*start + 1]); |
Line 553 formatcode(struct state *st, const char *buf, size_t * |
|
Line 599 formatcode(struct state *st, const char *buf, size_t * |
|
if (FMT__MAX != fmt && !nomacro) { |
if (FMT__MAX != fmt && !nomacro) { |
|
|
/* |
/* |
|
* Do we need spacing before the upcoming macro, |
|
* after any pending text already in the outbuf? |
* We may already have wantws if there was whitespace |
* We may already have wantws if there was whitespace |
* before the code ("text B<text"), but initial |
* before the code ("text B<text"), or there may be |
* whitespace inside our scope ("textB< text") |
* whitespace inside our scope ("textB< text"). |
* allows to break at this point as well. |
|
*/ |
*/ |
|
|
st->wantws |= ' ' == buf[*start]; |
wantws = ' ' == buf[*start] || |
|
(st->wantws && ! st->outbuflen); |
|
|
/* |
/* |
* If we are on a text line and there is no |
* If we are on a text line and there is no |
* whitespace before our content, we have to make |
* whitespace before our content, we have to make |
* the previous word a prefix to the macro line. |
* the previous word a prefix to the macro line. |
* In the following, mdoc_newln() must not be used |
|
* lest we clobber our output state. |
|
*/ |
*/ |
|
|
if (OUST_MAC != st->oust && !st->wantws) { |
if (OUST_MAC != st->oust && ! wantws) { |
if (OUST_NL != st->oust) |
if (OUST_NL != st->oust) |
putchar('\n'); |
mdoc_newln(st); |
printf(".Pf "); |
fputs(".Pf", stdout); |
|
st->oust = OUST_MAC; |
|
st->wantws = wantws = 1; |
} |
} |
|
|
outbuf_flush(st); |
outbuf_flush(st); |
|
|
/* Whitespace is easier to suppress on macro lines. */ |
/* Whitespace is easier to suppress on macro lines. */ |
|
|
if (OUST_MAC == st->oust && !st->wantws) |
if (OUST_MAC == st->oust && ! wantws) |
printf(" Ns "); |
printf(" Ns"); |
|
|
/* Unless we are on a macro line, start one. */ |
/* Unless we are on a macro line, start one. */ |
|
|
if (OUST_MAC != st->oust && st->wantws) { |
if (OUST_MAC != st->oust) { |
if (OUST_NL != st->oust) |
if (OUST_NL != st->oust) |
putchar('\n'); |
mdoc_newln(st); |
putchar('.'); |
putchar('.'); |
|
st->oust = OUST_MAC; |
} else |
} else |
putchar(' '); |
putchar(' '); |
|
st->wantws = 1; |
|
|
/* |
/* |
* Print the macro corresponding to this format code, |
* Print the macro corresponding to this format code, |
Line 597 formatcode(struct state *st, const char *buf, size_t * |
|
Line 647 formatcode(struct state *st, const char *buf, size_t * |
|
*/ |
*/ |
|
|
switch (fmt) { |
switch (fmt) { |
case (FMT_ITALIC): |
|
printf("Em "); |
|
break; |
|
case (FMT_BOLD): |
case (FMT_BOLD): |
if (SECT_SYNOPSIS == st->sect) { |
if (SECT_SYNOPSIS == st->sect) { |
if (1 == dsz && '-' == buf[*start]) |
if (1 == dsz && '-' == buf[*start]) |
dosynopsisfl(buf, start, end); |
dosynopsisfl(buf, start, end); |
else if (0 == pos) |
else if (0 == pos) |
printf("Nm "); |
fputs("Nm", stdout); |
else |
else |
printf("Ar "); |
fputs("Ar", stdout); |
break; |
break; |
} |
} |
if (0 == strncmp(buf + *start, "NULL", 4) && |
/* FALLTHROUGH */ |
('=' == buf[*start + 4] || |
case (FMT_ITALIC): |
'>' == buf[*start + 4])) |
i = 0; |
printf("Dv "); |
uc = buf[*start]; |
else |
while (isalnum(uc) || '_' == uc || ' ' == uc) |
printf("Sy "); |
uc = buf[*start + ++i]; |
|
if ('=' != uc && '>' != uc) |
|
i = 0; |
|
if (4 == i && ! strncmp(buf + *start, "NULL", 4)) { |
|
fputs("Dv", stdout); |
|
break; |
|
} |
|
switch (i ? dict_get(buf + *start, i) : MDOC_MAX) { |
|
case MDOC_Fa: |
|
fputs("Fa", stdout); |
|
break; |
|
case MDOC_Vt: |
|
fputs("Vt", stdout); |
|
break; |
|
default: |
|
fputs(FMT_BOLD == fmt ? "Sy" : "Em", stdout); |
|
break; |
|
} |
break; |
break; |
case (FMT_CODE): |
case (FMT_CODE): |
printf("Qo Li "); |
fputs("Qo Li", stdout); |
break; |
break; |
case (FMT_LINK): |
case (FMT_LINK): |
/* Try to link; use "No" if it's empty. */ |
/* Try to link; use "No" if it's empty. */ |
if ( ! trylink(buf, start, end, dsz)) |
if ( ! trylink(buf, start, end, dsz)) |
printf("No "); |
fputs("No", stdout); |
break; |
break; |
case (FMT_FILE): |
case (FMT_FILE): |
printf("Pa "); |
fputs("Pa", stdout); |
break; |
break; |
case (FMT_NBSP): |
case (FMT_NBSP): |
printf("No "); |
fputs("No", stdout); |
break; |
break; |
default: |
default: |
abort(); |
abort(); |
} |
} |
st->oust = OUST_MAC; |
} else { |
st->wantws = 1; |
|
} else |
|
outbuf_flush(st); |
outbuf_flush(st); |
|
st->wantws = 0; |
|
} |
|
|
/* |
/* |
* Process until we reach the end marker (e.g., '>') or until we |
* Process until we reach the end marker (e.g., '>') or until we |
Line 645 formatcode(struct state *st, const char *buf, size_t * |
|
Line 709 formatcode(struct state *st, const char *buf, size_t * |
|
* Don't emit any newlines: since we're on a macro line, we |
* Don't emit any newlines: since we're on a macro line, we |
* don't want to break the line. |
* don't want to break the line. |
*/ |
*/ |
|
|
|
gotmacro = 0; |
while (*start < end) { |
while (*start < end) { |
if ('>' == buf[*start] && 1 == dsz) { |
if ('>' == buf[*start] && 1 == dsz) { |
(*start)++; |
(*start)++; |
Line 666 formatcode(struct state *st, const char *buf, size_t * |
|
Line 732 formatcode(struct state *st, const char *buf, size_t * |
|
break; |
break; |
} |
} |
} |
} |
if (*start + 1 < end && '<' == buf[*start + 1]) { |
if (*start + 1 < end && '<' == buf[*start + 1] && |
formatcode(st, buf, start, end, nomacro, 1); |
'A' <= buf[*start] && 'Z' >= buf[*start]) { |
|
gotmacro = formatcode(st, buf, |
|
start, end, nomacro, 1); |
continue; |
continue; |
} |
} |
|
|
/* Suppress newlines and multiple spaces. */ |
/* Suppress newlines and multiple spaces. */ |
|
|
last = buf[(*start)++]; |
last = buf[(*start)++]; |
if (' ' == last || '\n' == last) { |
if (isspace(last)) { |
putchar(' '); |
outbuf_flush(st); |
while (*start < end && ' ' == buf[*start]) |
st->wantws = 1; |
|
gotmacro = 0; |
|
while (*start < end && |
|
isspace((unsigned char)buf[*start])) |
(*start)++; |
(*start)++; |
continue; |
continue; |
} |
} |
|
|
if (OUST_MAC == st->oust && FMT__MAX != fmt) { |
if (OUST_MAC == st->oust && FMT__MAX != fmt) { |
if ( ! st->wantws) { |
if (gotmacro && ! st->wantws) { |
printf(" Ns "); |
printf(" Ns"); |
st->wantws = 1; |
st->wantws = 1; |
} |
} |
|
gotmacro = 0; |
|
|
/* |
/* |
* Escape macro-like words. |
* Escape macro-like words. |
* This matches "Xx " and "XxEOLN". |
* This matches "Xx " and "XxEOLN". |
*/ |
*/ |
|
|
if (end - *start > 0 && |
if (*start < end && ! st->outbuflen && |
isupper((unsigned char)last) && |
isupper(last) && |
islower((unsigned char)buf[*start]) && |
islower((unsigned char)buf[*start]) && |
(end - *start == 1 || |
(end - *start == 1 || |
' ' == buf[*start + 1] || |
' ' == buf[*start + 1] || |
'>' == buf[*start + 1])) |
'>' == buf[*start + 1])) |
printf("\\&"); |
outbuf_addstr(st, "\\&"); |
|
last = buf[*start - 1]; |
} |
} |
|
outbuf_addchar(st); |
putchar(last); |
|
|
|
/* Protect against character escapes. */ |
|
|
|
if ('\\' == last) |
|
putchar('e'); |
|
} |
} |
|
|
if (FMT__MAX == fmt) |
if (FMT__MAX == fmt) |
return(0); |
return(0); |
|
|
|
outbuf_flush(st); |
|
|
if ( ! nomacro && FMT_CODE == fmt) |
if ( ! nomacro && FMT_CODE == fmt) |
printf(" Qc "); |
fputs(" Qc", stdout); |
|
|
st->wantws = ' ' == last; |
st->wantws = ' ' == last; |
return(1); |
return(1); |
|
|
formatcodeln(struct state *st, const char *linemac, |
formatcodeln(struct state *st, const char *linemac, |
const char *buf, size_t *start, size_t end, int nomacro) |
const char *buf, size_t *start, size_t end, int nomacro) |
{ |
{ |
int gotmacro, wantws; |
int gotmacro; |
|
|
assert(OUST_NL == st->oust); |
assert(OUST_NL == st->oust); |
assert(st->wantws); |
assert(st->wantws); |
printf(".%s ", linemac); |
printf(".%s", linemac); |
st->oust = OUST_MAC; |
st->oust = OUST_MAC; |
|
|
gotmacro = 0; |
gotmacro = 0; |
while (*start < end) { |
while (*start < end) { |
wantws = ' ' == buf[*start] || '\n' == buf[*start]; |
if (*start + 1 < end && '<' == buf[*start + 1] && |
if (wantws) { |
'A' <= buf[*start] && 'Z' >= buf[*start]) { |
last = ' '; |
|
do { |
|
(*start)++; |
|
} while (*start < end && ' ' == buf[*start]); |
|
} |
|
|
|
if (*start + 1 < end && '<' == buf[*start + 1]) { |
|
st->wantws |= wantws; |
|
gotmacro = formatcode(st, buf, |
gotmacro = formatcode(st, buf, |
start, end, nomacro, 1); |
start, end, nomacro, 1); |
continue; |
continue; |
} |
} |
|
|
|
/* Suppress newlines and multiple spaces. */ |
|
|
|
last = buf[(*start)++]; |
|
if (isspace(last)) { |
|
outbuf_flush(st); |
|
st->wantws = 1; |
|
while (*start < end && |
|
isspace((unsigned char)buf[*start])) |
|
(*start)++; |
|
continue; |
|
} |
|
|
if (gotmacro) { |
if (gotmacro) { |
if (*start < end || st->outbuflen) { |
if (*start < end) { |
if (st->wantws || |
if (st->wantws) |
(wantws && !st->outbuflen)) |
printf(" No"); |
printf(" No "); |
|
else |
else |
printf(" Ns "); |
printf(" Ns"); |
} |
} |
|
st->wantws = 1; |
gotmacro = 0; |
gotmacro = 0; |
} |
} |
outbuf_flush(st); |
|
st->wantws = wantws; |
|
|
|
if (*start >= end) |
|
break; |
|
|
|
if (st->wantws) { |
|
putchar(' '); |
|
st->wantws = 0; |
|
} |
|
|
|
/* |
/* |
* Since we're already on a macro line, we want to make |
* Since we're already on a macro line, we want to make |
* sure that we don't inadvertently invoke a macro. |
* sure that we don't inadvertently invoke a macro. |
Line 781 formatcodeln(struct state *st, const char *linemac, |
|
Line 844 formatcodeln(struct state *st, const char *linemac, |
|
* are used in troff and we don't want to escape |
* are used in troff and we don't want to escape |
* something that needn't be escaped. |
* something that needn't be escaped. |
*/ |
*/ |
if (' ' == last && end - *start > 1 && |
if (*start < end && ! st->outbuflen && isupper(last) && |
isupper((unsigned char)buf[*start]) && |
islower((unsigned char)buf[*start]) && |
islower((unsigned char)buf[*start + 1]) && |
(end - *start == 1 || ' ' == buf[*start + 1])) { |
(end - *start == 2 || ' ' == buf[*start + 2])) |
outbuf_addstr(st, "\\&"); |
printf("\\&"); |
last = buf[*start - 1]; |
|
} |
putchar(last = buf[*start]); |
outbuf_addchar(st); |
|
|
/* Protect against character escapes. */ |
|
|
|
if ('\\' == last) |
|
putchar('e'); |
|
|
|
(*start)++; |
|
} |
} |
|
outbuf_flush(st); |
|
st->wantws = 1; |
} |
} |
|
|
/* |
/* |
Line 1001 command(struct state *st, const char *buf, size_t star |
|
Line 1059 command(struct state *st, const char *buf, size_t star |
|
} |
} |
|
|
/* |
/* |
|
* Put the type provided as an argument into the dictionary. |
|
*/ |
|
static void |
|
register_type(const char *ptype) |
|
{ |
|
const char *pname, *pend; |
|
|
|
pname = ptype; |
|
while (isalnum((unsigned char)*pname) || '_' == *pname) |
|
pname++; |
|
if ((pname - ptype == 6 && ! strncmp(ptype, "struct", 6)) || |
|
(pname - ptype == 4 && ! strncmp(ptype, "enum", 4))) { |
|
while (' ' == *pname) |
|
pname++; |
|
pend = pname; |
|
while (isalnum((unsigned char)*pend) || '_' == *pend) |
|
pend++; |
|
if (pend > pname) |
|
dict_put(pname, pend - pname, MDOC_Vt); |
|
} else |
|
pend = pname; |
|
if (pend > ptype) |
|
dict_put(ptype, pend - ptype, MDOC_Vt); |
|
} |
|
|
|
/* |
* Just pump out the line in a verbatim block. |
* Just pump out the line in a verbatim block. |
* From the perspective of external callers, |
* From the perspective of external callers, |
* always stays in OUST_NL/wantws mode. |
* always stays in OUST_NL/wantws mode. |
*/ |
*/ |
static void |
static void |
verbatim(struct state *st, const char *buf, size_t start, size_t end) |
verbatim(struct state *st, char *buf, size_t start, size_t end) |
{ |
{ |
size_t i; |
size_t i, ift, ifo, ifa, ifc, inl; |
|
char *cp, *cp2; |
|
int indisplay, nopen, wantsp; |
|
|
if ( ! st->parsing || st->paused) |
if (st->paused || ! st->parsing) |
return; |
return; |
|
|
|
indisplay = wantsp = 0; |
|
|
again: |
again: |
|
if (start == end) { |
|
if (indisplay) |
|
puts(".Ed"); |
|
return; |
|
} |
|
|
|
if ('\n' == buf[start]) { |
|
wantsp = 1; |
|
start++; |
|
goto again; |
|
} |
|
|
/* |
/* |
* If we're in the SYNOPSIS, see if we're an #include block. |
* If we're in the SYNOPSIS, see if we're an #include block. |
* If we are, then print the "In" macro and re-loop. |
* If we are, then print the "In" macro and re-loop. |
|
|
*/ |
*/ |
if (SECT_SYNOPSIS == st->sect) { |
if (SECT_SYNOPSIS == st->sect) { |
i = start; |
i = start; |
for (i = start; i < end && ' ' == buf[i]; i++) |
while (i < end && buf[i] == ' ') |
/* Spin. */ ; |
i++; |
if (i == end) |
if (i == end) |
return; |
goto again; |
|
|
/* We're an include block! */ |
/* We're an include block! */ |
if (end - i > 10 && |
if (end - i > 10 && |
0 == memcmp(&buf[i], "#include <", 10)) { |
0 == memcmp(&buf[i], "#include <", 10)) { |
start = i + 10; |
start = i + 10; |
while (start < end && ' ' == buf[start]) |
while (start < end && ' ' == buf[start]) |
start++; |
start++; |
|
if (indisplay) |
|
puts(".Ed"); |
|
indisplay = wantsp = 0; |
fputs(".In ", stdout); |
fputs(".In ", stdout); |
/* Stop til the '>' marker or we hit eoln. */ |
/* Stop til the '>' marker or we hit eoln. */ |
while (start < end && |
while (start < end && |
|
|
start++; |
start++; |
if (start < end && '\n' == buf[start]) |
if (start < end && '\n' == buf[start]) |
start++; |
start++; |
if (start < end) |
goto again; |
|
} |
|
|
|
/* Other preprocessor directives. */ |
|
if ('#' == buf[i]) { |
|
if (indisplay) |
|
puts(".Ed"); |
|
indisplay = wantsp = 0; |
|
fputs(".Fd ", stdout); |
|
start = i; |
|
while(start < end && '\n' != buf[start]) |
|
putchar(buf[start++]); |
|
putchar('\n'); |
|
if (start < end && '\n' == buf[start]) |
|
start++; |
|
|
|
/* Remember #define for Dv or Fn. */ |
|
|
|
if (strncmp(buf + i + 1, "define", 6) || |
|
! isspace((unsigned char)buf[i + 7])) |
goto again; |
goto again; |
return; |
|
|
ifo = i + 7; |
|
while (ifo < start && |
|
isspace((unsigned char)buf[ifo])) |
|
ifo++; |
|
ifa = ifo; |
|
while ('_' == buf[ifa] || |
|
isalnum((unsigned char)buf[ifa])) |
|
ifa++; |
|
dict_put(buf + ifo, ifa - ifo, |
|
'(' == buf[ifa] ? MDOC_Fo : MDOC_Dv); |
|
|
|
goto again; |
} |
} |
|
|
|
/* Parse function declaration. */ |
|
ifo = ifa = ifc = 0; |
|
inl = end; |
|
nopen = 0; |
|
for (ift = i; i < end; i++) { |
|
if (ifc) { |
|
if (buf[i] != '\n') |
|
continue; |
|
inl = i; |
|
break; |
|
} |
|
switch (buf[i]) { |
|
case '\t': |
|
/* FALLTHROUGH */ |
|
case ' ': |
|
if ( ! ifa) |
|
ifo = i; |
|
break; |
|
case '(': |
|
if (ifo) { |
|
nopen++; |
|
if ( ! ifa) |
|
ifa = i; |
|
} else |
|
i = end; |
|
break; |
|
case ')': |
|
switch (nopen) { |
|
case 0: |
|
i = end; |
|
break; |
|
case 1: |
|
ifc = i; |
|
break; |
|
default: |
|
nopen--; |
|
break; |
|
} |
|
break; |
|
default: |
|
break; |
|
} |
|
} |
|
|
|
/* Encode function declaration. */ |
|
if (ifc) { |
|
for (i = ifa; i < ifc; i++) |
|
if (buf[i] == '\n') |
|
buf[i] = ' '; |
|
buf[ifo++] = '\0'; |
|
register_type(buf + ift); |
|
if (indisplay) |
|
puts(".Ed"); |
|
indisplay = wantsp = 0; |
|
printf(".Ft %s", buf + ift); |
|
if (buf[ifo] == '*') { |
|
fputs(" *", stdout); |
|
ifo++; |
|
} |
|
putchar('\n'); |
|
buf[ifa++] = '\0'; |
|
printf(".Fo %s\n", buf + ifo); |
|
dict_put(buf + ifo, 0, MDOC_Fo); |
|
buf[ifc++] = '\0'; |
|
for (;;) { |
|
cp = strchr(buf + ifa, ','); |
|
if (cp != NULL) { |
|
cp2 = cp; |
|
*cp++ = '\0'; |
|
} else |
|
cp2 = strchr(buf + ifa, '\0'); |
|
while (isalnum((unsigned char)cp2[-1]) || |
|
'_' == cp2[-1]) |
|
cp2--; |
|
if ('\0' != *cp2) |
|
dict_put(cp2, 0, MDOC_Fa); |
|
register_type(buf + ifa); |
|
if (strchr(buf + ifa, ' ') == NULL) |
|
printf(".Fa %s\n", buf + ifa); |
|
else |
|
printf(".Fa \"%s\"\n", buf + ifa); |
|
if (cp == NULL) |
|
break; |
|
while (*cp == ' ' || *cp == '\t') |
|
cp++; |
|
ifa = cp - buf; |
|
} |
|
puts(".Fc"); |
|
if (buf[ifc] == ';') |
|
ifc++; |
|
if (ifc < inl) { |
|
buf[inl] = '\0'; |
|
puts(buf + ifc); |
|
} |
|
start = inl < end ? inl + 1 : end; |
|
goto again; |
|
} |
} |
} |
|
|
if (start == end) |
if ( ! indisplay) |
return; |
puts(".Bd -literal"); |
puts(".Bd -literal"); |
else if (wantsp) |
for (last = ' '; start < end; start++) { |
putchar('\n'); |
|
indisplay = 1; |
|
wantsp = 0; |
|
|
|
for (last = '\n'; start < end; start++) { |
/* |
/* |
* Handle accidental macros (newline starting with |
* Handle accidental macros (newline starting with |
* control character) and escapes. |
* control character) and escapes. |
*/ |
*/ |
if ('\n' == last) |
if ('\n' == last) { |
|
if ('\n' == buf[start]) |
|
goto again; |
if ('.' == buf[start] || '\'' == buf[start]) |
if ('.' == buf[start] || '\'' == buf[start]) |
printf("\\&"); |
printf("\\&"); |
|
} |
putchar(last = buf[start]); |
putchar(last = buf[start]); |
if ('\\' == buf[start]) |
if ('\\' == buf[start]) |
printf("e"); |
printf("e"); |
} |
} |
putchar(last = '\n'); |
if ('\n' != last) |
puts(".Ed"); |
putchar('\n'); |
|
if (indisplay) |
|
puts(".Ed"); |
} |
} |
|
|
/* |
/* |
Line 1133 donamenm(struct state *st, const char *buf, size_t *st |
|
Line 1376 donamenm(struct state *st, const char *buf, size_t *st |
|
assert(OUST_NL == st->oust); |
assert(OUST_NL == st->oust); |
assert(st->wantws); |
assert(st->wantws); |
|
|
while (*start < end && ' ' == buf[*start]) |
while (*start < end && isspace((unsigned char)buf[*start])) |
(*start)++; |
(*start)++; |
|
|
if (end == *start) { |
if (end == *start) { |
Line 1154 donamenm(struct state *st, const char *buf, size_t *st |
|
Line 1397 donamenm(struct state *st, const char *buf, size_t *st |
|
printf(" ,"); |
printf(" ,"); |
mdoc_newln(st); |
mdoc_newln(st); |
(*start)++; |
(*start)++; |
while (*start < end && ' ' == buf[*start]) |
while (*start < end && isspace((unsigned char)buf[*start])) |
(*start)++; |
(*start)++; |
} |
} |
} |
} |
Line 1169 donamenm(struct state *st, const char *buf, size_t *st |
|
Line 1412 donamenm(struct state *st, const char *buf, size_t *st |
|
* |
* |
* Uses formatcode() to go to OUST_MAC mode |
* Uses formatcode() to go to OUST_MAC mode |
* and outbuf_flush() to go to OUST_TXT mode. |
* and outbuf_flush() to go to OUST_TXT mode. |
* Main text mode wantws handling is in this function. |
* In text mode, wantws requests white space before the text |
|
* currently contained in the outbuf, not before upcoming text. |
* Must make sure to go back to OUST_NL/wantws mode before returning. |
* Must make sure to go back to OUST_NL/wantws mode before returning. |
*/ |
*/ |
static void |
static void |
ordinary(struct state *st, const char *buf, size_t start, size_t end) |
ordinary(struct state *st, const char *buf, size_t start, size_t end) |
{ |
{ |
size_t i, j, opstack; |
size_t i, j, opstack, wend; |
int seq; |
enum mdoc_type mtype; |
|
int eos, noeos, seq; |
|
char savechar; |
|
|
if ( ! st->parsing || st->paused) |
if ( ! st->parsing || st->paused) |
return; |
return; |
Line 1189 ordinary(struct state *st, const char *buf, size_t sta |
|
Line 1435 ordinary(struct state *st, const char *buf, size_t sta |
|
*/ |
*/ |
if (SECT_NAME == st->sect) { |
if (SECT_NAME == st->sect) { |
for (i = end - 2; i > start; i--) |
for (i = end - 2; i > start; i--) |
if ('-' == buf[i] && ' ' == buf[i + 1]) |
if ('-' == buf[i] && |
|
isspace((unsigned char)buf[i + 1])) |
break; |
break; |
if ('-' == buf[i]) { |
if ('-' == buf[i]) { |
j = i; |
j = i; |
Line 1199 ordinary(struct state *st, const char *buf, size_t sta |
|
Line 1446 ordinary(struct state *st, const char *buf, size_t sta |
|
break; |
break; |
donamenm(st, buf, &start, i + 1); |
donamenm(st, buf, &start, i + 1); |
start = j + 1; |
start = j + 1; |
while (start < end && ' ' == buf[start]) |
while (start < end && |
|
isspace((unsigned char)buf[start])) |
start++; |
start++; |
|
while (start < end && '.' == buf[end - 1]) |
|
end--; |
formatcodeln(st, "Nd", buf, &start, end, 1); |
formatcodeln(st, "Nd", buf, &start, end, 1); |
mdoc_newln(st); |
mdoc_newln(st); |
return; |
return; |
Line 1220 ordinary(struct state *st, const char *buf, size_t sta |
|
Line 1470 ordinary(struct state *st, const char *buf, size_t sta |
|
* Escape initial control characters. |
* Escape initial control characters. |
*/ |
*/ |
while (start < end) { |
while (start < end) { |
if (start < end - 1 && '<' == buf[start + 1]) |
if (start < end - 1 && '<' == buf[start + 1] && |
|
'A' <= buf[start] && 'Z' >= buf[start]) |
break; |
break; |
else if ('\n' == buf[start]) |
else if ('\n' == buf[start]) |
break; |
break; |
Line 1241 ordinary(struct state *st, const char *buf, size_t sta |
|
Line 1492 ordinary(struct state *st, const char *buf, size_t sta |
|
&start, end, &opstack)) |
&start, end, &opstack)) |
continue; |
continue; |
|
|
|
/* Merely buffer non-whitespace. */ |
|
|
|
last = buf[start++]; |
|
if ( ! isspace(last)) |
|
outbuf_addchar(st); |
|
if (start < end && |
|
! isspace((unsigned char)buf[start - 1]) && |
|
! isspace((unsigned char)buf[start])) |
|
continue; |
|
|
/* |
/* |
|
* Found the end of a word. |
|
* Rewind trailing delimiters. |
|
*/ |
|
|
|
eos = noeos = 0; |
|
for (wend = st->outbuflen; wend; wend--) |
|
if ('.' == st->outbuf[wend - 1] || |
|
'!' == st->outbuf[wend - 1] || |
|
'?' == st->outbuf[wend - 1]) |
|
eos = 1; |
|
else if ('|' == st->outbuf[wend - 1] || |
|
',' == st->outbuf[wend - 1] || |
|
';' == st->outbuf[wend - 1] || |
|
':' == st->outbuf[wend - 1]) |
|
noeos = 1; |
|
else if ('\'' != st->outbuf[wend - 1] && |
|
'"' != st->outbuf[wend - 1] && |
|
')' != st->outbuf[wend - 1] && |
|
']' != st->outbuf[wend - 1]) |
|
break; |
|
eos &= ! noeos; |
|
|
|
/* |
|
* Detect function names. |
|
*/ |
|
|
|
mtype = MDOC_Fa; |
|
savechar = '\0'; |
|
if (wend && ')' == st->outbuf[wend] && |
|
'(' == st->outbuf[wend - 1]) { |
|
mtype = dict_get(st->outbuf, --wend); |
|
if (MDOC_Dv == mtype) |
|
mtype = MDOC_Fo; |
|
if (MDOC_Fo == mtype || MDOC_MAX == mtype) { |
|
st->outbuflen = wend; |
|
st->outbuf[wend] = '\0'; |
|
mdoc_newln(st); |
|
if (MDOC_Fo == mtype) |
|
fputs(".Fn", stdout); |
|
else |
|
fputs(".Xr", stdout); |
|
st->oust = OUST_MAC; |
|
} |
|
} else { |
|
mtype = dict_get(st->outbuf, wend); |
|
if (MDOC_Dv == mtype) { |
|
savechar = st->outbuf[wend]; |
|
st->outbuf[wend] = '\0'; |
|
mdoc_newln(st); |
|
fputs(".Dv", stdout); |
|
st->oust = OUST_MAC; |
|
} else |
|
mtype = MDOC_Fa; |
|
} |
|
|
|
/* |
* On whitespace, flush the output buffer |
* On whitespace, flush the output buffer |
* and allow breaking to a macro line. |
* and allow breaking to a macro line. |
* Otherwise, buffer text and clear wantws. |
|
*/ |
*/ |
|
|
last = buf[start++]; |
outbuf_flush(st); |
if (' ' == last) { |
|
outbuf_flush(st); |
/* |
putchar(' '); |
* End macro lines, and |
st->wantws = 1; |
* end text lines at the end of sentences. |
} else |
*/ |
outbuf_addchar(st); |
|
|
if (OUST_MAC == st->oust || (eos && wend > 1 && |
|
islower((unsigned char)st->outbuf[wend - 1]))) { |
|
if (MDOC_MAX == mtype) |
|
fputs(" 3", stdout); |
|
if (MDOC_Fa != mtype) { |
|
if (MDOC_Dv == mtype) |
|
st->outbuf[wend] = savechar; |
|
else |
|
wend += 2; |
|
while ('\0' != st->outbuf[wend]) |
|
printf(" %c", |
|
st->outbuf[wend++]); |
|
} |
|
mdoc_newln(st); |
|
} |
|
|
|
/* Advance to the next word. */ |
|
|
|
while ('\n' != buf[start] && |
|
isspace((unsigned char)buf[start])) |
|
start++; |
|
st->wantws = 1; |
} |
} |
|
|
if (start < end - 1 && '<' == buf[start + 1]) { |
if (start < end - 1 && '<' == buf[start + 1] && |
|
'A' <= buf[start] && 'Z' >= buf[start]) { |
formatcode(st, buf, &start, end, 0, seq); |
formatcode(st, buf, &start, end, 0, seq); |
if (OUST_MAC == st->oust) { |
if (OUST_MAC == st->oust) { |
/* |
/* |
Line 1264 ordinary(struct state *st, const char *buf, size_t sta |
|
Line 1603 ordinary(struct state *st, const char *buf, size_t sta |
|
* XXX Some punctuation characters |
* XXX Some punctuation characters |
* are not handled yet. |
* are not handled yet. |
*/ |
*/ |
if ((start == end - 1 || |
if ((start == end - 1 || |
(start < end - 1 && |
(start < end - 1 && |
(' ' == buf[start + 1] || |
(' ' == buf[start + 1] || |
'\n' == buf[start + 1]))) && |
'\n' == buf[start + 1]))) && |
('.' == buf[start] || |
NULL != strchr("|.,;:?!)]", buf[start])) { |
',' == buf[start])) { |
|
putchar(' '); |
putchar(' '); |
putchar(buf[start++]); |
putchar(buf[start++]); |
} |
} |
Line 1294 ordinary(struct state *st, const char *buf, size_t sta |
|
Line 1632 ordinary(struct state *st, const char *buf, size_t sta |
|
*/ |
*/ |
|
|
if ( ! st->wantws && start < end && |
if ( ! st->wantws && start < end && |
'<' != buf[start + 1]) { |
('<' != buf[start + 1] || |
printf(" Ns "); |
'A' > buf[start] || |
|
'Z' < buf[start])) { |
|
fputs(" Ns", stdout); |
st->wantws = 1; |
st->wantws = 1; |
} |
} |
} |
} |
} else if (start < end && '\n' == buf[start]) { |
} else if (start < end && '\n' == buf[start]) { |
outbuf_flush(st); |
outbuf_flush(st); |
mdoc_newln(st); |
st->wantws = 1; |
if (++start >= end) |
if (++start >= end) |
continue; |
continue; |
/* |
/* |
Line 1312 ordinary(struct state *st, const char *buf, size_t sta |
|
Line 1652 ordinary(struct state *st, const char *buf, size_t sta |
|
* have a macro subsequent it, which may be |
* have a macro subsequent it, which may be |
* possible if we have an escape next. |
* possible if we have an escape next. |
*/ |
*/ |
if (' ' == buf[start] || '\t' == buf[start]) |
if (' ' == buf[start] || '\t' == buf[start]) { |
|
mdoc_newln(st); |
puts(".br"); |
puts(".br"); |
|
} |
for ( ; start < end; start++) |
for ( ; start < end; start++) |
if (' ' != buf[start] && '\t' != buf[start]) |
if (' ' != buf[start] && '\t' != buf[start]) |
break; |
break; |
Line 1329 ordinary(struct state *st, const char *buf, size_t sta |
|
Line 1671 ordinary(struct state *st, const char *buf, size_t sta |
|
* (default: starts with "="). |
* (default: starts with "="). |
*/ |
*/ |
static void |
static void |
dopar(struct state *st, const char *buf, size_t start, size_t end) |
dopar(struct state *st, char *buf, size_t start, size_t end) |
{ |
{ |
|
|
assert(OUST_NL == st->oust); |
assert(OUST_NL == st->oust); |
Line 1351 dopar(struct state *st, const char *buf, size_t start, |
|
Line 1693 dopar(struct state *st, const char *buf, size_t start, |
|
*/ |
*/ |
static void |
static void |
dofile(const struct args *args, const char *fname, |
dofile(const struct args *args, const char *fname, |
const struct tm *tm, const char *buf, size_t sz) |
const struct tm *tm, char *buf, size_t sz) |
{ |
{ |
char datebuf[64]; |
char datebuf[64]; |
struct state st; |
struct state st; |
const char *fbase, *fext, *section, *date; |
const char *fbase, *fext, *section, *date, *format; |
char *title, *cp; |
char *title, *cp; |
size_t sup, end, i, cur = 0; |
size_t cur, end; |
|
int verb; |
|
|
if (0 == sz) |
if (0 == sz) |
return; |
return; |
Line 1400 dofile(const struct args *args, const char *fname, |
|
Line 1743 dofile(const struct args *args, const char *fname, |
|
|
|
/* Date. Or the given "tm" if not supplied. */ |
/* Date. Or the given "tm" if not supplied. */ |
|
|
if (NULL == (date = args->date)) { |
date = args->date; |
strftime(datebuf, sizeof(datebuf), "%B %d, %Y", tm); |
format = (NULL == date) ? "%B %d, %Y" : |
|
strcmp(date, "Mdocdate") ? NULL : "$" "Mdocdate: %B %d %Y $"; |
|
|
|
if (NULL != format) { |
|
strftime(datebuf, sizeof(datebuf), format, tm); |
date = datebuf; |
date = datebuf; |
} |
} |
|
|
Line 1416 dofile(const struct args *args, const char *fname, |
|
Line 1763 dofile(const struct args *args, const char *fname, |
|
|
|
free(title); |
free(title); |
|
|
|
dict_init(); |
memset(&st, 0, sizeof(struct state)); |
memset(&st, 0, sizeof(struct state)); |
st.oust = OUST_NL; |
st.oust = OUST_NL; |
st.wantws = 1; |
st.wantws = 1; |
Line 1424 dofile(const struct args *args, const char *fname, |
|
Line 1772 dofile(const struct args *args, const char *fname, |
|
|
|
/* Main loop over file contents. */ |
/* Main loop over file contents. */ |
|
|
while (cur < sz) { |
cur = 0; |
|
for (;;) { |
|
while (cur < sz && '\n' == buf[cur]) |
|
cur++; |
|
if (cur >= sz) |
|
break; |
|
|
|
verb = isspace((unsigned char)buf[cur]); |
|
|
/* Read until next paragraph. */ |
/* Read until next paragraph. */ |
for (i = cur + 1; i < sz; i++) |
|
if ('\n' == buf[i] && '\n' == buf[i - 1]) { |
for (end = cur + 1; end + 1 < sz; end++) |
/* Consume blank paragraphs. */ |
if ('\n' == buf[end] && '\n' == buf[end + 1] && |
while (i + 1 < sz && '\n' == buf[i + 1]) |
!(verb && end + 2 < sz && |
i++; |
isspace((unsigned char)buf[end + 2]))) |
break; |
break; |
} |
|
|
|
/* Adjust end marker for EOF. */ |
/* Adjust end marker for EOF. */ |
end = i < sz ? i - 1 : |
|
('\n' == buf[sz - 1] ? sz - 1 : sz); |
|
sup = i < sz ? end + 2 : sz; |
|
|
|
|
if (end < sz && '\n' != buf[end]) |
|
end++; |
|
|
/* Process paragraph and adjust start. */ |
/* Process paragraph and adjust start. */ |
|
|
dopar(&st, buf, cur, end); |
dopar(&st, buf, cur, end); |
cur = sup; |
cur = end + 2; |
} |
} |
|
dict_destroy(); |
} |
} |
|
|
/* |
/* |