version 1.2, 2009/07/12 09:48:00 |
version 1.30, 2010/08/24 12:18:48 |
|
|
/* $Id$ */ |
/* $Id$ */ |
/* |
/* |
* Copyright (c) 2008, 2009 Kristaps Dzonsons <kristaps@kth.se> |
* Copyright (c) 2008, 2009, 2010 Kristaps Dzonsons <kristaps@bsd.lv> |
* |
* |
* Permission to use, copy, modify, and distribute this software for any |
* Permission to use, copy, modify, and distribute this software for any |
* purpose with or without fee is hereby granted, provided that the above |
* purpose with or without fee is hereby granted, provided that the above |
|
|
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF |
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF |
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
*/ |
*/ |
|
#ifdef HAVE_CONFIG_H |
|
#include "config.h" |
|
#endif |
|
|
#include <sys/types.h> |
#include <sys/types.h> |
|
|
#include <assert.h> |
#include <assert.h> |
#include <ctype.h> |
#include <ctype.h> |
#include <stdlib.h> |
#include <stdlib.h> |
|
#include <stdio.h> |
|
#include <string.h> |
|
#include <time.h> |
|
|
|
#include "mandoc.h" |
#include "libmandoc.h" |
#include "libmandoc.h" |
|
|
|
static int a2time(time_t *, const char *, const char *); |
|
|
|
|
int |
int |
mandoc_special(const char *p) |
mandoc_special(char *p) |
{ |
{ |
int c; |
int len, i; |
|
char term; |
|
char *sv; |
|
|
if ('\\' != *p++) |
len = 0; |
return(0); |
term = '\0'; |
|
sv = p; |
|
|
switch (*p) { |
assert('\\' == *p); |
case ('\\'): |
p++; |
|
|
|
switch (*p++) { |
|
#if 0 |
|
case ('Z'): |
/* FALLTHROUGH */ |
/* FALLTHROUGH */ |
case ('\''): |
case ('X'): |
/* FALLTHROUGH */ |
/* FALLTHROUGH */ |
case ('`'): |
case ('x'): |
/* FALLTHROUGH */ |
/* FALLTHROUGH */ |
case ('q'): |
case ('w'): |
/* FALLTHROUGH */ |
/* FALLTHROUGH */ |
case ('-'): |
case ('S'): |
/* FALLTHROUGH */ |
/* FALLTHROUGH */ |
case ('~'): |
case ('R'): |
/* FALLTHROUGH */ |
/* FALLTHROUGH */ |
case ('^'): |
case ('o'): |
/* FALLTHROUGH */ |
/* FALLTHROUGH */ |
case ('%'): |
case ('N'): |
/* FALLTHROUGH */ |
/* FALLTHROUGH */ |
case ('0'): |
case ('l'): |
/* FALLTHROUGH */ |
/* FALLTHROUGH */ |
case (' '): |
case ('L'): |
/* FALLTHROUGH */ |
/* FALLTHROUGH */ |
case ('|'): |
case ('H'): |
/* FALLTHROUGH */ |
/* FALLTHROUGH */ |
case ('&'): |
case ('h'): |
/* FALLTHROUGH */ |
/* FALLTHROUGH */ |
case ('.'): |
case ('D'): |
/* FALLTHROUGH */ |
/* FALLTHROUGH */ |
case (':'): |
case ('C'): |
/* FALLTHROUGH */ |
/* FALLTHROUGH */ |
case ('e'): |
case ('b'): |
return(2); |
/* FALLTHROUGH */ |
case ('f'): |
case ('B'): |
if (0 == *++p || ! isgraph((u_char)*p)) |
/* FALLTHROUGH */ |
|
case ('a'): |
|
/* FALLTHROUGH */ |
|
case ('A'): |
|
if (*p++ != '\'') |
return(0); |
return(0); |
return(3); |
term = '\''; |
case ('*'): |
break; |
if (0 == *++p || ! isgraph((u_char)*p)) |
#endif |
return(0); |
case ('h'): |
switch (*p) { |
/* FALLTHROUGH */ |
|
case ('v'): |
|
/* FALLTHROUGH */ |
|
case ('s'): |
|
if (ASCII_HYPH == *p) |
|
*p = '-'; |
|
|
|
i = 0; |
|
if ('+' == *p || '-' == *p) { |
|
p++; |
|
i = 1; |
|
} |
|
|
|
switch (*p++) { |
case ('('): |
case ('('): |
if (0 == *++p || ! isgraph((u_char)*p)) |
len = 2; |
|
break; |
|
case ('['): |
|
term = ']'; |
|
break; |
|
case ('\''): |
|
term = '\''; |
|
break; |
|
case ('0'): |
|
i = 1; |
|
/* FALLTHROUGH */ |
|
default: |
|
len = 1; |
|
p--; |
|
break; |
|
} |
|
|
|
if (ASCII_HYPH == *p) |
|
*p = '-'; |
|
if ('+' == *p || '-' == *p) { |
|
if (i) |
return(0); |
return(0); |
return(4); |
p++; |
|
} |
|
|
|
break; |
|
#if 0 |
|
case ('Y'): |
|
/* FALLTHROUGH */ |
|
case ('V'): |
|
/* FALLTHROUGH */ |
|
case ('$'): |
|
/* FALLTHROUGH */ |
|
case ('n'): |
|
/* FALLTHROUGH */ |
|
case ('k'): |
|
/* FALLTHROUGH */ |
|
#endif |
|
case ('M'): |
|
/* FALLTHROUGH */ |
|
case ('m'): |
|
/* FALLTHROUGH */ |
|
case ('f'): |
|
/* FALLTHROUGH */ |
|
case ('F'): |
|
/* FALLTHROUGH */ |
|
case ('*'): |
|
switch (*p++) { |
|
case ('('): |
|
len = 2; |
|
break; |
case ('['): |
case ('['): |
for (c = 3, p++; *p && ']' != *p; p++, c++) |
term = ']'; |
if ( ! isgraph((u_char)*p)) |
break; |
break; |
|
return(*p == ']' ? c : 0); |
|
default: |
default: |
|
len = 1; |
|
p--; |
break; |
break; |
} |
} |
return(3); |
break; |
case ('('): |
case ('('): |
if (0 == *++p || ! isgraph((u_char)*p)) |
len = 2; |
return(0); |
break; |
if (0 == *++p || ! isgraph((u_char)*p)) |
|
return(0); |
|
return(4); |
|
case ('['): |
case ('['): |
|
term = ']'; |
break; |
break; |
|
case ('z'): |
|
len = 1; |
|
if ('\\' == *p) { |
|
p += mandoc_special(p); |
|
return(*p ? (int)(p - sv) : 0); |
|
} |
|
break; |
default: |
default: |
return(0); |
len = 1; |
|
p--; |
|
break; |
} |
} |
|
|
for (c = 3, p++; *p && ']' != *p; p++, c++) |
if (term) { |
if ( ! isgraph((u_char)*p)) |
for ( ; *p && term != *p; p++) |
|
if (ASCII_HYPH == *p) |
|
*p = '-'; |
|
return(*p ? (int)(p - sv) : 0); |
|
} |
|
|
|
for (i = 0; *p && i < len; i++, p++) |
|
if (ASCII_HYPH == *p) |
|
*p = '-'; |
|
return(i == len ? (int)(p - sv) : 0); |
|
} |
|
|
|
|
|
void * |
|
mandoc_calloc(size_t num, size_t size) |
|
{ |
|
void *ptr; |
|
|
|
ptr = calloc(num, size); |
|
if (NULL == ptr) { |
|
perror(NULL); |
|
exit(MANDOCLEVEL_SYSERR); |
|
} |
|
|
|
return(ptr); |
|
} |
|
|
|
|
|
void * |
|
mandoc_malloc(size_t size) |
|
{ |
|
void *ptr; |
|
|
|
ptr = malloc(size); |
|
if (NULL == ptr) { |
|
perror(NULL); |
|
exit(MANDOCLEVEL_SYSERR); |
|
} |
|
|
|
return(ptr); |
|
} |
|
|
|
|
|
void * |
|
mandoc_realloc(void *ptr, size_t size) |
|
{ |
|
|
|
ptr = realloc(ptr, size); |
|
if (NULL == ptr) { |
|
perror(NULL); |
|
exit(MANDOCLEVEL_SYSERR); |
|
} |
|
|
|
return(ptr); |
|
} |
|
|
|
|
|
char * |
|
mandoc_strdup(const char *ptr) |
|
{ |
|
char *p; |
|
|
|
p = strdup(ptr); |
|
if (NULL == p) { |
|
perror(NULL); |
|
exit(MANDOCLEVEL_SYSERR); |
|
} |
|
|
|
return(p); |
|
} |
|
|
|
|
|
static int |
|
a2time(time_t *t, const char *fmt, const char *p) |
|
{ |
|
struct tm tm; |
|
char *pp; |
|
|
|
memset(&tm, 0, sizeof(struct tm)); |
|
|
|
pp = strptime(p, fmt, &tm); |
|
if (NULL != pp && '\0' == *pp) { |
|
*t = mktime(&tm); |
|
return(1); |
|
} |
|
|
|
return(0); |
|
} |
|
|
|
|
|
/* |
|
* Convert from a manual date string (see mdoc(7) and man(7)) into a |
|
* date according to the stipulated date type. |
|
*/ |
|
time_t |
|
mandoc_a2time(int flags, const char *p) |
|
{ |
|
time_t t; |
|
|
|
if (MTIME_MDOCDATE & flags) { |
|
if (0 == strcmp(p, "$" "Mdocdate$")) |
|
return(time(NULL)); |
|
if (a2time(&t, "$" "Mdocdate: %b %d %Y $", p)) |
|
return(t); |
|
} |
|
|
|
if (MTIME_CANONICAL & flags || MTIME_REDUCED & flags) |
|
if (a2time(&t, "%b %d, %Y", p)) |
|
return(t); |
|
|
|
if (MTIME_ISO_8601 & flags) |
|
if (a2time(&t, "%Y-%m-%d", p)) |
|
return(t); |
|
|
|
if (MTIME_REDUCED & flags) { |
|
if (a2time(&t, "%d, %Y", p)) |
|
return(t); |
|
if (a2time(&t, "%Y", p)) |
|
return(t); |
|
} |
|
|
|
return(0); |
|
} |
|
|
|
|
|
int |
|
mandoc_eos(const char *p, size_t sz, int enclosed) |
|
{ |
|
const char *q; |
|
int found; |
|
|
|
if (0 == sz) |
|
return(0); |
|
|
|
/* |
|
* End-of-sentence recognition must include situations where |
|
* some symbols, such as `)', allow prior EOS punctuation to |
|
* propogate outward. |
|
*/ |
|
|
|
found = 0; |
|
for (q = p + (int)sz - 1; q >= p; q--) { |
|
switch (*q) { |
|
case ('\"'): |
|
/* FALLTHROUGH */ |
|
case ('\''): |
|
/* FALLTHROUGH */ |
|
case (']'): |
|
/* FALLTHROUGH */ |
|
case (')'): |
|
if (0 == found) |
|
enclosed = 1; |
break; |
break; |
|
case ('.'): |
|
/* FALLTHROUGH */ |
|
case ('!'): |
|
/* FALLTHROUGH */ |
|
case ('?'): |
|
found = 1; |
|
break; |
|
default: |
|
return(found && (!enclosed || isalnum((unsigned char)*q))); |
|
} |
|
} |
|
|
return(*p == ']' ? c : 0); |
return(found && !enclosed); |
} |
} |
|
|
|
|
|
int |
|
mandoc_hyph(const char *start, const char *c) |
|
{ |
|
|
|
/* |
|
* Choose whether to break at a hyphenated character. We only |
|
* do this if it's free-standing within a word. |
|
*/ |
|
|
|
/* Skip first/last character of buffer. */ |
|
if (c == start || '\0' == *(c + 1)) |
|
return(0); |
|
/* Skip first/last character of word. */ |
|
if ('\t' == *(c + 1) || '\t' == *(c - 1)) |
|
return(0); |
|
if (' ' == *(c + 1) || ' ' == *(c - 1)) |
|
return(0); |
|
/* Skip double invocations. */ |
|
if ('-' == *(c + 1) || '-' == *(c - 1)) |
|
return(0); |
|
/* Skip escapes. */ |
|
if ('\\' == *(c - 1)) |
|
return(0); |
|
|
|
return(1); |
|
} |