version 1.11, 2011/11/24 12:54:19 |
version 1.135, 2014/04/13 22:03:04 |
|
|
/* $Id$ */ |
/* $Id$ */ |
/* |
/* |
* Copyright (c) 2011 Kristaps Dzonsons <kristaps@bsd.lv> |
* Copyright (c) 2011, 2012 Kristaps Dzonsons <kristaps@bsd.lv> |
|
* Copyright (c) 2011, 2012, 2013, 2014 Ingo Schwarze <schwarze@openbsd.org> |
* |
* |
* Permission to use, copy, modify, and distribute this software for any |
* Permission to use, copy, modify, and distribute this software for any |
* purpose with or without fee is hereby granted, provided that the above |
* purpose with or without fee is hereby granted, provided that the above |
|
|
#include "config.h" |
#include "config.h" |
#endif |
#endif |
|
|
#include <sys/param.h> |
#include <sys/stat.h> |
|
#include <sys/wait.h> |
|
|
#include <assert.h> |
#include <assert.h> |
#include <dirent.h> |
#include <ctype.h> |
|
#include <errno.h> |
#include <fcntl.h> |
#include <fcntl.h> |
|
#include <fts.h> |
#include <getopt.h> |
#include <getopt.h> |
|
#include <limits.h> |
|
#include <stddef.h> |
#include <stdio.h> |
#include <stdio.h> |
#include <stdint.h> |
#include <stdint.h> |
#include <stdlib.h> |
#include <stdlib.h> |
#include <string.h> |
#include <string.h> |
|
#include <unistd.h> |
|
|
#ifdef __linux__ |
#ifdef HAVE_OHASH |
# include <db_185.h> |
#include <ohash.h> |
#else |
#else |
# include <db.h> |
#include "compat_ohash.h" |
#endif |
#endif |
|
#include <sqlite3.h> |
|
|
#include "man.h" |
|
#include "mdoc.h" |
#include "mdoc.h" |
|
#include "man.h" |
#include "mandoc.h" |
#include "mandoc.h" |
#include "mandocdb.h" |
#include "mandoc_aux.h" |
#include "manpath.h" |
#include "manpath.h" |
|
#include "mansearch.h" |
|
|
#define MANDOC_BUFSZ BUFSIZ |
extern int mansearch_keymax; |
#define MANDOC_SLOP 1024 |
extern const char *const mansearch_keynames[]; |
|
|
/* Tiny list for files. No need to bring in QUEUE. */ |
#define SQL_EXEC(_v) \ |
|
if (SQLITE_OK != sqlite3_exec(db, (_v), NULL, NULL, NULL)) \ |
|
say("", "%s: %s", (_v), sqlite3_errmsg(db)) |
|
#define SQL_BIND_TEXT(_s, _i, _v) \ |
|
if (SQLITE_OK != sqlite3_bind_text \ |
|
((_s), (_i)++, (_v), -1, SQLITE_STATIC)) \ |
|
say(mlink->file, "%s", sqlite3_errmsg(db)) |
|
#define SQL_BIND_INT(_s, _i, _v) \ |
|
if (SQLITE_OK != sqlite3_bind_int \ |
|
((_s), (_i)++, (_v))) \ |
|
say(mlink->file, "%s", sqlite3_errmsg(db)) |
|
#define SQL_BIND_INT64(_s, _i, _v) \ |
|
if (SQLITE_OK != sqlite3_bind_int64 \ |
|
((_s), (_i)++, (_v))) \ |
|
say(mlink->file, "%s", sqlite3_errmsg(db)) |
|
#define SQL_STEP(_s) \ |
|
if (SQLITE_DONE != sqlite3_step((_s))) \ |
|
say(mlink->file, "%s", sqlite3_errmsg(db)) |
|
|
struct of { |
enum op { |
char *fname; /* heap-allocated */ |
OP_DEFAULT = 0, /* new dbs from dir list or default config */ |
struct of *next; /* NULL for last one */ |
OP_CONFFILE, /* new databases from custom config file */ |
struct of *first; /* first in list */ |
OP_UPDATE, /* delete/add entries in existing database */ |
|
OP_DELETE, /* delete entries from existing database */ |
|
OP_TEST /* change no databases, report potential problems */ |
}; |
}; |
|
|
/* Buffer for storing growable data. */ |
enum form { |
|
FORM_NONE, /* format is unknown */ |
|
FORM_SRC, /* format is -man or -mdoc */ |
|
FORM_CAT /* format is cat */ |
|
}; |
|
|
struct buf { |
struct str { |
char *cp; |
char *rendered; /* key in UTF-8 or ASCII form */ |
size_t len; /* current length */ |
const struct mpage *mpage; /* if set, the owning parse */ |
size_t size; /* total buffer size */ |
uint64_t mask; /* bitmask in sequence */ |
|
char key[]; /* may contain escape sequences */ |
}; |
}; |
|
|
/* Operation we're going to perform. */ |
struct inodev { |
|
ino_t st_ino; |
|
dev_t st_dev; |
|
}; |
|
|
enum op { |
struct mpage { |
OP_NEW = 0, /* new database */ |
struct inodev inodev; /* used for hashing routine */ |
OP_UPDATE, /* delete/add entries in existing database */ |
int64_t recno; /* id in mpages SQL table */ |
OP_DELETE /* delete entries from existing database */ |
enum form form; /* format from file content */ |
|
char *sec; /* section from file content */ |
|
char *arch; /* architecture from file content */ |
|
char *title; /* title from file content */ |
|
char *desc; /* description from file content */ |
|
struct mlink *mlinks; /* singly linked list */ |
}; |
}; |
|
|
#define MAN_ARGS DB *hash, \ |
struct mlink { |
struct buf *buf, \ |
char file[PATH_MAX]; /* filename rel. to manpath */ |
struct buf *dbuf, \ |
enum form dform; /* format from directory */ |
const struct man_node *n |
enum form fform; /* format from file name suffix */ |
#define MDOC_ARGS DB *hash, \ |
char *dsec; /* section from directory */ |
struct buf *buf, \ |
char *arch; /* architecture from directory */ |
struct buf *dbuf, \ |
char *name; /* name from file name (not empty) */ |
const struct mdoc_node *n, \ |
char *fsec; /* section from file name suffix */ |
const struct mdoc_meta *m |
struct mlink *next; /* singly linked list */ |
|
struct mpage *mpage; /* parent */ |
|
int gzip; /* filename has a .gz suffix */ |
|
}; |
|
|
static void buf_appendmdoc(struct buf *, |
enum stmt { |
const struct mdoc_node *, int); |
STMT_DELETE_PAGE = 0, /* delete mpage */ |
static void buf_append(struct buf *, const char *); |
STMT_INSERT_PAGE, /* insert mpage */ |
static void buf_appendb(struct buf *, |
STMT_INSERT_LINK, /* insert mlink */ |
const void *, size_t); |
STMT_INSERT_NAME, /* insert name */ |
static void dbt_put(DB *, const char *, DBT *, DBT *); |
STMT_INSERT_KEY, /* insert parsed key */ |
static void hash_put(DB *, const struct buf *, uint64_t); |
STMT__MAX |
static void hash_reset(DB **); |
}; |
static void index_merge(const struct of *, struct mparse *, |
|
struct buf *, struct buf *, |
|
DB *, DB *, const char *, |
|
DB *, const char *, int, |
|
recno_t, const recno_t *, size_t); |
|
static void index_prune(const struct of *, DB *, |
|
const char *, DB *, const char *, |
|
int, recno_t *, recno_t **, size_t *); |
|
static void ofile_argbuild(char *[], int, int, struct of **); |
|
static int ofile_dirbuild(const char *, int, struct of **); |
|
static void ofile_free(struct of *); |
|
static int pman_node(MAN_ARGS); |
|
static void pmdoc_node(MDOC_ARGS); |
|
static void pmdoc_An(MDOC_ARGS); |
|
static void pmdoc_Cd(MDOC_ARGS); |
|
static void pmdoc_Er(MDOC_ARGS); |
|
static void pmdoc_Ev(MDOC_ARGS); |
|
static void pmdoc_Fd(MDOC_ARGS); |
|
static void pmdoc_In(MDOC_ARGS); |
|
static void pmdoc_Fn(MDOC_ARGS); |
|
static void pmdoc_Fo(MDOC_ARGS); |
|
static void pmdoc_Nd(MDOC_ARGS); |
|
static void pmdoc_Nm(MDOC_ARGS); |
|
static void pmdoc_Pa(MDOC_ARGS); |
|
static void pmdoc_St(MDOC_ARGS); |
|
static void pmdoc_Vt(MDOC_ARGS); |
|
static void pmdoc_Xr(MDOC_ARGS); |
|
static void usage(void); |
|
|
|
typedef void (*pmdoc_nf)(MDOC_ARGS); |
typedef int (*mdoc_fp)(struct mpage *, const struct mdoc_node *); |
|
|
static const pmdoc_nf mdocs[MDOC_MAX] = { |
struct mdoc_handler { |
NULL, /* Ap */ |
mdoc_fp fp; /* optional handler */ |
NULL, /* Dd */ |
uint64_t mask; /* set unless handler returns 0 */ |
NULL, /* Dt */ |
|
NULL, /* Os */ |
|
NULL, /* Sh */ |
|
NULL, /* Ss */ |
|
NULL, /* Pp */ |
|
NULL, /* D1 */ |
|
NULL, /* Dl */ |
|
NULL, /* Bd */ |
|
NULL, /* Ed */ |
|
NULL, /* Bl */ |
|
NULL, /* El */ |
|
NULL, /* It */ |
|
NULL, /* Ad */ |
|
pmdoc_An, /* An */ |
|
NULL, /* Ar */ |
|
pmdoc_Cd, /* Cd */ |
|
NULL, /* Cm */ |
|
NULL, /* Dv */ |
|
pmdoc_Er, /* Er */ |
|
pmdoc_Ev, /* Ev */ |
|
NULL, /* Ex */ |
|
NULL, /* Fa */ |
|
pmdoc_Fd, /* Fd */ |
|
NULL, /* Fl */ |
|
pmdoc_Fn, /* Fn */ |
|
NULL, /* Ft */ |
|
NULL, /* Ic */ |
|
pmdoc_In, /* In */ |
|
NULL, /* Li */ |
|
pmdoc_Nd, /* Nd */ |
|
pmdoc_Nm, /* Nm */ |
|
NULL, /* Op */ |
|
NULL, /* Ot */ |
|
pmdoc_Pa, /* Pa */ |
|
NULL, /* Rv */ |
|
pmdoc_St, /* St */ |
|
pmdoc_Vt, /* Va */ |
|
pmdoc_Vt, /* Vt */ |
|
pmdoc_Xr, /* Xr */ |
|
NULL, /* %A */ |
|
NULL, /* %B */ |
|
NULL, /* %D */ |
|
NULL, /* %I */ |
|
NULL, /* %J */ |
|
NULL, /* %N */ |
|
NULL, /* %O */ |
|
NULL, /* %P */ |
|
NULL, /* %R */ |
|
NULL, /* %T */ |
|
NULL, /* %V */ |
|
NULL, /* Ac */ |
|
NULL, /* Ao */ |
|
NULL, /* Aq */ |
|
NULL, /* At */ |
|
NULL, /* Bc */ |
|
NULL, /* Bf */ |
|
NULL, /* Bo */ |
|
NULL, /* Bq */ |
|
NULL, /* Bsx */ |
|
NULL, /* Bx */ |
|
NULL, /* Db */ |
|
NULL, /* Dc */ |
|
NULL, /* Do */ |
|
NULL, /* Dq */ |
|
NULL, /* Ec */ |
|
NULL, /* Ef */ |
|
NULL, /* Em */ |
|
NULL, /* Eo */ |
|
NULL, /* Fx */ |
|
NULL, /* Ms */ |
|
NULL, /* No */ |
|
NULL, /* Ns */ |
|
NULL, /* Nx */ |
|
NULL, /* Ox */ |
|
NULL, /* Pc */ |
|
NULL, /* Pf */ |
|
NULL, /* Po */ |
|
NULL, /* Pq */ |
|
NULL, /* Qc */ |
|
NULL, /* Ql */ |
|
NULL, /* Qo */ |
|
NULL, /* Qq */ |
|
NULL, /* Re */ |
|
NULL, /* Rs */ |
|
NULL, /* Sc */ |
|
NULL, /* So */ |
|
NULL, /* Sq */ |
|
NULL, /* Sm */ |
|
NULL, /* Sx */ |
|
NULL, /* Sy */ |
|
NULL, /* Tn */ |
|
NULL, /* Ux */ |
|
NULL, /* Xc */ |
|
NULL, /* Xo */ |
|
pmdoc_Fo, /* Fo */ |
|
NULL, /* Fc */ |
|
NULL, /* Oo */ |
|
NULL, /* Oc */ |
|
NULL, /* Bk */ |
|
NULL, /* Ek */ |
|
NULL, /* Bt */ |
|
NULL, /* Hf */ |
|
NULL, /* Fr */ |
|
NULL, /* Ud */ |
|
NULL, /* Lb */ |
|
NULL, /* Lp */ |
|
NULL, /* Lk */ |
|
NULL, /* Mt */ |
|
NULL, /* Brq */ |
|
NULL, /* Bro */ |
|
NULL, /* Brc */ |
|
NULL, /* %C */ |
|
NULL, /* Es */ |
|
NULL, /* En */ |
|
NULL, /* Dx */ |
|
NULL, /* %Q */ |
|
NULL, /* br */ |
|
NULL, /* sp */ |
|
NULL, /* %U */ |
|
NULL, /* Ta */ |
|
}; |
}; |
|
|
static const char *progname; |
static void dbclose(int); |
|
static void dbadd(struct mpage *, struct mchars *); |
|
static void dbadd_mlink(const struct mlink *mlink); |
|
static int dbopen(int); |
|
static void dbprune(void); |
|
static void filescan(const char *); |
|
static void *hash_alloc(size_t, void *); |
|
static void hash_free(void *, size_t, void *); |
|
static void *hash_halloc(size_t, void *); |
|
static void mlink_add(struct mlink *, const struct stat *); |
|
static void mlink_check(struct mpage *, struct mlink *); |
|
static void mlink_free(struct mlink *); |
|
static void mlinks_undupe(struct mpage *); |
|
static void mpages_free(void); |
|
static void mpages_merge(struct mchars *, struct mparse *); |
|
static void names_check(void); |
|
static void parse_cat(struct mpage *, int); |
|
static void parse_man(struct mpage *, const struct man_node *); |
|
static void parse_mdoc(struct mpage *, const struct mdoc_node *); |
|
static int parse_mdoc_body(struct mpage *, const struct mdoc_node *); |
|
static int parse_mdoc_head(struct mpage *, const struct mdoc_node *); |
|
static int parse_mdoc_Fd(struct mpage *, const struct mdoc_node *); |
|
static int parse_mdoc_Fn(struct mpage *, const struct mdoc_node *); |
|
static int parse_mdoc_Nd(struct mpage *, const struct mdoc_node *); |
|
static int parse_mdoc_Nm(struct mpage *, const struct mdoc_node *); |
|
static int parse_mdoc_Sh(struct mpage *, const struct mdoc_node *); |
|
static int parse_mdoc_Xr(struct mpage *, const struct mdoc_node *); |
|
static void putkey(const struct mpage *, char *, uint64_t); |
|
static void putkeys(const struct mpage *, |
|
const char *, size_t, uint64_t); |
|
static void putmdockey(const struct mpage *, |
|
const struct mdoc_node *, uint64_t); |
|
static void render_key(struct mchars *, struct str *); |
|
static void say(const char *, const char *, ...); |
|
static int set_basedir(const char *); |
|
static int treescan(void); |
|
static size_t utf8(unsigned int, char [7]); |
|
|
|
static char tempfilename[32]; |
|
static char *progname; |
|
static int nodb; /* no database changes */ |
|
static int mparse_options; /* abort the parse early */ |
|
static int use_all; /* use all found files */ |
|
static int debug; /* print what we're doing */ |
|
static int warnings; /* warn about crap */ |
|
static int write_utf8; /* write UTF-8 output; else ASCII */ |
|
static int exitcode; /* to be returned by main */ |
|
static enum op op; /* operational mode */ |
|
static char basedir[PATH_MAX]; /* current base directory */ |
|
static struct ohash mpages; /* table of distinct manual pages */ |
|
static struct ohash mlinks; /* table of directory entries */ |
|
static struct ohash names; /* table of all names */ |
|
static struct ohash strings; /* table of all strings */ |
|
static sqlite3 *db = NULL; /* current database */ |
|
static sqlite3_stmt *stmts[STMT__MAX]; /* current statements */ |
|
static uint64_t name_mask; |
|
|
|
static const struct mdoc_handler mdocs[MDOC_MAX] = { |
|
{ NULL, 0 }, /* Ap */ |
|
{ NULL, 0 }, /* Dd */ |
|
{ NULL, 0 }, /* Dt */ |
|
{ NULL, 0 }, /* Os */ |
|
{ parse_mdoc_Sh, TYPE_Sh }, /* Sh */ |
|
{ parse_mdoc_head, TYPE_Ss }, /* Ss */ |
|
{ NULL, 0 }, /* Pp */ |
|
{ NULL, 0 }, /* D1 */ |
|
{ NULL, 0 }, /* Dl */ |
|
{ NULL, 0 }, /* Bd */ |
|
{ NULL, 0 }, /* Ed */ |
|
{ NULL, 0 }, /* Bl */ |
|
{ NULL, 0 }, /* El */ |
|
{ NULL, 0 }, /* It */ |
|
{ NULL, 0 }, /* Ad */ |
|
{ NULL, TYPE_An }, /* An */ |
|
{ NULL, TYPE_Ar }, /* Ar */ |
|
{ NULL, TYPE_Cd }, /* Cd */ |
|
{ NULL, TYPE_Cm }, /* Cm */ |
|
{ NULL, TYPE_Dv }, /* Dv */ |
|
{ NULL, TYPE_Er }, /* Er */ |
|
{ NULL, TYPE_Ev }, /* Ev */ |
|
{ NULL, 0 }, /* Ex */ |
|
{ NULL, TYPE_Fa }, /* Fa */ |
|
{ parse_mdoc_Fd, 0 }, /* Fd */ |
|
{ NULL, TYPE_Fl }, /* Fl */ |
|
{ parse_mdoc_Fn, 0 }, /* Fn */ |
|
{ NULL, TYPE_Ft }, /* Ft */ |
|
{ NULL, TYPE_Ic }, /* Ic */ |
|
{ NULL, TYPE_In }, /* In */ |
|
{ NULL, TYPE_Li }, /* Li */ |
|
{ parse_mdoc_Nd, 0 }, /* Nd */ |
|
{ parse_mdoc_Nm, 0 }, /* Nm */ |
|
{ NULL, 0 }, /* Op */ |
|
{ NULL, 0 }, /* Ot */ |
|
{ NULL, TYPE_Pa }, /* Pa */ |
|
{ NULL, 0 }, /* Rv */ |
|
{ NULL, TYPE_St }, /* St */ |
|
{ NULL, TYPE_Va }, /* Va */ |
|
{ parse_mdoc_body, TYPE_Va }, /* Vt */ |
|
{ parse_mdoc_Xr, 0 }, /* Xr */ |
|
{ NULL, 0 }, /* %A */ |
|
{ NULL, 0 }, /* %B */ |
|
{ NULL, 0 }, /* %D */ |
|
{ NULL, 0 }, /* %I */ |
|
{ NULL, 0 }, /* %J */ |
|
{ NULL, 0 }, /* %N */ |
|
{ NULL, 0 }, /* %O */ |
|
{ NULL, 0 }, /* %P */ |
|
{ NULL, 0 }, /* %R */ |
|
{ NULL, 0 }, /* %T */ |
|
{ NULL, 0 }, /* %V */ |
|
{ NULL, 0 }, /* Ac */ |
|
{ NULL, 0 }, /* Ao */ |
|
{ NULL, 0 }, /* Aq */ |
|
{ NULL, TYPE_At }, /* At */ |
|
{ NULL, 0 }, /* Bc */ |
|
{ NULL, 0 }, /* Bf */ |
|
{ NULL, 0 }, /* Bo */ |
|
{ NULL, 0 }, /* Bq */ |
|
{ NULL, TYPE_Bsx }, /* Bsx */ |
|
{ NULL, TYPE_Bx }, /* Bx */ |
|
{ NULL, 0 }, /* Db */ |
|
{ NULL, 0 }, /* Dc */ |
|
{ NULL, 0 }, /* Do */ |
|
{ NULL, 0 }, /* Dq */ |
|
{ NULL, 0 }, /* Ec */ |
|
{ NULL, 0 }, /* Ef */ |
|
{ NULL, TYPE_Em }, /* Em */ |
|
{ NULL, 0 }, /* Eo */ |
|
{ NULL, TYPE_Fx }, /* Fx */ |
|
{ NULL, TYPE_Ms }, /* Ms */ |
|
{ NULL, 0 }, /* No */ |
|
{ NULL, 0 }, /* Ns */ |
|
{ NULL, TYPE_Nx }, /* Nx */ |
|
{ NULL, TYPE_Ox }, /* Ox */ |
|
{ NULL, 0 }, /* Pc */ |
|
{ NULL, 0 }, /* Pf */ |
|
{ NULL, 0 }, /* Po */ |
|
{ NULL, 0 }, /* Pq */ |
|
{ NULL, 0 }, /* Qc */ |
|
{ NULL, 0 }, /* Ql */ |
|
{ NULL, 0 }, /* Qo */ |
|
{ NULL, 0 }, /* Qq */ |
|
{ NULL, 0 }, /* Re */ |
|
{ NULL, 0 }, /* Rs */ |
|
{ NULL, 0 }, /* Sc */ |
|
{ NULL, 0 }, /* So */ |
|
{ NULL, 0 }, /* Sq */ |
|
{ NULL, 0 }, /* Sm */ |
|
{ NULL, 0 }, /* Sx */ |
|
{ NULL, TYPE_Sy }, /* Sy */ |
|
{ NULL, TYPE_Tn }, /* Tn */ |
|
{ NULL, 0 }, /* Ux */ |
|
{ NULL, 0 }, /* Xc */ |
|
{ NULL, 0 }, /* Xo */ |
|
{ parse_mdoc_head, 0 }, /* Fo */ |
|
{ NULL, 0 }, /* Fc */ |
|
{ NULL, 0 }, /* Oo */ |
|
{ NULL, 0 }, /* Oc */ |
|
{ NULL, 0 }, /* Bk */ |
|
{ NULL, 0 }, /* Ek */ |
|
{ NULL, 0 }, /* Bt */ |
|
{ NULL, 0 }, /* Hf */ |
|
{ NULL, 0 }, /* Fr */ |
|
{ NULL, 0 }, /* Ud */ |
|
{ NULL, TYPE_Lb }, /* Lb */ |
|
{ NULL, 0 }, /* Lp */ |
|
{ NULL, TYPE_Lk }, /* Lk */ |
|
{ NULL, TYPE_Mt }, /* Mt */ |
|
{ NULL, 0 }, /* Brq */ |
|
{ NULL, 0 }, /* Bro */ |
|
{ NULL, 0 }, /* Brc */ |
|
{ NULL, 0 }, /* %C */ |
|
{ NULL, 0 }, /* Es */ |
|
{ NULL, 0 }, /* En */ |
|
{ NULL, TYPE_Dx }, /* Dx */ |
|
{ NULL, 0 }, /* %Q */ |
|
{ NULL, 0 }, /* br */ |
|
{ NULL, 0 }, /* sp */ |
|
{ NULL, 0 }, /* %U */ |
|
{ NULL, 0 }, /* Ta */ |
|
}; |
|
|
int |
int |
main(int argc, char *argv[]) |
main(int argc, char *argv[]) |
{ |
{ |
struct mparse *mp; /* parse sequence */ |
int ch, i; |
struct manpaths dirs; |
size_t j, sz; |
enum op op; /* current operation */ |
const char *path_arg; |
const char *dir; |
struct mchars *mc; |
char ibuf[MAXPATHLEN], /* index fname */ |
struct manpaths dirs; |
fbuf[MAXPATHLEN]; /* btree fname */ |
struct mparse *mp; |
int verb, /* output verbosity */ |
struct ohash_info mpages_info, mlinks_info; |
ch, i, flags; |
|
DB *idx, /* index database */ |
|
*db, /* keyword database */ |
|
*hash; /* temporary keyword hashtable */ |
|
BTREEINFO info; /* btree configuration */ |
|
recno_t maxrec; /* supremum of all records */ |
|
recno_t *recs; /* buffer of empty records */ |
|
size_t sz1, sz2, |
|
recsz, /* buffer size of recs */ |
|
reccur; /* valid number of recs */ |
|
struct buf buf, /* keyword buffer */ |
|
dbuf; /* description buffer */ |
|
struct of *of; /* list of files for processing */ |
|
extern int optind; |
|
extern char *optarg; |
|
|
|
|
memset(stmts, 0, STMT__MAX * sizeof(sqlite3_stmt *)); |
|
memset(&dirs, 0, sizeof(struct manpaths)); |
|
|
|
mpages_info.alloc = mlinks_info.alloc = hash_alloc; |
|
mpages_info.halloc = mlinks_info.halloc = hash_halloc; |
|
mpages_info.hfree = mlinks_info.hfree = hash_free; |
|
|
|
mpages_info.key_offset = offsetof(struct mpage, inodev); |
|
mlinks_info.key_offset = offsetof(struct mlink, file); |
|
|
progname = strrchr(argv[0], '/'); |
progname = strrchr(argv[0], '/'); |
if (progname == NULL) |
if (progname == NULL) |
progname = argv[0]; |
progname = argv[0]; |
else |
else |
++progname; |
++progname; |
|
|
memset(&dirs, 0, sizeof(struct manpaths)); |
/* |
|
* We accept a few different invocations. |
|
* The CHECKOP macro makes sure that invocation styles don't |
|
* clobber each other. |
|
*/ |
|
#define CHECKOP(_op, _ch) do \ |
|
if (OP_DEFAULT != (_op)) { \ |
|
fprintf(stderr, "-%c: Conflicting option\n", (_ch)); \ |
|
goto usage; \ |
|
} while (/*CONSTCOND*/0) |
|
|
verb = 0; |
path_arg = NULL; |
of = NULL; |
op = OP_DEFAULT; |
db = idx = NULL; |
|
mp = NULL; |
|
hash = NULL; |
|
recs = NULL; |
|
recsz = reccur = 0; |
|
maxrec = 0; |
|
op = OP_NEW; |
|
dir = NULL; |
|
|
|
while (-1 != (ch = getopt(argc, argv, "d:u:v"))) |
while (-1 != (ch = getopt(argc, argv, "aC:Dd:npQT:tu:v"))) |
switch (ch) { |
switch (ch) { |
|
case ('a'): |
|
use_all = 1; |
|
break; |
|
case ('C'): |
|
CHECKOP(op, ch); |
|
path_arg = optarg; |
|
op = OP_CONFFILE; |
|
break; |
|
case ('D'): |
|
debug++; |
|
break; |
case ('d'): |
case ('d'): |
dir = optarg; |
CHECKOP(op, ch); |
|
path_arg = optarg; |
op = OP_UPDATE; |
op = OP_UPDATE; |
break; |
break; |
|
case ('n'): |
|
nodb = 1; |
|
break; |
|
case ('p'): |
|
warnings = 1; |
|
break; |
|
case ('Q'): |
|
mparse_options |= MPARSE_QUICK; |
|
break; |
|
case ('T'): |
|
if (strcmp(optarg, "utf8")) { |
|
fprintf(stderr, "-T%s: Unsupported " |
|
"output format\n", optarg); |
|
goto usage; |
|
} |
|
write_utf8 = 1; |
|
break; |
|
case ('t'): |
|
CHECKOP(op, ch); |
|
dup2(STDOUT_FILENO, STDERR_FILENO); |
|
op = OP_TEST; |
|
nodb = warnings = 1; |
|
break; |
case ('u'): |
case ('u'): |
dir = optarg; |
CHECKOP(op, ch); |
|
path_arg = optarg; |
op = OP_DELETE; |
op = OP_DELETE; |
break; |
break; |
case ('v'): |
case ('v'): |
verb++; |
/* Compatibility with espie@'s makewhatis. */ |
break; |
break; |
default: |
default: |
usage(); |
goto usage; |
return((int)MANDOCLEVEL_BADARG); |
|
} |
} |
|
|
argc -= optind; |
argc -= optind; |
argv += optind; |
argv += optind; |
|
|
memset(&info, 0, sizeof(BTREEINFO)); |
if (OP_CONFFILE == op && argc > 0) { |
info.flags = R_DUP; |
fprintf(stderr, "-C: Too many arguments\n"); |
|
goto usage; |
|
} |
|
|
mp = mparse_alloc(MPARSE_AUTO, MANDOCLEVEL_FATAL, NULL, NULL); |
exitcode = (int)MANDOCLEVEL_OK; |
|
mp = mparse_alloc(mparse_options, MANDOCLEVEL_FATAL, NULL, NULL); |
|
mc = mchars_alloc(); |
|
|
memset(&buf, 0, sizeof(struct buf)); |
ohash_init(&mpages, 6, &mpages_info); |
memset(&dbuf, 0, sizeof(struct buf)); |
ohash_init(&mlinks, 6, &mlinks_info); |
|
|
buf.size = dbuf.size = MANDOC_BUFSZ; |
if (OP_UPDATE == op || OP_DELETE == op || OP_TEST == op) { |
|
/* |
|
* Force processing all files. |
|
*/ |
|
use_all = 1; |
|
|
buf.cp = mandoc_malloc(buf.size); |
/* |
dbuf.cp = mandoc_malloc(dbuf.size); |
* All of these deal with a specific directory. |
|
* Jump into that directory then collect files specified |
|
* on the command-line. |
|
*/ |
|
if (0 == set_basedir(path_arg)) |
|
goto out; |
|
for (i = 0; i < argc; i++) |
|
filescan(argv[i]); |
|
if (0 == dbopen(1)) |
|
goto out; |
|
if (OP_TEST != op) |
|
dbprune(); |
|
if (OP_DELETE != op) |
|
mpages_merge(mc, mp); |
|
dbclose(1); |
|
} else { |
|
/* |
|
* If we have arguments, use them as our manpaths. |
|
* If we don't, grok from manpath(1) or however else |
|
* manpath_parse() wants to do it. |
|
*/ |
|
if (argc > 0) { |
|
dirs.paths = mandoc_calloc |
|
(argc, sizeof(char *)); |
|
dirs.sz = (size_t)argc; |
|
for (i = 0; i < argc; i++) |
|
dirs.paths[i] = mandoc_strdup(argv[i]); |
|
} else |
|
manpath_parse(&dirs, path_arg, NULL, NULL); |
|
|
flags = OP_NEW == op ? O_CREAT|O_TRUNC|O_RDWR : O_CREAT|O_RDWR; |
if (0 == dirs.sz) { |
|
exitcode = (int)MANDOCLEVEL_BADARG; |
|
say("", "Empty manpath"); |
|
} |
|
|
if (OP_UPDATE == op || OP_DELETE == op) { |
/* |
ibuf[0] = fbuf[0] = '\0'; |
* First scan the tree rooted at a base directory, then |
|
* build a new database and finally move it into place. |
|
* Ignore zero-length directories and strip trailing |
|
* slashes. |
|
*/ |
|
for (j = 0; j < dirs.sz; j++) { |
|
sz = strlen(dirs.paths[j]); |
|
if (sz && '/' == dirs.paths[j][sz - 1]) |
|
dirs.paths[j][--sz] = '\0'; |
|
if (0 == sz) |
|
continue; |
|
|
strlcat(fbuf, dir, MAXPATHLEN); |
if (j) { |
strlcat(fbuf, "/", MAXPATHLEN); |
ohash_init(&mpages, 6, &mpages_info); |
sz1 = strlcat(fbuf, MANDOC_DB, MAXPATHLEN); |
ohash_init(&mlinks, 6, &mlinks_info); |
|
} |
|
|
strlcat(ibuf, dir, MAXPATHLEN); |
if (0 == set_basedir(dirs.paths[j])) |
strlcat(ibuf, "/", MAXPATHLEN); |
goto out; |
sz2 = strlcat(ibuf, MANDOC_IDX, MAXPATHLEN); |
if (0 == treescan()) |
|
goto out; |
|
if (0 == set_basedir(dirs.paths[j])) |
|
goto out; |
|
if (0 == dbopen(0)) |
|
goto out; |
|
|
if (sz1 >= MAXPATHLEN || sz2 >= MAXPATHLEN) { |
mpages_merge(mc, mp); |
fprintf(stderr, "%s: Path too long\n", dir); |
if (warnings && |
exit((int)MANDOCLEVEL_BADARG); |
! (MPARSE_QUICK & mparse_options)) |
|
names_check(); |
|
dbclose(0); |
|
|
|
if (j + 1 < dirs.sz) { |
|
mpages_free(); |
|
ohash_delete(&mpages); |
|
ohash_delete(&mlinks); |
|
} |
} |
} |
|
} |
|
out: |
|
set_basedir(NULL); |
|
manpath_free(&dirs); |
|
mchars_free(mc); |
|
mparse_free(mp); |
|
mpages_free(); |
|
ohash_delete(&mpages); |
|
ohash_delete(&mlinks); |
|
return(exitcode); |
|
usage: |
|
fprintf(stderr, "usage: %s [-aDnpQ] [-C file] [-Tutf8]\n" |
|
" %s [-aDnpQ] [-Tutf8] dir ...\n" |
|
" %s [-DnpQ] [-Tutf8] -d dir [file ...]\n" |
|
" %s [-Dnp] -u dir [file ...]\n" |
|
" %s [-Q] -t file ...\n", |
|
progname, progname, progname, |
|
progname, progname); |
|
|
db = dbopen(fbuf, flags, 0644, DB_BTREE, &info); |
return((int)MANDOCLEVEL_BADARG); |
idx = dbopen(ibuf, flags, 0644, DB_RECNO, NULL); |
} |
|
|
if (NULL == db) { |
/* |
perror(fbuf); |
* Scan a directory tree rooted at "basedir" for manpages. |
exit((int)MANDOCLEVEL_SYSERR); |
* We use fts(), scanning directory parts along the way for clues to our |
} else if (NULL == db) { |
* section and architecture. |
perror(ibuf); |
* |
exit((int)MANDOCLEVEL_SYSERR); |
* If use_all has been specified, grok all files. |
|
* If not, sanitise paths to the following: |
|
* |
|
* [./]man*[/<arch>]/<name>.<section> |
|
* or |
|
* [./]cat<section>[/<arch>]/<name>.0 |
|
* |
|
* TODO: accomodate for multi-language directories. |
|
*/ |
|
static int |
|
treescan(void) |
|
{ |
|
FTS *f; |
|
FTSENT *ff; |
|
struct mlink *mlink; |
|
int dform, gzip; |
|
char *dsec, *arch, *fsec, *cp; |
|
const char *path; |
|
const char *argv[2]; |
|
|
|
argv[0] = "."; |
|
argv[1] = (char *)NULL; |
|
|
|
/* |
|
* Walk through all components under the directory, using the |
|
* logical descent of files. |
|
*/ |
|
f = fts_open((char * const *)argv, FTS_LOGICAL, NULL); |
|
if (NULL == f) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say("", "&fts_open"); |
|
return(0); |
|
} |
|
|
|
dsec = arch = NULL; |
|
dform = FORM_NONE; |
|
|
|
while (NULL != (ff = fts_read(f))) { |
|
path = ff->fts_path + 2; |
|
/* |
|
* If we're a regular file, add an mlink by using the |
|
* stored directory data and handling the filename. |
|
*/ |
|
if (FTS_F == ff->fts_info) { |
|
if (0 == strcmp(path, MANDOC_DB)) |
|
continue; |
|
if ( ! use_all && ff->fts_level < 2) { |
|
if (warnings) |
|
say(path, "Extraneous file"); |
|
continue; |
|
} |
|
gzip = 0; |
|
fsec = NULL; |
|
while (NULL == fsec) { |
|
fsec = strrchr(ff->fts_name, '.'); |
|
if (NULL == fsec || strcmp(fsec+1, "gz")) |
|
break; |
|
gzip = 1; |
|
*fsec = '\0'; |
|
fsec = NULL; |
|
} |
|
if (NULL == fsec) { |
|
if ( ! use_all) { |
|
if (warnings) |
|
say(path, |
|
"No filename suffix"); |
|
continue; |
|
} |
|
} else if (0 == strcmp(++fsec, "html")) { |
|
if (warnings) |
|
say(path, "Skip html"); |
|
continue; |
|
} else if (0 == strcmp(fsec, "ps")) { |
|
if (warnings) |
|
say(path, "Skip ps"); |
|
continue; |
|
} else if (0 == strcmp(fsec, "pdf")) { |
|
if (warnings) |
|
say(path, "Skip pdf"); |
|
continue; |
|
} else if ( ! use_all && |
|
((FORM_SRC == dform && strcmp(fsec, dsec)) || |
|
(FORM_CAT == dform && strcmp(fsec, "0")))) { |
|
if (warnings) |
|
say(path, "Wrong filename suffix"); |
|
continue; |
|
} else |
|
fsec[-1] = '\0'; |
|
|
|
mlink = mandoc_calloc(1, sizeof(struct mlink)); |
|
strlcpy(mlink->file, path, sizeof(mlink->file)); |
|
mlink->dform = dform; |
|
mlink->dsec = dsec; |
|
mlink->arch = arch; |
|
mlink->name = ff->fts_name; |
|
mlink->fsec = fsec; |
|
mlink->gzip = gzip; |
|
mlink_add(mlink, ff->fts_statp); |
|
continue; |
|
} else if (FTS_D != ff->fts_info && |
|
FTS_DP != ff->fts_info) { |
|
if (warnings) |
|
say(path, "Not a regular file"); |
|
continue; |
} |
} |
|
|
if (verb > 2) { |
switch (ff->fts_level) { |
printf("%s: Opened\n", fbuf); |
case (0): |
printf("%s: Opened\n", ibuf); |
/* Ignore the root directory. */ |
|
break; |
|
case (1): |
|
/* |
|
* This might contain manX/ or catX/. |
|
* Try to infer this from the name. |
|
* If we're not in use_all, enforce it. |
|
*/ |
|
cp = ff->fts_name; |
|
if (FTS_DP == ff->fts_info) |
|
break; |
|
|
|
if (0 == strncmp(cp, "man", 3)) { |
|
dform = FORM_SRC; |
|
dsec = cp + 3; |
|
} else if (0 == strncmp(cp, "cat", 3)) { |
|
dform = FORM_CAT; |
|
dsec = cp + 3; |
|
} else { |
|
dform = FORM_NONE; |
|
dsec = NULL; |
|
} |
|
|
|
if (NULL != dsec || use_all) |
|
break; |
|
|
|
if (warnings) |
|
say(path, "Unknown directory part"); |
|
fts_set(f, ff, FTS_SKIP); |
|
break; |
|
case (2): |
|
/* |
|
* Possibly our architecture. |
|
* If we're descending, keep tabs on it. |
|
*/ |
|
if (FTS_DP != ff->fts_info && NULL != dsec) |
|
arch = ff->fts_name; |
|
else |
|
arch = NULL; |
|
break; |
|
default: |
|
if (FTS_DP == ff->fts_info || use_all) |
|
break; |
|
if (warnings) |
|
say(path, "Extraneous directory part"); |
|
fts_set(f, ff, FTS_SKIP); |
|
break; |
} |
} |
|
} |
|
|
ofile_argbuild(argv, argc, verb, &of); |
fts_close(f); |
if (NULL == of) |
return(1); |
goto out; |
} |
|
|
of = of->first; |
/* |
|
* Add a file to the mlinks table. |
|
* Do not verify that it's a "valid" looking manpage (we'll do that |
|
* later). |
|
* |
|
* Try to infer the manual section, architecture, and page name from the |
|
* path, assuming it looks like |
|
* |
|
* [./]man*[/<arch>]/<name>.<section> |
|
* or |
|
* [./]cat<section>[/<arch>]/<name>.0 |
|
* |
|
* See treescan() for the fts(3) version of this. |
|
*/ |
|
static void |
|
filescan(const char *file) |
|
{ |
|
char buf[PATH_MAX]; |
|
struct stat st; |
|
struct mlink *mlink; |
|
char *p, *start; |
|
|
index_prune(of, db, fbuf, idx, ibuf, verb, |
assert(use_all); |
&maxrec, &recs, &recsz); |
|
|
|
if (OP_UPDATE == op) |
if (0 == strncmp(file, "./", 2)) |
index_merge(of, mp, &dbuf, &buf, hash, |
file += 2; |
db, fbuf, idx, ibuf, verb, |
|
maxrec, recs, reccur); |
|
|
|
goto out; |
if (NULL == realpath(file, buf)) { |
|
exitcode = (int)MANDOCLEVEL_BADARG; |
|
say(file, "&realpath"); |
|
return; |
} |
} |
|
|
|
if (strstr(buf, basedir) == buf) |
|
start = buf + strlen(basedir) + 1; |
|
else if (OP_TEST == op) |
|
start = buf; |
|
else { |
|
exitcode = (int)MANDOCLEVEL_BADARG; |
|
say("", "%s: outside base directory", buf); |
|
return; |
|
} |
|
|
|
if (-1 == stat(buf, &st)) { |
|
exitcode = (int)MANDOCLEVEL_BADARG; |
|
say(file, "&stat"); |
|
return; |
|
} else if ( ! (S_IFREG & st.st_mode)) { |
|
exitcode = (int)MANDOCLEVEL_BADARG; |
|
say(file, "Not a regular file"); |
|
return; |
|
} |
|
|
|
mlink = mandoc_calloc(1, sizeof(struct mlink)); |
|
strlcpy(mlink->file, start, sizeof(mlink->file)); |
|
|
/* |
/* |
* Configure the directories we're going to scan. |
* First try to guess our directory structure. |
* If we have command-line arguments, use them. |
* If we find a separator, try to look for man* or cat*. |
* If not, we use man(1)'s method (see mandocdb.8). |
* If we find one of these and what's underneath is a directory, |
|
* assume it's an architecture. |
*/ |
*/ |
|
if (NULL != (p = strchr(start, '/'))) { |
|
*p++ = '\0'; |
|
if (0 == strncmp(start, "man", 3)) { |
|
mlink->dform = FORM_SRC; |
|
mlink->dsec = start + 3; |
|
} else if (0 == strncmp(start, "cat", 3)) { |
|
mlink->dform = FORM_CAT; |
|
mlink->dsec = start + 3; |
|
} |
|
|
if (argc > 0) { |
start = p; |
dirs.paths = mandoc_malloc(argc * sizeof(char *)); |
if (NULL != mlink->dsec && NULL != (p = strchr(start, '/'))) { |
dirs.sz = argc; |
*p++ = '\0'; |
for (i = 0; i < argc; i++) |
mlink->arch = start; |
dirs.paths[i] = mandoc_strdup(argv[i]); |
start = p; |
|
} |
|
} |
|
|
|
/* |
|
* Now check the file suffix. |
|
* Suffix of `.0' indicates a catpage, `.1-9' is a manpage. |
|
*/ |
|
p = strrchr(start, '\0'); |
|
while (p-- > start && '/' != *p && '.' != *p) |
|
/* Loop. */ ; |
|
|
|
if ('.' == *p) { |
|
*p++ = '\0'; |
|
mlink->fsec = p; |
|
} |
|
|
|
/* |
|
* Now try to parse the name. |
|
* Use the filename portion of the path. |
|
*/ |
|
mlink->name = start; |
|
if (NULL != (p = strrchr(start, '/'))) { |
|
mlink->name = p + 1; |
|
*p = '\0'; |
|
} |
|
mlink_add(mlink, &st); |
|
} |
|
|
|
static void |
|
mlink_add(struct mlink *mlink, const struct stat *st) |
|
{ |
|
struct inodev inodev; |
|
struct mpage *mpage; |
|
unsigned int slot; |
|
|
|
assert(NULL != mlink->file); |
|
|
|
mlink->dsec = mandoc_strdup(mlink->dsec ? mlink->dsec : ""); |
|
mlink->arch = mandoc_strdup(mlink->arch ? mlink->arch : ""); |
|
mlink->name = mandoc_strdup(mlink->name ? mlink->name : ""); |
|
mlink->fsec = mandoc_strdup(mlink->fsec ? mlink->fsec : ""); |
|
|
|
if ('0' == *mlink->fsec) { |
|
free(mlink->fsec); |
|
mlink->fsec = mandoc_strdup(mlink->dsec); |
|
mlink->fform = FORM_CAT; |
|
} else if ('1' <= *mlink->fsec && '9' >= *mlink->fsec) |
|
mlink->fform = FORM_SRC; |
|
else |
|
mlink->fform = FORM_NONE; |
|
|
|
slot = ohash_qlookup(&mlinks, mlink->file); |
|
assert(NULL == ohash_find(&mlinks, slot)); |
|
ohash_insert(&mlinks, slot, mlink); |
|
|
|
inodev.st_ino = st->st_ino; |
|
inodev.st_dev = st->st_dev; |
|
slot = ohash_lookup_memory(&mpages, (char *)&inodev, |
|
sizeof(struct inodev), inodev.st_ino); |
|
mpage = ohash_find(&mpages, slot); |
|
if (NULL == mpage) { |
|
mpage = mandoc_calloc(1, sizeof(struct mpage)); |
|
mpage->inodev.st_ino = inodev.st_ino; |
|
mpage->inodev.st_dev = inodev.st_dev; |
|
ohash_insert(&mpages, slot, mpage); |
} else |
} else |
manpath_parse(&dirs, NULL, NULL); |
mlink->next = mpage->mlinks; |
|
mpage->mlinks = mlink; |
|
mlink->mpage = mpage; |
|
} |
|
|
for (i = 0; i < dirs.sz; i++) { |
static void |
ibuf[0] = fbuf[0] = '\0'; |
mlink_free(struct mlink *mlink) |
|
{ |
|
|
strlcat(fbuf, dirs.paths[i], MAXPATHLEN); |
free(mlink->dsec); |
strlcat(fbuf, "/", MAXPATHLEN); |
free(mlink->arch); |
sz1 = strlcat(fbuf, MANDOC_DB, MAXPATHLEN); |
free(mlink->name); |
|
free(mlink->fsec); |
|
free(mlink); |
|
} |
|
|
strlcat(ibuf, dirs.paths[i], MAXPATHLEN); |
static void |
strlcat(ibuf, "/", MAXPATHLEN); |
mpages_free(void) |
sz2 = strlcat(ibuf, MANDOC_IDX, MAXPATHLEN); |
{ |
|
struct mpage *mpage; |
|
struct mlink *mlink; |
|
unsigned int slot; |
|
|
if (sz1 >= MAXPATHLEN || sz2 >= MAXPATHLEN) { |
mpage = ohash_first(&mpages, &slot); |
fprintf(stderr, "%s: Path too long\n", |
while (NULL != mpage) { |
dirs.paths[i]); |
while (NULL != (mlink = mpage->mlinks)) { |
exit((int)MANDOCLEVEL_BADARG); |
mpage->mlinks = mlink->next; |
|
mlink_free(mlink); |
} |
} |
|
free(mpage->sec); |
|
free(mpage->arch); |
|
free(mpage->title); |
|
free(mpage->desc); |
|
free(mpage); |
|
mpage = ohash_next(&mpages, &slot); |
|
} |
|
} |
|
|
db = dbopen(fbuf, flags, 0644, DB_BTREE, &info); |
/* |
idx = dbopen(ibuf, flags, 0644, DB_RECNO, NULL); |
* For each mlink to the mpage, check whether the path looks like |
|
* it is formatted, and if it does, check whether a source manual |
|
* exists by the same name, ignoring the suffix. |
|
* If both conditions hold, drop the mlink. |
|
*/ |
|
static void |
|
mlinks_undupe(struct mpage *mpage) |
|
{ |
|
char buf[PATH_MAX]; |
|
struct mlink **prev; |
|
struct mlink *mlink; |
|
char *bufp; |
|
|
if (NULL == db) { |
mpage->form = FORM_CAT; |
perror(fbuf); |
prev = &mpage->mlinks; |
exit((int)MANDOCLEVEL_SYSERR); |
while (NULL != (mlink = *prev)) { |
} else if (NULL == db) { |
if (FORM_CAT != mlink->dform) { |
perror(ibuf); |
mpage->form = FORM_NONE; |
exit((int)MANDOCLEVEL_SYSERR); |
goto nextlink; |
} |
} |
|
if (strlcpy(buf, mlink->file, PATH_MAX) >= PATH_MAX) { |
if (verb > 2) { |
if (warnings) |
printf("%s: Truncated\n", fbuf); |
say(mlink->file, "Filename too long"); |
printf("%s: Truncated\n", ibuf); |
goto nextlink; |
} |
} |
|
bufp = strstr(buf, "cat"); |
|
assert(NULL != bufp); |
|
memcpy(bufp, "man", 3); |
|
if (NULL != (bufp = strrchr(buf, '.'))) |
|
*++bufp = '\0'; |
|
strlcat(buf, mlink->dsec, PATH_MAX); |
|
if (NULL == ohash_find(&mlinks, |
|
ohash_qlookup(&mlinks, buf))) |
|
goto nextlink; |
|
if (warnings) |
|
say(mlink->file, "Man source exists: %s", buf); |
|
if (use_all) |
|
goto nextlink; |
|
*prev = mlink->next; |
|
mlink_free(mlink); |
|
continue; |
|
nextlink: |
|
prev = &(*prev)->next; |
|
} |
|
} |
|
|
ofile_free(of); |
static void |
of = NULL; |
mlink_check(struct mpage *mpage, struct mlink *mlink) |
|
{ |
|
struct str *str; |
|
unsigned int slot; |
|
|
if ( ! ofile_dirbuild(dirs.paths[i], verb, &of)) |
/* |
exit((int)MANDOCLEVEL_SYSERR); |
* Check whether the manual section given in a file |
|
* agrees with the directory where the file is located. |
|
* Some manuals have suffixes like (3p) on their |
|
* section number either inside the file or in the |
|
* directory name, some are linked into more than one |
|
* section, like encrypt(1) = makekey(8). |
|
*/ |
|
|
if (NULL == of) |
if (FORM_SRC == mpage->form && |
continue; |
strcasecmp(mpage->sec, mlink->dsec)) |
|
say(mlink->file, "Section \"%s\" manual in %s directory", |
|
mpage->sec, mlink->dsec); |
|
|
of = of->first; |
/* |
|
* Manual page directories exist for each kernel |
|
* architecture as returned by machine(1). |
|
* However, many manuals only depend on the |
|
* application architecture as returned by arch(1). |
|
* For example, some (2/ARM) manuals are shared |
|
* across the "armish" and "zaurus" kernel |
|
* architectures. |
|
* A few manuals are even shared across completely |
|
* different architectures, for example fdformat(1) |
|
* on amd64, i386, sparc, and sparc64. |
|
*/ |
|
|
index_merge(of, mp, &dbuf, &buf, hash, db, fbuf, |
if (strcasecmp(mpage->arch, mlink->arch)) |
idx, ibuf, verb, maxrec, recs, reccur); |
say(mlink->file, "Architecture \"%s\" manual in " |
} |
"\"%s\" directory", mpage->arch, mlink->arch); |
|
|
out: |
/* |
if (db) |
* XXX |
(*db->close)(db); |
* parse_cat() doesn't set NAME_TITLE yet. |
if (idx) |
*/ |
(*idx->close)(idx); |
|
if (hash) |
|
(*hash->close)(hash); |
|
if (mp) |
|
mparse_free(mp); |
|
|
|
manpath_free(&dirs); |
if (FORM_CAT == mpage->form) |
ofile_free(of); |
return; |
free(buf.cp); |
|
free(dbuf.cp); |
|
free(recs); |
|
|
|
return(MANDOCLEVEL_OK); |
/* |
|
* Check whether this mlink |
|
* appears as a name in the NAME section. |
|
*/ |
|
|
|
slot = ohash_qlookup(&names, mlink->name); |
|
str = ohash_find(&names, slot); |
|
assert(NULL != str); |
|
if ( ! (NAME_TITLE & str->mask)) |
|
say(mlink->file, "Name missing in NAME section"); |
} |
} |
|
|
void |
/* |
index_merge(const struct of *of, struct mparse *mp, |
* Run through the files in the global vector "mpages" |
struct buf *dbuf, struct buf *buf, |
* and add them to the database specified in "basedir". |
DB *hash, DB *db, const char *dbf, |
* |
DB *idx, const char *idxf, int verb, |
* This handles the parsing scheme itself, using the cues of directory |
recno_t maxrec, const recno_t *recs, size_t reccur) |
* and filename to determine whether the file is parsable or not. |
|
*/ |
|
static void |
|
mpages_merge(struct mchars *mc, struct mparse *mp) |
{ |
{ |
recno_t rec; |
char any[] = "any"; |
int ch; |
struct ohash_info str_info; |
DBT key, val; |
int fd[2]; |
struct mdoc *mdoc; |
struct mpage *mpage, *mpage_dest; |
struct man *man; |
struct mlink *mlink, *mlink_dest; |
const char *fn, *msec, *mtitle, *arch; |
struct mdoc *mdoc; |
size_t sv; |
struct man *man; |
unsigned seq; |
char *sodest; |
struct db_val vbuf; |
char *cp; |
|
pid_t child_pid; |
|
int status; |
|
unsigned int pslot; |
|
enum mandoclevel lvl; |
|
|
for (rec = 0; of; of = of->next) { |
str_info.alloc = hash_alloc; |
fn = of->fname; |
str_info.halloc = hash_halloc; |
if (reccur > 0) { |
str_info.hfree = hash_free; |
--reccur; |
str_info.key_offset = offsetof(struct str, key); |
rec = recs[(int)reccur]; |
|
} else if (maxrec > 0) { |
|
rec = maxrec; |
|
maxrec = 0; |
|
} else |
|
rec++; |
|
|
|
mparse_reset(mp); |
if (0 == nodb) |
hash_reset(&hash); |
SQL_EXEC("BEGIN TRANSACTION"); |
|
|
if (mparse_readfd(mp, -1, fn) >= MANDOCLEVEL_FATAL) { |
mpage = ohash_first(&mpages, &pslot); |
fprintf(stderr, "%s: Parse failure\n", fn); |
while (NULL != mpage) { |
|
mlinks_undupe(mpage); |
|
if (NULL == mpage->mlinks) { |
|
mpage = ohash_next(&mpages, &pslot); |
continue; |
continue; |
} |
} |
|
|
mparse_result(mp, &mdoc, &man); |
name_mask = NAME_MASK; |
if (NULL == mdoc && NULL == man) |
ohash_init(&names, 4, &str_info); |
continue; |
ohash_init(&strings, 6, &str_info); |
|
mparse_reset(mp); |
|
mdoc = NULL; |
|
man = NULL; |
|
sodest = NULL; |
|
child_pid = 0; |
|
fd[0] = -1; |
|
fd[1] = -1; |
|
|
msec = NULL != mdoc ? |
if (mpage->mlinks->gzip) { |
mdoc_meta(mdoc)->msec : man_meta(man)->msec; |
if (-1 == pipe(fd)) { |
mtitle = NULL != mdoc ? |
exitcode = (int)MANDOCLEVEL_SYSERR; |
mdoc_meta(mdoc)->title : man_meta(man)->title; |
say(mpage->mlinks->file, "&pipe gunzip"); |
arch = NULL != mdoc ? |
goto nextpage; |
mdoc_meta(mdoc)->arch : NULL; |
} |
|
switch (child_pid = fork()) { |
|
case (-1): |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say(mpage->mlinks->file, "&fork gunzip"); |
|
child_pid = 0; |
|
close(fd[1]); |
|
close(fd[0]); |
|
goto nextpage; |
|
case (0): |
|
close(fd[0]); |
|
if (-1 == dup2(fd[1], STDOUT_FILENO)) { |
|
say(mpage->mlinks->file, |
|
"&dup gunzip"); |
|
exit(1); |
|
} |
|
execlp("gunzip", "gunzip", "-c", |
|
mpage->mlinks->file, NULL); |
|
say(mpage->mlinks->file, "&exec gunzip"); |
|
exit(1); |
|
default: |
|
close(fd[1]); |
|
break; |
|
} |
|
} |
|
|
if (NULL == arch) |
/* |
arch = ""; |
* Try interpreting the file as mdoc(7) or man(7) |
|
* source code, unless it is already known to be |
/* |
* formatted. Fall back to formatted mode. |
* The index record value consists of a nil-terminated |
|
* filename, a nil-terminated manual section, and a |
|
* nil-terminated description. Since the description |
|
* may not be set, we set a sentinel to see if we're |
|
* going to write a nil byte in its place. |
|
*/ |
*/ |
|
if (FORM_CAT != mpage->mlinks->dform || |
|
FORM_CAT != mpage->mlinks->fform) { |
|
lvl = mparse_readfd(mp, fd[0], mpage->mlinks->file); |
|
if (lvl < MANDOCLEVEL_FATAL) |
|
mparse_result(mp, &mdoc, &man, &sodest); |
|
} |
|
|
dbuf->len = 0; |
if (NULL != sodest) { |
buf_appendb(dbuf, fn, strlen(fn) + 1); |
mlink_dest = ohash_find(&mlinks, |
buf_appendb(dbuf, msec, strlen(msec) + 1); |
ohash_qlookup(&mlinks, sodest)); |
buf_appendb(dbuf, mtitle, strlen(mtitle) + 1); |
if (NULL != mlink_dest) { |
buf_appendb(dbuf, arch, strlen(arch) + 1); |
|
|
|
sv = dbuf->len; |
/* The .so target exists. */ |
|
|
/* Fix the record number in the btree value. */ |
mpage_dest = mlink_dest->mpage; |
|
mlink = mpage->mlinks; |
|
while (1) { |
|
mlink->mpage = mpage_dest; |
|
|
if (mdoc) |
/* |
pmdoc_node(hash, buf, dbuf, |
* If the target was already |
mdoc_node(mdoc), mdoc_meta(mdoc)); |
* processed, add the links |
else |
* to the database now. |
pman_node(hash, buf, dbuf, man_node(man)); |
* Otherwise, this will |
|
* happen when we come |
|
* to the target. |
|
*/ |
|
|
/* |
if (mpage_dest->recno) |
* Copy from the in-memory hashtable of pending keywords |
dbadd_mlink(mlink); |
* into the database. |
|
*/ |
|
|
|
vbuf.rec = rec; |
if (NULL == mlink->next) |
seq = R_FIRST; |
break; |
while (0 == (ch = (*hash->seq)(hash, &key, &val, seq))) { |
mlink = mlink->next; |
seq = R_NEXT; |
} |
|
|
vbuf.mask = *(uint64_t *)val.data; |
/* Move all links to the target. */ |
val.size = sizeof(struct db_val); |
|
val.data = &vbuf; |
|
|
|
if (verb > 1) |
mlink->next = mlink_dest->next; |
printf("%s: Added keyword: %s\n", |
mlink_dest->next = mpage->mlinks; |
fn, (char *)key.data); |
mpage->mlinks = NULL; |
dbt_put(db, dbf, &key, &val); |
} |
|
goto nextpage; |
|
} else if (NULL != mdoc) { |
|
mpage->form = FORM_SRC; |
|
mpage->sec = |
|
mandoc_strdup(mdoc_meta(mdoc)->msec); |
|
mpage->arch = mdoc_meta(mdoc)->arch; |
|
mpage->arch = mandoc_strdup( |
|
NULL == mpage->arch ? "" : mpage->arch); |
|
mpage->title = |
|
mandoc_strdup(mdoc_meta(mdoc)->title); |
|
} else if (NULL != man) { |
|
mpage->form = FORM_SRC; |
|
mpage->sec = |
|
mandoc_strdup(man_meta(man)->msec); |
|
mpage->arch = |
|
mandoc_strdup(mpage->mlinks->arch); |
|
mpage->title = |
|
mandoc_strdup(man_meta(man)->title); |
|
} else { |
|
mpage->form = FORM_CAT; |
|
mpage->sec = |
|
mandoc_strdup(mpage->mlinks->dsec); |
|
mpage->arch = |
|
mandoc_strdup(mpage->mlinks->arch); |
|
mpage->title = |
|
mandoc_strdup(mpage->mlinks->name); |
} |
} |
if (ch < 0) { |
putkey(mpage, mpage->sec, TYPE_sec); |
perror("hash"); |
putkey(mpage, '\0' == *mpage->arch ? |
exit((int)MANDOCLEVEL_SYSERR); |
any : mpage->arch, TYPE_arch); |
|
|
|
for (mlink = mpage->mlinks; mlink; mlink = mlink->next) { |
|
if ('\0' != *mlink->dsec) |
|
putkey(mpage, mlink->dsec, TYPE_sec); |
|
if ('\0' != *mlink->fsec) |
|
putkey(mpage, mlink->fsec, TYPE_sec); |
|
putkey(mpage, '\0' == *mlink->arch ? |
|
any : mlink->arch, TYPE_arch); |
|
putkey(mpage, mlink->name, NAME_FILE); |
} |
} |
|
|
/* |
|
* Apply to the index. If we haven't had a description |
|
* set, put an empty one in now. |
|
*/ |
|
|
|
if (dbuf->len == sv) |
assert(NULL == mpage->desc); |
buf_appendb(dbuf, "", 1); |
if (NULL != mdoc) { |
|
if (NULL != (cp = mdoc_meta(mdoc)->name)) |
|
putkey(mpage, cp, NAME_HEAD); |
|
parse_mdoc(mpage, mdoc_node(mdoc)); |
|
} else if (NULL != man) |
|
parse_man(mpage, man_node(man)); |
|
else |
|
parse_cat(mpage, fd[0]); |
|
if (NULL == mpage->desc) |
|
mpage->desc = mandoc_strdup(mpage->mlinks->name); |
|
|
key.data = &rec; |
if (warnings && !use_all) |
key.size = sizeof(recno_t); |
for (mlink = mpage->mlinks; mlink; |
|
mlink = mlink->next) |
|
mlink_check(mpage, mlink); |
|
|
val.data = dbuf->cp; |
dbadd(mpage, mc); |
val.size = dbuf->len; |
|
|
|
if (verb) |
nextpage: |
printf("%s: Added index\n", fn); |
if (child_pid) { |
dbt_put(idx, idxf, &key, &val); |
if (-1 == waitpid(child_pid, &status, 0)) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say(mpage->mlinks->file, "&wait gunzip"); |
|
} else if (WIFSIGNALED(status)) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say(mpage->mlinks->file, |
|
"gunzip died from signal %d", |
|
WTERMSIG(status)); |
|
} else if (WEXITSTATUS(status)) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say(mpage->mlinks->file, |
|
"gunzip failed with code %d", |
|
WEXITSTATUS(status)); |
|
} |
|
} |
|
ohash_delete(&strings); |
|
ohash_delete(&names); |
|
mpage = ohash_next(&mpages, &pslot); |
} |
} |
|
|
|
if (0 == nodb) |
|
SQL_EXEC("END TRANSACTION"); |
} |
} |
|
|
/* |
|
* Scan through all entries in the index file `idx' and prune those |
|
* entries in `ofile'. |
|
* Pruning consists of removing from `db', then invalidating the entry |
|
* in `idx' (zeroing its value size). |
|
*/ |
|
static void |
static void |
index_prune(const struct of *ofile, DB *db, const char *dbf, |
names_check(void) |
DB *idx, const char *idxf, int verb, |
|
recno_t *maxrec, recno_t **recs, size_t *recsz) |
|
{ |
{ |
const struct of *of; |
sqlite3_stmt *stmt; |
const char *fn; |
const char *name, *sec, *arch, *key; |
struct db_val *vbuf; |
int irc; |
unsigned seq, sseq; |
|
DBT key, val; |
|
size_t reccur; |
|
int ch; |
|
|
|
reccur = 0; |
sqlite3_prepare_v2(db, |
seq = R_FIRST; |
"SELECT name, sec, arch, key FROM (" |
while (0 == (ch = (*idx->seq)(idx, &key, &val, seq))) { |
"SELECT name AS key, pageid FROM names " |
seq = R_NEXT; |
"WHERE bits & ? AND NOT EXISTS (" |
*maxrec = *(recno_t *)key.data; |
"SELECT pageid FROM mlinks " |
if (0 == val.size) { |
"WHERE mlinks.pageid == names.pageid " |
if (reccur >= *recsz) { |
"AND mlinks.name == names.name" |
*recsz += MANDOC_SLOP; |
")" |
*recs = mandoc_realloc(*recs, |
") JOIN (" |
*recsz * sizeof(recno_t)); |
"SELECT * FROM mlinks GROUP BY pageid" |
} |
") USING (pageid);", |
(*recs)[(int)reccur] = *maxrec; |
-1, &stmt, NULL); |
reccur++; |
|
continue; |
|
} |
|
|
|
fn = (char *)val.data; |
if (SQLITE_OK != sqlite3_bind_int64(stmt, 1, NAME_TITLE)) |
for (of = ofile; of; of = of->next) |
say("", "%s", sqlite3_errmsg(db)); |
if (0 == strcmp(fn, of->fname)) |
|
break; |
|
|
|
if (NULL == of) |
while (SQLITE_ROW == (irc = sqlite3_step(stmt))) { |
continue; |
name = sqlite3_column_text(stmt, 0); |
|
sec = sqlite3_column_text(stmt, 1); |
|
arch = sqlite3_column_text(stmt, 2); |
|
key = sqlite3_column_text(stmt, 3); |
|
say("", "%s(%s%s%s) lacks mlink \"%s\"", name, sec, |
|
'\0' == *arch ? "" : "/", |
|
'\0' == *arch ? "" : arch, key); |
|
} |
|
sqlite3_finalize(stmt); |
|
} |
|
|
sseq = R_FIRST; |
static void |
while (0 == (ch = (*db->seq)(db, &key, &val, sseq))) { |
parse_cat(struct mpage *mpage, int fd) |
sseq = R_NEXT; |
{ |
assert(sizeof(struct db_val) == val.size); |
FILE *stream; |
vbuf = val.data; |
char *line, *p, *title; |
if (*maxrec != vbuf->rec) |
size_t len, plen, titlesz; |
continue; |
|
if (verb) |
|
printf("%s: Deleted keyword: %s\n", |
|
fn, (char *)key.data); |
|
ch = (*db->del)(db, &key, R_CURSOR); |
|
if (ch < 0) |
|
break; |
|
} |
|
if (ch < 0) { |
|
perror(dbf); |
|
exit((int)MANDOCLEVEL_SYSERR); |
|
} |
|
|
|
if (verb) |
stream = (-1 == fd) ? |
printf("%s: Deleted index\n", fn); |
fopen(mpage->mlinks->file, "r") : |
|
fdopen(fd, "r"); |
|
if (NULL == stream) { |
|
if (warnings) |
|
say(mpage->mlinks->file, "&fopen"); |
|
return; |
|
} |
|
|
val.size = 0; |
/* Skip to first blank line. */ |
ch = (*idx->put)(idx, &key, &val, R_CURSOR); |
|
if (ch < 0) { |
|
perror(idxf); |
|
exit((int)MANDOCLEVEL_SYSERR); |
|
} |
|
|
|
if (reccur >= *recsz) { |
while (NULL != (line = fgetln(stream, &len))) |
*recsz += MANDOC_SLOP; |
if ('\n' == *line) |
*recs = mandoc_realloc |
break; |
(*recs, *recsz * sizeof(recno_t)); |
|
|
/* |
|
* Assume the first line that is not indented |
|
* is the first section header. Skip to it. |
|
*/ |
|
|
|
while (NULL != (line = fgetln(stream, &len))) |
|
if ('\n' != *line && ' ' != *line) |
|
break; |
|
|
|
/* |
|
* Read up until the next section into a buffer. |
|
* Strip the leading and trailing newline from each read line, |
|
* appending a trailing space. |
|
* Ignore empty (whitespace-only) lines. |
|
*/ |
|
|
|
titlesz = 0; |
|
title = NULL; |
|
|
|
while (NULL != (line = fgetln(stream, &len))) { |
|
if (' ' != *line || '\n' != line[len - 1]) |
|
break; |
|
while (len > 0 && isspace((unsigned char)*line)) { |
|
line++; |
|
len--; |
} |
} |
|
if (1 == len) |
|
continue; |
|
title = mandoc_realloc(title, titlesz + len); |
|
memcpy(title + titlesz, line, len); |
|
titlesz += len; |
|
title[titlesz - 1] = ' '; |
|
} |
|
|
(*recs)[(int)reccur] = *maxrec; |
/* |
reccur++; |
* If no page content can be found, or the input line |
|
* is already the next section header, or there is no |
|
* trailing newline, reuse the page title as the page |
|
* description. |
|
*/ |
|
|
|
if (NULL == title || '\0' == *title) { |
|
if (warnings) |
|
say(mpage->mlinks->file, |
|
"Cannot find NAME section"); |
|
fclose(stream); |
|
free(title); |
|
return; |
} |
} |
(*maxrec)++; |
|
} |
|
|
|
/* |
title = mandoc_realloc(title, titlesz + 1); |
* Grow the buffer (if necessary) and copy in a binary string. |
title[titlesz] = '\0'; |
*/ |
|
static void |
|
buf_appendb(struct buf *buf, const void *cp, size_t sz) |
|
{ |
|
|
|
/* Overshoot by MANDOC_BUFSZ. */ |
/* |
|
* Skip to the first dash. |
|
* Use the remaining line as the description (no more than 70 |
|
* bytes). |
|
*/ |
|
|
while (buf->len + sz >= buf->size) { |
if (NULL != (p = strstr(title, "- "))) { |
buf->size = buf->len + sz + MANDOC_BUFSZ; |
for (p += 2; ' ' == *p || '\b' == *p; p++) |
buf->cp = mandoc_realloc(buf->cp, buf->size); |
/* Skip to next word. */ ; |
|
} else { |
|
if (warnings) |
|
say(mpage->mlinks->file, |
|
"No dash in title line"); |
|
p = title; |
} |
} |
|
|
memcpy(buf->cp + (int)buf->len, cp, sz); |
plen = strlen(p); |
buf->len += sz; |
|
|
/* Strip backspace-encoding from line. */ |
|
|
|
while (NULL != (line = memchr(p, '\b', plen))) { |
|
len = line - p; |
|
if (0 == len) { |
|
memmove(line, line + 1, plen--); |
|
continue; |
|
} |
|
memmove(line - 1, line + 1, plen - len); |
|
plen -= 2; |
|
} |
|
|
|
mpage->desc = mandoc_strdup(p); |
|
fclose(stream); |
|
free(title); |
} |
} |
|
|
/* |
/* |
* Append a nil-terminated string to the buffer. |
* Put a type/word pair into the word database for this particular file. |
* This can be invoked multiple times. |
|
* The buffer string will be nil-terminated. |
|
* If invoked multiple times, a space is put between strings. |
|
*/ |
*/ |
static void |
static void |
buf_append(struct buf *buf, const char *cp) |
putkey(const struct mpage *mpage, char *value, uint64_t type) |
{ |
{ |
size_t sz; |
char *cp; |
|
|
if (0 == (sz = strlen(cp))) |
assert(NULL != value); |
return; |
if (TYPE_arch == type) |
|
for (cp = value; *cp; cp++) |
if (buf->len) |
if (isupper((unsigned char)*cp)) |
buf->cp[(int)buf->len - 1] = ' '; |
*cp = _tolower((unsigned char)*cp); |
|
putkeys(mpage, value, strlen(value), type); |
buf_appendb(buf, cp, sz + 1); |
|
} |
} |
|
|
/* |
/* |
* Recursively add all text from a given node. |
* Grok all nodes at or below a certain mdoc node into putkey(). |
* This is optimised for general mdoc nodes in this context, which do |
|
* not consist of subexpressions and having a recursive call for n->next |
|
* would be wasteful. |
|
* The "f" variable should be 0 unless called from pmdoc_Nd for the |
|
* description buffer, which does not start at the beginning of the |
|
* buffer. |
|
*/ |
*/ |
static void |
static void |
buf_appendmdoc(struct buf *buf, const struct mdoc_node *n, int f) |
putmdockey(const struct mpage *mpage, |
|
const struct mdoc_node *n, uint64_t m) |
{ |
{ |
|
|
for ( ; n; n = n->next) { |
for ( ; NULL != n; n = n->next) { |
if (n->child) |
if (NULL != n->child) |
buf_appendmdoc(buf, n->child, f); |
putmdockey(mpage, n->child, m); |
|
if (MDOC_TEXT == n->type) |
if (MDOC_TEXT == n->type && f) { |
putkey(mpage, n->string, m); |
f = 0; |
|
buf_appendb(buf, n->string, |
|
strlen(n->string) + 1); |
|
} else if (MDOC_TEXT == n->type) |
|
buf_append(buf, n->string); |
|
|
|
} |
} |
} |
} |
|
|
/* ARGSUSED */ |
|
static void |
static void |
pmdoc_An(MDOC_ARGS) |
parse_man(struct mpage *mpage, const struct man_node *n) |
{ |
{ |
|
const struct man_node *head, *body; |
if (SEC_AUTHORS != n->sec) |
char *start, *title; |
|
char byte; |
|
size_t sz; |
|
|
|
if (NULL == n) |
return; |
return; |
|
|
buf_appendmdoc(buf, n->child, 0); |
/* |
hash_put(hash, buf, TYPE_An); |
* We're only searching for one thing: the first text child in |
|
* the BODY of a NAME section. Since we don't keep track of |
|
* sections in -man, run some hoops to find out whether we're in |
|
* the correct section or not. |
|
*/ |
|
|
|
if (MAN_BODY == n->type && MAN_SH == n->tok) { |
|
body = n; |
|
assert(body->parent); |
|
if (NULL != (head = body->parent->head) && |
|
1 == head->nchild && |
|
NULL != (head = (head->child)) && |
|
MAN_TEXT == head->type && |
|
0 == strcmp(head->string, "NAME") && |
|
NULL != body->child) { |
|
|
|
/* |
|
* Suck the entire NAME section into memory. |
|
* Yes, we might run away. |
|
* But too many manuals have big, spread-out |
|
* NAME sections over many lines. |
|
*/ |
|
|
|
title = NULL; |
|
man_deroff(&title, body); |
|
if (NULL == title) |
|
return; |
|
|
|
/* |
|
* Go through a special heuristic dance here. |
|
* Conventionally, one or more manual names are |
|
* comma-specified prior to a whitespace, then a |
|
* dash, then a description. Try to puzzle out |
|
* the name parts here. |
|
*/ |
|
|
|
start = title; |
|
for ( ;; ) { |
|
sz = strcspn(start, " ,"); |
|
if ('\0' == start[sz]) |
|
break; |
|
|
|
byte = start[sz]; |
|
start[sz] = '\0'; |
|
|
|
/* |
|
* Assume a stray trailing comma in the |
|
* name list if a name begins with a dash. |
|
*/ |
|
|
|
if ('-' == start[0] || |
|
('\\' == start[0] && '-' == start[1])) |
|
break; |
|
|
|
putkey(mpage, start, NAME_TITLE); |
|
|
|
if (' ' == byte) { |
|
start += sz + 1; |
|
break; |
|
} |
|
|
|
assert(',' == byte); |
|
start += sz + 1; |
|
while (' ' == *start) |
|
start++; |
|
} |
|
|
|
if (start == title) { |
|
putkey(mpage, start, NAME_TITLE); |
|
free(title); |
|
return; |
|
} |
|
|
|
while (isspace((unsigned char)*start)) |
|
start++; |
|
|
|
if (0 == strncmp(start, "-", 1)) |
|
start += 1; |
|
else if (0 == strncmp(start, "\\-\\-", 4)) |
|
start += 4; |
|
else if (0 == strncmp(start, "\\-", 2)) |
|
start += 2; |
|
else if (0 == strncmp(start, "\\(en", 4)) |
|
start += 4; |
|
else if (0 == strncmp(start, "\\(em", 4)) |
|
start += 4; |
|
|
|
while (' ' == *start) |
|
start++; |
|
|
|
mpage->desc = mandoc_strdup(start); |
|
free(title); |
|
return; |
|
} |
|
} |
|
|
|
for (n = n->child; n; n = n->next) { |
|
if (NULL != mpage->desc) |
|
break; |
|
parse_man(mpage, n); |
|
} |
} |
} |
|
|
static void |
static void |
hash_reset(DB **db) |
parse_mdoc(struct mpage *mpage, const struct mdoc_node *n) |
{ |
{ |
DB *hash; |
|
|
|
if (NULL != (hash = *db)) |
assert(NULL != n); |
(*hash->close)(hash); |
for (n = n->child; NULL != n; n = n->next) { |
|
switch (n->type) { |
*db = dbopen(NULL, O_CREAT|O_RDWR, 0644, DB_HASH, NULL); |
case (MDOC_ELEM): |
if (NULL == *db) { |
/* FALLTHROUGH */ |
perror("hash"); |
case (MDOC_BLOCK): |
exit((int)MANDOCLEVEL_SYSERR); |
/* FALLTHROUGH */ |
|
case (MDOC_HEAD): |
|
/* FALLTHROUGH */ |
|
case (MDOC_BODY): |
|
/* FALLTHROUGH */ |
|
case (MDOC_TAIL): |
|
if (NULL != mdocs[n->tok].fp) |
|
if (0 == (*mdocs[n->tok].fp)(mpage, n)) |
|
break; |
|
if (mdocs[n->tok].mask) |
|
putmdockey(mpage, n->child, |
|
mdocs[n->tok].mask); |
|
break; |
|
default: |
|
assert(MDOC_ROOT != n->type); |
|
continue; |
|
} |
|
if (NULL != n->child) |
|
parse_mdoc(mpage, n); |
} |
} |
} |
} |
|
|
/* ARGSUSED */ |
static int |
static void |
parse_mdoc_Fd(struct mpage *mpage, const struct mdoc_node *n) |
pmdoc_Fd(MDOC_ARGS) |
|
{ |
{ |
const char *start, *end; |
const char *start, *end; |
size_t sz; |
size_t sz; |
|
|
if (SEC_SYNOPSIS != n->sec) |
|
return; |
|
if (NULL == (n = n->child) || MDOC_TEXT != n->type) |
|
return; |
|
|
|
|
if (SEC_SYNOPSIS != n->sec || |
|
NULL == (n = n->child) || |
|
MDOC_TEXT != n->type) |
|
return(0); |
|
|
/* |
/* |
* Only consider those `Fd' macro fields that begin with an |
* Only consider those `Fd' macro fields that begin with an |
* "inclusion" token (versus, e.g., #define). |
* "inclusion" token (versus, e.g., #define). |
*/ |
*/ |
|
|
if (strcmp("#include", n->string)) |
if (strcmp("#include", n->string)) |
return; |
return(0); |
|
|
if (NULL == (n = n->next) || MDOC_TEXT != n->type) |
if (NULL == (n = n->next) || MDOC_TEXT != n->type) |
return; |
return(0); |
|
|
/* |
/* |
* Strip away the enclosing angle brackets and make sure we're |
* Strip away the enclosing angle brackets and make sure we're |
Line 781 pmdoc_Fd(MDOC_ARGS) |
|
Line 1555 pmdoc_Fd(MDOC_ARGS) |
|
start++; |
start++; |
|
|
if (0 == (sz = strlen(start))) |
if (0 == (sz = strlen(start))) |
return; |
return(0); |
|
|
end = &start[(int)sz - 1]; |
end = &start[(int)sz - 1]; |
if ('>' == *end || '"' == *end) |
if ('>' == *end || '"' == *end) |
end--; |
end--; |
|
|
assert(end >= start); |
if (end > start) |
|
putkeys(mpage, start, end - start + 1, TYPE_In); |
|
return(0); |
|
} |
|
|
buf_appendb(buf, start, (size_t)(end - start + 1)); |
static int |
buf_appendb(buf, "", 1); |
parse_mdoc_Fn(struct mpage *mpage, const struct mdoc_node *n) |
|
{ |
|
char *cp; |
|
|
hash_put(hash, buf, TYPE_In); |
if (NULL == (n = n->child) || MDOC_TEXT != n->type) |
|
return(0); |
|
|
|
/* |
|
* Parse: .Fn "struct type *name" "char *arg". |
|
* First strip away pointer symbol. |
|
* Then store the function name, then type. |
|
* Finally, store the arguments. |
|
*/ |
|
|
|
if (NULL == (cp = strrchr(n->string, ' '))) |
|
cp = n->string; |
|
|
|
while ('*' == *cp) |
|
cp++; |
|
|
|
putkey(mpage, cp, TYPE_Fn); |
|
|
|
if (n->string < cp) |
|
putkeys(mpage, n->string, cp - n->string, TYPE_Ft); |
|
|
|
for (n = n->next; NULL != n; n = n->next) |
|
if (MDOC_TEXT == n->type) |
|
putkey(mpage, n->string, TYPE_Fa); |
|
|
|
return(0); |
} |
} |
|
|
/* ARGSUSED */ |
static int |
static void |
parse_mdoc_Xr(struct mpage *mpage, const struct mdoc_node *n) |
pmdoc_Cd(MDOC_ARGS) |
|
{ |
{ |
|
char *cp; |
if (SEC_SYNOPSIS != n->sec) |
|
return; |
|
|
|
buf_appendmdoc(buf, n->child, 0); |
if (NULL == (n = n->child)) |
hash_put(hash, buf, TYPE_Cd); |
return(0); |
|
|
|
if (NULL == n->next) { |
|
putkey(mpage, n->string, TYPE_Xr); |
|
return(0); |
|
} |
|
|
|
mandoc_asprintf(&cp, "%s(%s)", n->string, n->next->string); |
|
putkey(mpage, cp, TYPE_Xr); |
|
free(cp); |
|
return(0); |
} |
} |
|
|
/* ARGSUSED */ |
static int |
static void |
parse_mdoc_Nd(struct mpage *mpage, const struct mdoc_node *n) |
pmdoc_In(MDOC_ARGS) |
|
{ |
{ |
|
|
if (SEC_SYNOPSIS != n->sec) |
|
return; |
|
if (NULL == n->child || MDOC_TEXT != n->child->type) |
|
return; |
|
|
|
buf_append(buf, n->child->string); |
if (MDOC_BODY == n->type) |
hash_put(hash, buf, TYPE_In); |
mdoc_deroff(&mpage->desc, n); |
|
return(0); |
} |
} |
|
|
/* ARGSUSED */ |
static int |
static void |
parse_mdoc_Nm(struct mpage *mpage, const struct mdoc_node *n) |
pmdoc_Fn(MDOC_ARGS) |
|
{ |
{ |
const char *cp; |
|
|
|
if (SEC_SYNOPSIS != n->sec) |
|
return; |
|
if (NULL == n->child || MDOC_TEXT != n->child->type) |
|
return; |
|
|
|
/* .Fn "struct type *arg" "foo" */ |
if (SEC_NAME == n->sec) |
|
putmdockey(mpage, n->child, NAME_TITLE); |
|
else if (SEC_SYNOPSIS == n->sec && MDOC_HEAD == n->type) |
|
putmdockey(mpage, n->child, NAME_SYN); |
|
return(0); |
|
} |
|
|
cp = strrchr(n->child->string, ' '); |
static int |
if (NULL == cp) |
parse_mdoc_Sh(struct mpage *mpage, const struct mdoc_node *n) |
cp = n->child->string; |
{ |
|
|
/* Strip away pointer symbol. */ |
return(SEC_CUSTOM == n->sec && MDOC_HEAD == n->type); |
|
} |
|
|
while ('*' == *cp) |
static int |
cp++; |
parse_mdoc_head(struct mpage *mpage, const struct mdoc_node *n) |
|
{ |
|
|
buf_append(buf, cp); |
return(MDOC_HEAD == n->type); |
hash_put(hash, buf, TYPE_Fn); |
|
} |
} |
|
|
/* ARGSUSED */ |
static int |
static void |
parse_mdoc_body(struct mpage *mpage, const struct mdoc_node *n) |
pmdoc_St(MDOC_ARGS) |
|
{ |
{ |
|
|
if (SEC_STANDARDS != n->sec) |
|
return; |
|
if (NULL == n->child || MDOC_TEXT != n->child->type) |
|
return; |
|
|
|
buf_append(buf, n->child->string); |
return(MDOC_BODY == n->type); |
hash_put(hash, buf, TYPE_St); |
|
} |
} |
|
|
/* ARGSUSED */ |
/* |
|
* Add a string to the hash table for the current manual. |
|
* Each string has a bitmask telling which macros it belongs to. |
|
* When we finish the manual, we'll dump the table. |
|
*/ |
static void |
static void |
pmdoc_Xr(MDOC_ARGS) |
putkeys(const struct mpage *mpage, |
|
const char *cp, size_t sz, uint64_t v) |
{ |
{ |
|
struct ohash *htab; |
|
struct str *s; |
|
const char *end; |
|
unsigned int slot; |
|
int i; |
|
|
if (NULL == (n = n->child)) |
if (0 == sz) |
return; |
return; |
|
|
buf_appendb(buf, n->string, strlen(n->string)); |
if (TYPE_Nm & v) { |
|
htab = &names; |
|
v &= name_mask; |
|
name_mask &= ~NAME_FIRST; |
|
if (debug > 1) |
|
say(mpage->mlinks->file, |
|
"Adding name %*s", sz, cp); |
|
} else { |
|
htab = &strings; |
|
if (debug > 1) |
|
for (i = 0; i < mansearch_keymax; i++) |
|
if (1 << i & v) |
|
say(mpage->mlinks->file, |
|
"Adding key %s=%*s", |
|
mansearch_keynames[i], sz, cp); |
|
} |
|
|
if (NULL != (n = n->next)) { |
end = cp + sz; |
buf_appendb(buf, ".", 1); |
slot = ohash_qlookupi(htab, cp, &end); |
buf_appendb(buf, n->string, strlen(n->string) + 1); |
s = ohash_find(htab, slot); |
|
|
|
if (NULL != s && mpage == s->mpage) { |
|
s->mask |= v; |
|
return; |
|
} else if (NULL == s) { |
|
s = mandoc_calloc(sizeof(struct str) + sz + 1, 1); |
|
memcpy(s->key, cp, sz); |
|
ohash_insert(htab, slot, s); |
|
} |
|
s->mpage = mpage; |
|
s->mask = v; |
|
} |
|
|
|
/* |
|
* Take a Unicode codepoint and produce its UTF-8 encoding. |
|
* This isn't the best way to do this, but it works. |
|
* The magic numbers are from the UTF-8 packaging. |
|
* They're not as scary as they seem: read the UTF-8 spec for details. |
|
*/ |
|
static size_t |
|
utf8(unsigned int cp, char out[7]) |
|
{ |
|
size_t rc; |
|
|
|
rc = 0; |
|
if (cp <= 0x0000007F) { |
|
rc = 1; |
|
out[0] = (char)cp; |
|
} else if (cp <= 0x000007FF) { |
|
rc = 2; |
|
out[0] = (cp >> 6 & 31) | 192; |
|
out[1] = (cp & 63) | 128; |
|
} else if (cp <= 0x0000FFFF) { |
|
rc = 3; |
|
out[0] = (cp >> 12 & 15) | 224; |
|
out[1] = (cp >> 6 & 63) | 128; |
|
out[2] = (cp & 63) | 128; |
|
} else if (cp <= 0x001FFFFF) { |
|
rc = 4; |
|
out[0] = (cp >> 18 & 7) | 240; |
|
out[1] = (cp >> 12 & 63) | 128; |
|
out[2] = (cp >> 6 & 63) | 128; |
|
out[3] = (cp & 63) | 128; |
|
} else if (cp <= 0x03FFFFFF) { |
|
rc = 5; |
|
out[0] = (cp >> 24 & 3) | 248; |
|
out[1] = (cp >> 18 & 63) | 128; |
|
out[2] = (cp >> 12 & 63) | 128; |
|
out[3] = (cp >> 6 & 63) | 128; |
|
out[4] = (cp & 63) | 128; |
|
} else if (cp <= 0x7FFFFFFF) { |
|
rc = 6; |
|
out[0] = (cp >> 30 & 1) | 252; |
|
out[1] = (cp >> 24 & 63) | 128; |
|
out[2] = (cp >> 18 & 63) | 128; |
|
out[3] = (cp >> 12 & 63) | 128; |
|
out[4] = (cp >> 6 & 63) | 128; |
|
out[5] = (cp & 63) | 128; |
} else |
} else |
buf_appendb(buf, ".", 2); |
return(0); |
|
|
hash_put(hash, buf, TYPE_Xr); |
out[rc] = '\0'; |
|
return(rc); |
} |
} |
|
|
/* ARGSUSED */ |
/* |
|
* Store the rendered version of a key, or alias the pointer |
|
* if the key contains no escape sequences. |
|
*/ |
static void |
static void |
pmdoc_Vt(MDOC_ARGS) |
render_key(struct mchars *mc, struct str *key) |
{ |
{ |
const char *start; |
size_t sz, bsz, pos; |
size_t sz; |
char utfbuf[7], res[6]; |
|
char *buf; |
if (SEC_SYNOPSIS != n->sec) |
const char *seq, *cpp, *val; |
return; |
int len, u; |
if (MDOC_Vt == n->tok && MDOC_BODY != n->type) |
enum mandoc_esc esc; |
return; |
|
if (NULL == n->last || MDOC_TEXT != n->last->type) |
|
return; |
|
|
|
/* |
assert(NULL == key->rendered); |
* Strip away leading pointer symbol '*' and trailing ';'. |
|
*/ |
|
|
|
start = n->last->string; |
res[0] = '\\'; |
|
res[1] = '\t'; |
|
res[2] = ASCII_NBRSP; |
|
res[3] = ASCII_HYPH; |
|
res[4] = ASCII_BREAK; |
|
res[5] = '\0'; |
|
|
while ('*' == *start) |
val = key->key; |
start++; |
bsz = strlen(val); |
|
|
if (0 == (sz = strlen(start))) |
/* |
|
* Pre-check: if we have no stop-characters, then set the |
|
* pointer as ourselvse and get out of here. |
|
*/ |
|
if (strcspn(val, res) == bsz) { |
|
key->rendered = key->key; |
return; |
return; |
|
} |
|
|
if (';' == start[(int)sz - 1]) |
/* Pre-allocate by the length of the input */ |
sz--; |
|
|
|
if (0 == sz) |
buf = mandoc_malloc(++bsz); |
return; |
pos = 0; |
|
|
buf_appendb(buf, start, sz); |
while ('\0' != *val) { |
buf_appendb(buf, "", 1); |
/* |
hash_put(hash, buf, TYPE_Va); |
* Halt on the first escape sequence. |
} |
* This also halts on the end of string, in which case |
|
* we just copy, fallthrough, and exit the loop. |
|
*/ |
|
if ((sz = strcspn(val, res)) > 0) { |
|
memcpy(&buf[pos], val, sz); |
|
pos += sz; |
|
val += sz; |
|
} |
|
|
/* ARGSUSED */ |
switch (*val) { |
static void |
case (ASCII_HYPH): |
pmdoc_Fo(MDOC_ARGS) |
buf[pos++] = '-'; |
{ |
val++; |
|
continue; |
if (SEC_SYNOPSIS != n->sec || MDOC_HEAD != n->type) |
case ('\t'): |
return; |
/* FALLTHROUGH */ |
if (NULL == n->child || MDOC_TEXT != n->child->type) |
case (ASCII_NBRSP): |
return; |
buf[pos++] = ' '; |
|
val++; |
|
/* FALLTHROUGH */ |
|
case (ASCII_BREAK): |
|
continue; |
|
default: |
|
break; |
|
} |
|
if ('\\' != *val) |
|
break; |
|
|
buf_append(buf, n->child->string); |
/* Read past the slash. */ |
hash_put(hash, buf, TYPE_Fn); |
|
} |
|
|
|
|
val++; |
|
|
/* ARGSUSED */ |
/* |
static void |
* Parse the escape sequence and see if it's a |
pmdoc_Nd(MDOC_ARGS) |
* predefined character or special character. |
{ |
*/ |
|
|
if (MDOC_BODY != n->type) |
esc = mandoc_escape |
return; |
((const char **)&val, &seq, &len); |
|
if (ESCAPE_ERROR == esc) |
|
break; |
|
if (ESCAPE_SPECIAL != esc) |
|
continue; |
|
|
buf_appendmdoc(dbuf, n->child, 1); |
/* |
buf_appendmdoc(buf, n->child, 0); |
* Render the special character |
|
* as either UTF-8 or ASCII. |
|
*/ |
|
|
hash_put(hash, buf, TYPE_Nd); |
if (write_utf8) { |
} |
if (0 == (u = mchars_spec2cp(mc, seq, len))) |
|
continue; |
|
cpp = utfbuf; |
|
if (0 == (sz = utf8(u, utfbuf))) |
|
continue; |
|
sz = strlen(cpp); |
|
} else { |
|
cpp = mchars_spec2str(mc, seq, len, &sz); |
|
if (NULL == cpp) |
|
continue; |
|
if (ASCII_NBRSP == *cpp) { |
|
cpp = " "; |
|
sz = 1; |
|
} |
|
} |
|
|
/* ARGSUSED */ |
/* Copy the rendered glyph into the stream. */ |
static void |
|
pmdoc_Er(MDOC_ARGS) |
|
{ |
|
|
|
if (SEC_ERRORS != n->sec) |
bsz += sz; |
return; |
buf = mandoc_realloc(buf, bsz); |
|
memcpy(&buf[pos], cpp, sz); |
buf_appendmdoc(buf, n->child, 0); |
pos += sz; |
hash_put(hash, buf, TYPE_Er); |
} |
} |
|
|
|
/* ARGSUSED */ |
buf[pos] = '\0'; |
static void |
key->rendered = buf; |
pmdoc_Ev(MDOC_ARGS) |
|
{ |
|
|
|
if (SEC_ENVIRONMENT != n->sec) |
|
return; |
|
|
|
buf_appendmdoc(buf, n->child, 0); |
|
hash_put(hash, buf, TYPE_Ev); |
|
} |
} |
|
|
/* ARGSUSED */ |
|
static void |
static void |
pmdoc_Pa(MDOC_ARGS) |
dbadd_mlink(const struct mlink *mlink) |
{ |
{ |
|
size_t i; |
|
|
if (SEC_FILES != n->sec) |
i = 1; |
return; |
SQL_BIND_TEXT(stmts[STMT_INSERT_LINK], i, mlink->dsec); |
|
SQL_BIND_TEXT(stmts[STMT_INSERT_LINK], i, mlink->arch); |
buf_appendmdoc(buf, n->child, 0); |
SQL_BIND_TEXT(stmts[STMT_INSERT_LINK], i, mlink->name); |
hash_put(hash, buf, TYPE_Pa); |
SQL_BIND_INT64(stmts[STMT_INSERT_LINK], i, mlink->mpage->recno); |
|
SQL_STEP(stmts[STMT_INSERT_LINK]); |
|
sqlite3_reset(stmts[STMT_INSERT_LINK]); |
} |
} |
|
|
/* ARGSUSED */ |
/* |
|
* Flush the current page's terms (and their bits) into the database. |
|
* Wrap the entire set of additions in a transaction to make sqlite be a |
|
* little faster. |
|
* Also, handle escape sequences at the last possible moment. |
|
*/ |
static void |
static void |
pmdoc_Nm(MDOC_ARGS) |
dbadd(struct mpage *mpage, struct mchars *mc) |
{ |
{ |
|
struct mlink *mlink; |
if (SEC_NAME == n->sec) { |
struct str *key; |
buf_appendmdoc(buf, n->child, 0); |
size_t i; |
hash_put(hash, buf, TYPE_Nm); |
unsigned int slot; |
return; |
|
} else if (SEC_SYNOPSIS != n->sec || MDOC_HEAD != n->type) |
|
return; |
|
|
|
if (NULL == n->child) |
mlink = mpage->mlinks; |
buf_append(buf, m->name); |
|
|
|
buf_appendmdoc(buf, n->child, 0); |
if (nodb) { |
hash_put(hash, buf, TYPE_Nm); |
while (NULL != mlink) { |
} |
fputs(mlink->name, stdout); |
|
if (NULL == mlink->next || |
static void |
strcmp(mlink->dsec, mlink->next->dsec) || |
hash_put(DB *db, const struct buf *buf, uint64_t mask) |
strcmp(mlink->fsec, mlink->next->fsec) || |
{ |
strcmp(mlink->arch, mlink->next->arch)) { |
DBT key, val; |
putchar('('); |
int rc; |
if ('\0' == *mlink->dsec) |
|
fputs(mlink->fsec, stdout); |
if (buf->len < 2) |
else |
|
fputs(mlink->dsec, stdout); |
|
if ('\0' != *mlink->arch) |
|
printf("/%s", mlink->arch); |
|
putchar(')'); |
|
} |
|
mlink = mlink->next; |
|
if (NULL != mlink) |
|
fputs(", ", stdout); |
|
} |
|
printf(" - %s\n", mpage->desc); |
return; |
return; |
|
} |
|
|
key.data = buf->cp; |
if (debug) |
key.size = buf->len; |
say(mlink->file, "Adding to database"); |
|
|
if ((rc = (*db->get)(db, &key, &val, 0)) < 0) { |
i = 1; |
perror("hash"); |
SQL_BIND_TEXT(stmts[STMT_INSERT_PAGE], i, mpage->desc); |
exit((int)MANDOCLEVEL_SYSERR); |
SQL_BIND_INT(stmts[STMT_INSERT_PAGE], i, FORM_SRC == mpage->form); |
} else if (0 == rc) |
SQL_STEP(stmts[STMT_INSERT_PAGE]); |
mask |= *(uint64_t *)val.data; |
mpage->recno = sqlite3_last_insert_rowid(db); |
|
sqlite3_reset(stmts[STMT_INSERT_PAGE]); |
|
|
val.data = &mask; |
while (NULL != mlink) { |
val.size = sizeof(uint64_t); |
dbadd_mlink(mlink); |
|
mlink = mlink->next; |
|
} |
|
mlink = mpage->mlinks; |
|
|
if ((rc = (*db->put)(db, &key, &val, 0)) < 0) { |
for (key = ohash_first(&names, &slot); NULL != key; |
perror("hash"); |
key = ohash_next(&names, &slot)) { |
exit((int)MANDOCLEVEL_SYSERR); |
assert(key->mpage == mpage); |
} |
if (NULL == key->rendered) |
|
render_key(mc, key); |
|
i = 1; |
|
SQL_BIND_INT64(stmts[STMT_INSERT_NAME], i, key->mask); |
|
SQL_BIND_TEXT(stmts[STMT_INSERT_NAME], i, key->rendered); |
|
SQL_BIND_INT64(stmts[STMT_INSERT_NAME], i, mpage->recno); |
|
SQL_STEP(stmts[STMT_INSERT_NAME]); |
|
sqlite3_reset(stmts[STMT_INSERT_NAME]); |
|
if (key->rendered != key->key) |
|
free(key->rendered); |
|
free(key); |
|
} |
|
for (key = ohash_first(&strings, &slot); NULL != key; |
|
key = ohash_next(&strings, &slot)) { |
|
assert(key->mpage == mpage); |
|
if (NULL == key->rendered) |
|
render_key(mc, key); |
|
i = 1; |
|
SQL_BIND_INT64(stmts[STMT_INSERT_KEY], i, key->mask); |
|
SQL_BIND_TEXT(stmts[STMT_INSERT_KEY], i, key->rendered); |
|
SQL_BIND_INT64(stmts[STMT_INSERT_KEY], i, mpage->recno); |
|
SQL_STEP(stmts[STMT_INSERT_KEY]); |
|
sqlite3_reset(stmts[STMT_INSERT_KEY]); |
|
if (key->rendered != key->key) |
|
free(key->rendered); |
|
free(key); |
|
} |
} |
} |
|
|
static void |
static void |
dbt_put(DB *db, const char *dbn, DBT *key, DBT *val) |
dbprune(void) |
{ |
{ |
|
struct mpage *mpage; |
|
struct mlink *mlink; |
|
size_t i; |
|
unsigned int slot; |
|
|
assert(key->size); |
if (0 == nodb) |
assert(val->size); |
SQL_EXEC("BEGIN TRANSACTION"); |
|
|
if (0 == (*db->put)(db, key, val, 0)) |
for (mpage = ohash_first(&mpages, &slot); NULL != mpage; |
return; |
mpage = ohash_next(&mpages, &slot)) { |
|
mlink = mpage->mlinks; |
perror(dbn); |
if (debug) |
exit((int)MANDOCLEVEL_SYSERR); |
say(mlink->file, "Deleting from database"); |
/* NOTREACHED */ |
if (nodb) |
|
continue; |
|
for ( ; NULL != mlink; mlink = mlink->next) { |
|
i = 1; |
|
SQL_BIND_TEXT(stmts[STMT_DELETE_PAGE], |
|
i, mlink->dsec); |
|
SQL_BIND_TEXT(stmts[STMT_DELETE_PAGE], |
|
i, mlink->arch); |
|
SQL_BIND_TEXT(stmts[STMT_DELETE_PAGE], |
|
i, mlink->name); |
|
SQL_STEP(stmts[STMT_DELETE_PAGE]); |
|
sqlite3_reset(stmts[STMT_DELETE_PAGE]); |
|
} |
|
} |
|
|
|
if (0 == nodb) |
|
SQL_EXEC("END TRANSACTION"); |
} |
} |
|
|
/* |
/* |
* Call out to per-macro handlers after clearing the persistent database |
* Close an existing database and its prepared statements. |
* key. If the macro sets the database key, flush it to the database. |
* If "real" is not set, rename the temporary file into the real one. |
*/ |
*/ |
static void |
static void |
pmdoc_node(MDOC_ARGS) |
dbclose(int real) |
{ |
{ |
|
size_t i; |
|
int status; |
|
pid_t child; |
|
|
if (NULL == n) |
if (nodb) |
return; |
return; |
|
|
switch (n->type) { |
for (i = 0; i < STMT__MAX; i++) { |
case (MDOC_HEAD): |
sqlite3_finalize(stmts[i]); |
/* FALLTHROUGH */ |
stmts[i] = NULL; |
case (MDOC_BODY): |
} |
/* FALLTHROUGH */ |
|
case (MDOC_TAIL): |
|
/* FALLTHROUGH */ |
|
case (MDOC_BLOCK): |
|
/* FALLTHROUGH */ |
|
case (MDOC_ELEM): |
|
if (NULL == mdocs[n->tok]) |
|
break; |
|
|
|
buf->len = 0; |
sqlite3_close(db); |
(*mdocs[n->tok])(hash, buf, dbuf, n, m); |
db = NULL; |
break; |
|
|
if (real) |
|
return; |
|
|
|
if ('\0' == *tempfilename) { |
|
if (-1 == rename(MANDOC_DB "~", MANDOC_DB)) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say(MANDOC_DB, "&rename"); |
|
} |
|
return; |
|
} |
|
|
|
switch (child = fork()) { |
|
case (-1): |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say("", "&fork cmp"); |
|
return; |
|
case (0): |
|
execlp("cmp", "cmp", "-s", |
|
tempfilename, MANDOC_DB, NULL); |
|
say("", "&exec cmp"); |
|
exit(0); |
default: |
default: |
break; |
break; |
} |
} |
|
if (-1 == waitpid(child, &status, 0)) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say("", "&wait cmp"); |
|
} else if (WIFSIGNALED(status)) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say("", "cmp died from signal %d", WTERMSIG(status)); |
|
} else if (WEXITSTATUS(status)) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say(MANDOC_DB, |
|
"Data changed, but cannot replace database"); |
|
} |
|
|
pmdoc_node(hash, buf, dbuf, n->child, m); |
*strrchr(tempfilename, '/') = '\0'; |
pmdoc_node(hash, buf, dbuf, n->next, m); |
switch (child = fork()) { |
|
case (-1): |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say("", "&fork rm"); |
|
return; |
|
case (0): |
|
execlp("rm", "rm", "-rf", tempfilename, NULL); |
|
say("", "&exec rm"); |
|
exit((int)MANDOCLEVEL_SYSERR); |
|
default: |
|
break; |
|
} |
|
if (-1 == waitpid(child, &status, 0)) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say("", "&wait rm"); |
|
} else if (WIFSIGNALED(status) || WEXITSTATUS(status)) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say("", "%s: Cannot remove temporary directory", |
|
tempfilename); |
|
} |
} |
} |
|
|
|
/* |
|
* This is straightforward stuff. |
|
* Open a database connection to a "temporary" database, then open a set |
|
* of prepared statements we'll use over and over again. |
|
* If "real" is set, we use the existing database; if not, we truncate a |
|
* temporary one. |
|
* Must be matched by dbclose(). |
|
*/ |
static int |
static int |
pman_node(MAN_ARGS) |
dbopen(int real) |
{ |
{ |
const struct man_node *head, *body; |
const char *sql; |
const char *start, *sv; |
int rc, ofl; |
size_t sz; |
|
|
|
if (NULL == n) |
if (nodb) |
return(0); |
return(1); |
|
|
/* |
*tempfilename = '\0'; |
* We're only searching for one thing: the first text child in |
ofl = SQLITE_OPEN_READWRITE; |
* the BODY of a NAME section. Since we don't keep track of |
|
* sections in -man, run some hoops to find out whether we're in |
|
* the correct section or not. |
|
*/ |
|
|
|
if (MAN_BODY == n->type && MAN_SH == n->tok) { |
if (real) { |
body = n; |
rc = sqlite3_open_v2(MANDOC_DB, &db, ofl, NULL); |
assert(body->parent); |
if (SQLITE_OK != rc) { |
if (NULL != (head = body->parent->head) && |
exitcode = (int)MANDOCLEVEL_SYSERR; |
1 == head->nchild && |
say(MANDOC_DB, "%s", sqlite3_errmsg(db)); |
NULL != (head = (head->child)) && |
return(0); |
MAN_TEXT == head->type && |
} |
0 == strcmp(head->string, "NAME") && |
goto prepare_statements; |
NULL != (body = body->child) && |
} |
MAN_TEXT == body->type) { |
|
|
|
assert(body->string); |
ofl |= SQLITE_OPEN_CREATE | SQLITE_OPEN_EXCLUSIVE; |
start = sv = body->string; |
|
|
|
/* |
remove(MANDOC_DB "~"); |
* Go through a special heuristic dance here. |
rc = sqlite3_open_v2(MANDOC_DB "~", &db, ofl, NULL); |
* This is why -man manuals are great! |
if (SQLITE_OK == rc) |
* (I'm being sarcastic: my eyes are bleeding.) |
goto create_tables; |
* Conventionally, one or more manual names are |
if (MPARSE_QUICK & mparse_options) { |
* comma-specified prior to a whitespace, then a |
exitcode = (int)MANDOCLEVEL_SYSERR; |
* dash, then a description. Try to puzzle out |
say(MANDOC_DB "~", "%s", sqlite3_errmsg(db)); |
* the name parts here. |
return(0); |
*/ |
} |
|
|
for ( ;; ) { |
if (strlcpy(tempfilename, "/tmp/mandocdb.XXXXXX", |
sz = strcspn(start, " ,"); |
sizeof(tempfilename)) >= sizeof(tempfilename)) { |
if ('\0' == start[(int)sz]) |
exitcode = (int)MANDOCLEVEL_SYSERR; |
break; |
say("", "/tmp/mandocdb.XXXXXX: Filename too long"); |
|
return(0); |
|
} |
|
if (NULL == mkdtemp(tempfilename)) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say("", "&%s", tempfilename); |
|
return(0); |
|
} |
|
if (strlcat(tempfilename, "/" MANDOC_DB, |
|
sizeof(tempfilename)) >= sizeof(tempfilename)) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say("", "%s/" MANDOC_DB ": Filename too long", |
|
tempfilename); |
|
return(0); |
|
} |
|
rc = sqlite3_open_v2(tempfilename, &db, ofl, NULL); |
|
if (SQLITE_OK != rc) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say("", "%s: %s", tempfilename, sqlite3_errmsg(db)); |
|
return(0); |
|
} |
|
|
buf->len = 0; |
create_tables: |
buf_appendb(buf, start, sz); |
sql = "CREATE TABLE \"mpages\" (\n" |
buf_appendb(buf, "", 1); |
" \"desc\" TEXT NOT NULL,\n" |
|
" \"form\" INTEGER NOT NULL,\n" |
|
" \"id\" INTEGER PRIMARY KEY AUTOINCREMENT NOT NULL\n" |
|
");\n" |
|
"\n" |
|
"CREATE TABLE \"mlinks\" (\n" |
|
" \"sec\" TEXT NOT NULL,\n" |
|
" \"arch\" TEXT NOT NULL,\n" |
|
" \"name\" TEXT NOT NULL,\n" |
|
" \"pageid\" INTEGER NOT NULL REFERENCES mpages(id) " |
|
"ON DELETE CASCADE\n" |
|
");\n" |
|
"\n" |
|
"CREATE TABLE \"names\" (\n" |
|
" \"bits\" INTEGER NOT NULL,\n" |
|
" \"name\" TEXT NOT NULL,\n" |
|
" \"pageid\" INTEGER NOT NULL REFERENCES mpages(id) " |
|
"ON DELETE CASCADE\n" |
|
");\n" |
|
"\n" |
|
"CREATE TABLE \"keys\" (\n" |
|
" \"bits\" INTEGER NOT NULL,\n" |
|
" \"key\" TEXT NOT NULL,\n" |
|
" \"pageid\" INTEGER NOT NULL REFERENCES mpages(id) " |
|
"ON DELETE CASCADE\n" |
|
");\n"; |
|
|
hash_put(hash, buf, TYPE_Nm); |
if (SQLITE_OK != sqlite3_exec(db, sql, NULL, NULL, NULL)) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say(MANDOC_DB, "%s", sqlite3_errmsg(db)); |
|
return(0); |
|
} |
|
|
if (' ' == start[(int)sz]) { |
prepare_statements: |
start += (int)sz + 1; |
SQL_EXEC("PRAGMA foreign_keys = ON"); |
break; |
sql = "DELETE FROM mpages WHERE id IN " |
} |
"(SELECT pageid FROM mlinks WHERE " |
|
"sec=? AND arch=? AND name=?)"; |
|
sqlite3_prepare_v2(db, sql, -1, &stmts[STMT_DELETE_PAGE], NULL); |
|
sql = "INSERT INTO mpages " |
|
"(desc,form) VALUES (?,?)"; |
|
sqlite3_prepare_v2(db, sql, -1, &stmts[STMT_INSERT_PAGE], NULL); |
|
sql = "INSERT INTO mlinks " |
|
"(sec,arch,name,pageid) VALUES (?,?,?,?)"; |
|
sqlite3_prepare_v2(db, sql, -1, &stmts[STMT_INSERT_LINK], NULL); |
|
sql = "INSERT INTO names " |
|
"(bits,name,pageid) VALUES (?,?,?)"; |
|
sqlite3_prepare_v2(db, sql, -1, &stmts[STMT_INSERT_NAME], NULL); |
|
sql = "INSERT INTO keys " |
|
"(bits,key,pageid) VALUES (?,?,?)"; |
|
sqlite3_prepare_v2(db, sql, -1, &stmts[STMT_INSERT_KEY], NULL); |
|
|
assert(',' == start[(int)sz]); |
#ifndef __APPLE__ |
start += (int)sz + 1; |
/* |
while (' ' == *start) |
* When opening a new database, we can turn off |
start++; |
* synchronous mode for much better performance. |
} |
*/ |
|
|
buf->len = 0; |
if (real) |
|
SQL_EXEC("PRAGMA synchronous = OFF"); |
|
#endif |
|
|
if (sv == start) { |
return(1); |
buf_append(buf, start); |
} |
return(1); |
|
} |
|
|
|
while (' ' == *start) |
static void * |
start++; |
hash_halloc(size_t sz, void *arg) |
|
{ |
|
|
if (0 == strncmp(start, "-", 1)) |
return(mandoc_calloc(sz, 1)); |
start += 1; |
} |
else if (0 == strncmp(start, "\\-", 2)) |
|
start += 2; |
|
else if (0 == strncmp(start, "\\(en", 4)) |
|
start += 4; |
|
else if (0 == strncmp(start, "\\(em", 4)) |
|
start += 4; |
|
|
|
while (' ' == *start) |
static void * |
start++; |
hash_alloc(size_t sz, void *arg) |
|
{ |
|
|
sz = strlen(start) + 1; |
return(mandoc_malloc(sz)); |
buf_appendb(dbuf, start, sz); |
|
buf_appendb(buf, start, sz); |
|
|
|
hash_put(hash, buf, TYPE_Nd); |
|
} |
|
} |
|
|
|
for (n = n->child; n; n = n->next) |
|
if (pman_node(hash, buf, dbuf, n)) |
|
return(1); |
|
|
|
return(0); |
|
} |
} |
|
|
static void |
static void |
ofile_argbuild(char *argv[], int argc, int verb, struct of **of) |
hash_free(void *p, size_t sz, void *arg) |
{ |
{ |
int i; |
|
struct of *nof; |
|
|
|
for (i = 0; i < argc; i++) { |
free(p); |
nof = mandoc_calloc(1, sizeof(struct of)); |
|
nof->fname = strdup(argv[i]); |
|
if (verb > 2) |
|
printf("%s: Scheduling\n", argv[i]); |
|
if (NULL == *of) { |
|
*of = nof; |
|
(*of)->first = nof; |
|
} else { |
|
nof->first = (*of)->first; |
|
(*of)->next = nof; |
|
*of = nof; |
|
} |
|
} |
|
} |
} |
|
|
/* |
|
* Recursively build up a list of files to parse. |
|
* We use this instead of ftw() and so on because I don't want global |
|
* variables hanging around. |
|
* This ignores the mandoc.db and mandoc.index files, but assumes that |
|
* everything else is a manual. |
|
* Pass in a pointer to a NULL structure for the first invocation. |
|
*/ |
|
static int |
static int |
ofile_dirbuild(const char *dir, int verb, struct of **of) |
set_basedir(const char *targetdir) |
{ |
{ |
char buf[MAXPATHLEN]; |
static char startdir[PATH_MAX]; |
size_t sz; |
static int fd; |
DIR *d; |
|
const char *fn; |
|
struct of *nof; |
|
struct dirent *dp; |
|
|
|
if (NULL == (d = opendir(dir))) { |
/* |
perror(dir); |
* Remember where we started by keeping a fd open to the origin |
return(0); |
* path component: throughout this utility, we chdir() a lot to |
} |
* handle relative paths, and by doing this, we can return to |
|
* the starting point. |
while (NULL != (dp = readdir(d))) { |
*/ |
fn = dp->d_name; |
if ('\0' == *startdir) { |
if (DT_DIR == dp->d_type) { |
if (NULL == getcwd(startdir, PATH_MAX)) { |
if (0 == strcmp(".", fn)) |
exitcode = (int)MANDOCLEVEL_SYSERR; |
continue; |
if (NULL != targetdir) |
if (0 == strcmp("..", fn)) |
say("", "&getcwd"); |
continue; |
|
|
|
buf[0] = '\0'; |
|
strlcat(buf, dir, MAXPATHLEN); |
|
strlcat(buf, "/", MAXPATHLEN); |
|
sz = strlcat(buf, fn, MAXPATHLEN); |
|
|
|
if (sz < MAXPATHLEN) { |
|
if ( ! ofile_dirbuild(buf, verb, of)) |
|
return(0); |
|
continue; |
|
} else if (sz < MAXPATHLEN) |
|
continue; |
|
|
|
fprintf(stderr, "%s: Path too long\n", dir); |
|
return(0); |
return(0); |
} |
} |
if (DT_REG != dp->d_type) |
if (-1 == (fd = open(startdir, O_RDONLY, 0))) { |
continue; |
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say("", "&open %s", startdir); |
if (0 == strcmp(MANDOC_DB, fn) || |
|
0 == strcmp(MANDOC_IDX, fn)) |
|
continue; |
|
|
|
buf[0] = '\0'; |
|
strlcat(buf, dir, MAXPATHLEN); |
|
strlcat(buf, "/", MAXPATHLEN); |
|
sz = strlcat(buf, fn, MAXPATHLEN); |
|
if (sz >= MAXPATHLEN) { |
|
fprintf(stderr, "%s: Path too long\n", dir); |
|
return(0); |
return(0); |
} |
} |
|
if (NULL == targetdir) |
nof = mandoc_calloc(1, sizeof(struct of)); |
targetdir = startdir; |
nof->fname = mandoc_strdup(buf); |
} else { |
|
if (-1 == fd) |
if (verb > 2) |
return(0); |
printf("%s: Scheduling\n", buf); |
if (-1 == fchdir(fd)) { |
|
close(fd); |
if (NULL == *of) { |
basedir[0] = '\0'; |
*of = nof; |
exitcode = (int)MANDOCLEVEL_SYSERR; |
(*of)->first = nof; |
say("", "&chdir %s", startdir); |
} else { |
return(0); |
nof->first = (*of)->first; |
|
(*of)->next = nof; |
|
*of = nof; |
|
} |
} |
|
if (NULL == targetdir) { |
|
close(fd); |
|
return(1); |
|
} |
} |
} |
|
if (NULL == realpath(targetdir, basedir)) { |
closedir(d); |
basedir[0] = '\0'; |
|
exitcode = (int)MANDOCLEVEL_BADARG; |
|
say("", "&%s: realpath", targetdir); |
|
return(0); |
|
} else if (-1 == chdir(basedir)) { |
|
exitcode = (int)MANDOCLEVEL_BADARG; |
|
say("", "&chdir"); |
|
return(0); |
|
} |
return(1); |
return(1); |
} |
} |
|
|
static void |
static void |
ofile_free(struct of *of) |
say(const char *file, const char *format, ...) |
{ |
{ |
struct of *nof; |
va_list ap; |
|
int use_errno; |
|
|
while (of) { |
if ('\0' != *basedir) |
nof = of->next; |
fprintf(stderr, "%s", basedir); |
free(of->fname); |
if ('\0' != *basedir && '\0' != *file) |
free(of); |
fputs("//", stderr); |
of = nof; |
if ('\0' != *file) |
} |
fprintf(stderr, "%s", file); |
} |
|
|
|
static void |
use_errno = 1; |
usage(void) |
if (NULL != format) { |
{ |
switch (*format) { |
|
case ('&'): |
fprintf(stderr, "usage: %s [-v] " |
format++; |
"[-d dir [files...] |" |
break; |
" -u dir [files...] |" |
case ('\0'): |
" dir...]\n", progname); |
format = NULL; |
|
break; |
|
default: |
|
use_errno = 0; |
|
break; |
|
} |
|
} |
|
if (NULL != format) { |
|
if ('\0' != *basedir || '\0' != *file) |
|
fputs(": ", stderr); |
|
va_start(ap, format); |
|
vfprintf(stderr, format, ap); |
|
va_end(ap); |
|
} |
|
if (use_errno) { |
|
if ('\0' != *basedir || '\0' != *file || NULL != format) |
|
fputs(": ", stderr); |
|
perror(NULL); |
|
} else |
|
fputc('\n', stderr); |
} |
} |