version 1.179, 2014/12/09 07:29:42 |
version 1.262, 2018/12/30 00:49:55 |
|
|
/* $Id$ */ |
/* $Id$ */ |
/* |
/* |
* Copyright (c) 2011, 2012 Kristaps Dzonsons <kristaps@bsd.lv> |
* Copyright (c) 2011, 2012 Kristaps Dzonsons <kristaps@bsd.lv> |
* Copyright (c) 2011, 2012, 2013, 2014 Ingo Schwarze <schwarze@openbsd.org> |
* Copyright (c) 2011-2018 Ingo Schwarze <schwarze@openbsd.org> |
|
* Copyright (c) 2016 Ed Maste <emaste@freebsd.org> |
* |
* |
* Permission to use, copy, modify, and distribute this software for any |
* Permission to use, copy, modify, and distribute this software for any |
* purpose with or without fee is hereby granted, provided that the above |
* purpose with or without fee is hereby granted, provided that the above |
* copyright notice and this permission notice appear in all copies. |
* copyright notice and this permission notice appear in all copies. |
* |
* |
* THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES |
* THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHORS DISCLAIM ALL WARRANTIES |
* WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF |
* WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF |
* MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR |
* MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR |
* ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES |
* ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES |
* WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN |
* WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN |
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF |
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF |
|
|
#include "config.h" |
#include "config.h" |
|
|
#include <sys/types.h> |
#include <sys/types.h> |
|
#include <sys/mman.h> |
#include <sys/stat.h> |
#include <sys/stat.h> |
#include <sys/wait.h> |
|
|
|
#include <assert.h> |
#include <assert.h> |
#include <ctype.h> |
#include <ctype.h> |
|
#if HAVE_ERR |
|
#include <err.h> |
|
#endif |
#include <errno.h> |
#include <errno.h> |
#include <fcntl.h> |
#include <fcntl.h> |
#if HAVE_FTS |
#if HAVE_FTS |
|
|
#else |
#else |
#include "compat_fts.h" |
#include "compat_fts.h" |
#endif |
#endif |
#include <getopt.h> |
|
#include <limits.h> |
#include <limits.h> |
|
#if HAVE_SANDBOX_INIT |
|
#include <sandbox.h> |
|
#endif |
|
#include <stdarg.h> |
#include <stddef.h> |
#include <stddef.h> |
#include <stdio.h> |
#include <stdio.h> |
#include <stdint.h> |
#include <stdint.h> |
|
|
#include <string.h> |
#include <string.h> |
#include <unistd.h> |
#include <unistd.h> |
|
|
#if HAVE_OHASH |
#include "mandoc_aux.h" |
#include <ohash.h> |
#include "mandoc_ohash.h" |
#else |
#include "mandoc.h" |
#include "compat_ohash.h" |
#include "roff.h" |
#endif |
|
#include <sqlite3.h> |
|
|
|
#include "mdoc.h" |
#include "mdoc.h" |
#include "man.h" |
#include "man.h" |
#include "mandoc.h" |
#include "mandoc_parse.h" |
#include "mandoc_aux.h" |
#include "manconf.h" |
#include "manpath.h" |
|
#include "mansearch.h" |
#include "mansearch.h" |
|
#include "dba_array.h" |
|
#include "dba.h" |
|
|
extern int mansearch_keymax; |
|
extern const char *const mansearch_keynames[]; |
extern const char *const mansearch_keynames[]; |
|
|
#define SQL_EXEC(_v) \ |
|
if (SQLITE_OK != sqlite3_exec(db, (_v), NULL, NULL, NULL)) \ |
|
say("", "%s: %s", (_v), sqlite3_errmsg(db)) |
|
#define SQL_BIND_TEXT(_s, _i, _v) \ |
|
if (SQLITE_OK != sqlite3_bind_text \ |
|
((_s), (_i)++, (_v), -1, SQLITE_STATIC)) \ |
|
say(mlink->file, "%s", sqlite3_errmsg(db)) |
|
#define SQL_BIND_INT(_s, _i, _v) \ |
|
if (SQLITE_OK != sqlite3_bind_int \ |
|
((_s), (_i)++, (_v))) \ |
|
say(mlink->file, "%s", sqlite3_errmsg(db)) |
|
#define SQL_BIND_INT64(_s, _i, _v) \ |
|
if (SQLITE_OK != sqlite3_bind_int64 \ |
|
((_s), (_i)++, (_v))) \ |
|
say(mlink->file, "%s", sqlite3_errmsg(db)) |
|
#define SQL_STEP(_s) \ |
|
if (SQLITE_DONE != sqlite3_step((_s))) \ |
|
say(mlink->file, "%s", sqlite3_errmsg(db)) |
|
|
|
enum op { |
enum op { |
OP_DEFAULT = 0, /* new dbs from dir list or default config */ |
OP_DEFAULT = 0, /* new dbs from dir list or default config */ |
OP_CONFFILE, /* new databases from custom config file */ |
OP_CONFFILE, /* new databases from custom config file */ |
|
|
|
|
struct mpage { |
struct mpage { |
struct inodev inodev; /* used for hashing routine */ |
struct inodev inodev; /* used for hashing routine */ |
int64_t pageid; /* pageid in mpages SQL table */ |
struct dba_array *dba; |
char *sec; /* section from file content */ |
char *sec; /* section from file content */ |
char *arch; /* architecture from file content */ |
char *arch; /* architecture from file content */ |
char *title; /* title from file content */ |
char *title; /* title from file content */ |
char *desc; /* description from file content */ |
char *desc; /* description from file content */ |
|
struct mpage *next; /* singly linked list */ |
struct mlink *mlinks; /* singly linked list */ |
struct mlink *mlinks; /* singly linked list */ |
int form; /* format from file content */ |
|
int name_head_done; |
int name_head_done; |
|
enum form form; /* format from file content */ |
}; |
}; |
|
|
struct mlink { |
struct mlink { |
|
|
char *fsec; /* section from file name suffix */ |
char *fsec; /* section from file name suffix */ |
struct mlink *next; /* singly linked list */ |
struct mlink *next; /* singly linked list */ |
struct mpage *mpage; /* parent */ |
struct mpage *mpage; /* parent */ |
int dform; /* format from directory */ |
|
int fform; /* format from file name suffix */ |
|
int gzip; /* filename has a .gz suffix */ |
int gzip; /* filename has a .gz suffix */ |
|
enum form dform; /* format from directory */ |
|
enum form fform; /* format from file name suffix */ |
}; |
}; |
|
|
enum stmt { |
typedef int (*mdoc_fp)(struct mpage *, const struct roff_meta *, |
STMT_DELETE_PAGE = 0, /* delete mpage */ |
const struct roff_node *); |
STMT_INSERT_PAGE, /* insert mpage */ |
|
STMT_INSERT_LINK, /* insert mlink */ |
|
STMT_INSERT_NAME, /* insert name */ |
|
STMT_SELECT_NAME, /* retrieve existing name flags */ |
|
STMT_INSERT_KEY, /* insert parsed key */ |
|
STMT__MAX |
|
}; |
|
|
|
typedef int (*mdoc_fp)(struct mpage *, const struct mdoc_meta *, |
|
const struct mdoc_node *); |
|
|
|
struct mdoc_handler { |
struct mdoc_handler { |
mdoc_fp fp; /* optional handler */ |
mdoc_fp fp; /* optional handler */ |
uint64_t mask; /* set unless handler returns 0 */ |
uint64_t mask; /* set unless handler returns 0 */ |
|
int taboo; /* node flags that must not be set */ |
}; |
}; |
|
|
static void dbclose(int); |
|
static void dbadd(struct mpage *); |
int mandocdb(int, char *[]); |
|
|
|
static void dbadd(struct dba *, struct mpage *); |
static void dbadd_mlink(const struct mlink *mlink); |
static void dbadd_mlink(const struct mlink *mlink); |
static void dbadd_mlink_name(const struct mlink *mlink); |
static void dbprune(struct dba *); |
static int dbopen(int); |
static void dbwrite(struct dba *); |
static void dbprune(void); |
|
static void filescan(const char *); |
static void filescan(const char *); |
static void *hash_alloc(size_t, void *); |
#if HAVE_FTS_COMPARE_CONST |
static void hash_free(void *, void *); |
static int fts_compare(const FTSENT *const *, const FTSENT *const *); |
static void *hash_calloc(size_t, size_t, void *); |
#else |
|
static int fts_compare(const FTSENT **, const FTSENT **); |
|
#endif |
static void mlink_add(struct mlink *, const struct stat *); |
static void mlink_add(struct mlink *, const struct stat *); |
static void mlink_check(struct mpage *, struct mlink *); |
static void mlink_check(struct mpage *, struct mlink *); |
static void mlink_free(struct mlink *); |
static void mlink_free(struct mlink *); |
static void mlinks_undupe(struct mpage *); |
static void mlinks_undupe(struct mpage *); |
static void mpages_free(void); |
static void mpages_free(void); |
static void mpages_merge(struct mparse *); |
static void mpages_merge(struct dba *, struct mparse *); |
static void names_check(void); |
|
static void parse_cat(struct mpage *, int); |
static void parse_cat(struct mpage *, int); |
static void parse_man(struct mpage *, const struct man_meta *, |
static void parse_man(struct mpage *, const struct roff_meta *, |
const struct man_node *); |
const struct roff_node *); |
static void parse_mdoc(struct mpage *, const struct mdoc_meta *, |
static void parse_mdoc(struct mpage *, const struct roff_meta *, |
const struct mdoc_node *); |
const struct roff_node *); |
static int parse_mdoc_body(struct mpage *, const struct mdoc_meta *, |
static int parse_mdoc_head(struct mpage *, const struct roff_meta *, |
const struct mdoc_node *); |
const struct roff_node *); |
static int parse_mdoc_head(struct mpage *, const struct mdoc_meta *, |
static int parse_mdoc_Fa(struct mpage *, const struct roff_meta *, |
const struct mdoc_node *); |
const struct roff_node *); |
static int parse_mdoc_Fd(struct mpage *, const struct mdoc_meta *, |
static int parse_mdoc_Fd(struct mpage *, const struct roff_meta *, |
const struct mdoc_node *); |
const struct roff_node *); |
static void parse_mdoc_fname(struct mpage *, const struct mdoc_node *); |
static void parse_mdoc_fname(struct mpage *, const struct roff_node *); |
static int parse_mdoc_Fn(struct mpage *, const struct mdoc_meta *, |
static int parse_mdoc_Fn(struct mpage *, const struct roff_meta *, |
const struct mdoc_node *); |
const struct roff_node *); |
static int parse_mdoc_Fo(struct mpage *, const struct mdoc_meta *, |
static int parse_mdoc_Fo(struct mpage *, const struct roff_meta *, |
const struct mdoc_node *); |
const struct roff_node *); |
static int parse_mdoc_Nd(struct mpage *, const struct mdoc_meta *, |
static int parse_mdoc_Nd(struct mpage *, const struct roff_meta *, |
const struct mdoc_node *); |
const struct roff_node *); |
static int parse_mdoc_Nm(struct mpage *, const struct mdoc_meta *, |
static int parse_mdoc_Nm(struct mpage *, const struct roff_meta *, |
const struct mdoc_node *); |
const struct roff_node *); |
static int parse_mdoc_Sh(struct mpage *, const struct mdoc_meta *, |
static int parse_mdoc_Sh(struct mpage *, const struct roff_meta *, |
const struct mdoc_node *); |
const struct roff_node *); |
static int parse_mdoc_Xr(struct mpage *, const struct mdoc_meta *, |
static int parse_mdoc_Va(struct mpage *, const struct roff_meta *, |
const struct mdoc_node *); |
const struct roff_node *); |
|
static int parse_mdoc_Xr(struct mpage *, const struct roff_meta *, |
|
const struct roff_node *); |
static void putkey(const struct mpage *, char *, uint64_t); |
static void putkey(const struct mpage *, char *, uint64_t); |
static void putkeys(const struct mpage *, char *, size_t, uint64_t); |
static void putkeys(const struct mpage *, char *, size_t, uint64_t); |
static void putmdockey(const struct mpage *, |
static void putmdockey(const struct mpage *, |
const struct mdoc_node *, uint64_t); |
const struct roff_node *, uint64_t, int); |
static int render_string(char **, size_t *); |
static int render_string(char **, size_t *); |
static void say(const char *, const char *, ...); |
static void say(const char *, const char *, ...) |
|
__attribute__((__format__ (__printf__, 2, 3))); |
static int set_basedir(const char *, int); |
static int set_basedir(const char *, int); |
static int treescan(void); |
static int treescan(void); |
static size_t utf8(unsigned int, char [7]); |
static size_t utf8(unsigned int, char [7]); |
|
|
static char tempfilename[32]; |
|
static char *progname; |
|
static int nodb; /* no database changes */ |
static int nodb; /* no database changes */ |
static int mparse_options; /* abort the parse early */ |
static int mparse_options; /* abort the parse early */ |
static int use_all; /* use all found files */ |
static int use_all; /* use all found files */ |
Line 199 static int write_utf8; /* write UTF-8 output; else A |
|
Line 179 static int write_utf8; /* write UTF-8 output; else A |
|
static int exitcode; /* to be returned by main */ |
static int exitcode; /* to be returned by main */ |
static enum op op; /* operational mode */ |
static enum op op; /* operational mode */ |
static char basedir[PATH_MAX]; /* current base directory */ |
static char basedir[PATH_MAX]; /* current base directory */ |
static struct mchars *mchars; /* table of named characters */ |
static struct mpage *mpage_head; /* list of distinct manual pages */ |
static struct ohash mpages; /* table of distinct manual pages */ |
static struct ohash mpages; /* table of distinct manual pages */ |
static struct ohash mlinks; /* table of directory entries */ |
static struct ohash mlinks; /* table of directory entries */ |
static struct ohash names; /* table of all names */ |
static struct ohash names; /* table of all names */ |
static struct ohash strings; /* table of all strings */ |
static struct ohash strings; /* table of all strings */ |
static sqlite3 *db = NULL; /* current database */ |
|
static sqlite3_stmt *stmts[STMT__MAX]; /* current statements */ |
|
static uint64_t name_mask; |
static uint64_t name_mask; |
|
|
static const struct mdoc_handler mdocs[MDOC_MAX] = { |
static const struct mdoc_handler mdoc_handlers[MDOC_MAX - MDOC_Dd] = { |
{ NULL, 0 }, /* Ap */ |
{ NULL, 0, NODE_NOPRT }, /* Dd */ |
{ NULL, 0 }, /* Dd */ |
{ NULL, 0, NODE_NOPRT }, /* Dt */ |
{ NULL, 0 }, /* Dt */ |
{ NULL, 0, NODE_NOPRT }, /* Os */ |
{ NULL, 0 }, /* Os */ |
{ parse_mdoc_Sh, TYPE_Sh, 0 }, /* Sh */ |
{ parse_mdoc_Sh, TYPE_Sh }, /* Sh */ |
{ parse_mdoc_head, TYPE_Ss, 0 }, /* Ss */ |
{ parse_mdoc_head, TYPE_Ss }, /* Ss */ |
{ NULL, 0, 0 }, /* Pp */ |
{ NULL, 0 }, /* Pp */ |
{ NULL, 0, 0 }, /* D1 */ |
{ NULL, 0 }, /* D1 */ |
{ NULL, 0, 0 }, /* Dl */ |
{ NULL, 0 }, /* Dl */ |
{ NULL, 0, 0 }, /* Bd */ |
{ NULL, 0 }, /* Bd */ |
{ NULL, 0, 0 }, /* Ed */ |
{ NULL, 0 }, /* Ed */ |
{ NULL, 0, 0 }, /* Bl */ |
{ NULL, 0 }, /* Bl */ |
{ NULL, 0, 0 }, /* El */ |
{ NULL, 0 }, /* El */ |
{ NULL, 0, 0 }, /* It */ |
{ NULL, 0 }, /* It */ |
{ NULL, 0, 0 }, /* Ad */ |
{ NULL, 0 }, /* Ad */ |
{ NULL, TYPE_An, 0 }, /* An */ |
{ NULL, TYPE_An }, /* An */ |
{ NULL, 0, 0 }, /* Ap */ |
{ NULL, TYPE_Ar }, /* Ar */ |
{ NULL, TYPE_Ar, 0 }, /* Ar */ |
{ NULL, TYPE_Cd }, /* Cd */ |
{ NULL, TYPE_Cd, 0 }, /* Cd */ |
{ NULL, TYPE_Cm }, /* Cm */ |
{ NULL, TYPE_Cm, 0 }, /* Cm */ |
{ NULL, TYPE_Dv }, /* Dv */ |
{ NULL, TYPE_Dv, 0 }, /* Dv */ |
{ NULL, TYPE_Er }, /* Er */ |
{ NULL, TYPE_Er, 0 }, /* Er */ |
{ NULL, TYPE_Ev }, /* Ev */ |
{ NULL, TYPE_Ev, 0 }, /* Ev */ |
{ NULL, 0 }, /* Ex */ |
{ NULL, 0, 0 }, /* Ex */ |
{ NULL, TYPE_Fa }, /* Fa */ |
{ parse_mdoc_Fa, 0, 0 }, /* Fa */ |
{ parse_mdoc_Fd, 0 }, /* Fd */ |
{ parse_mdoc_Fd, 0, 0 }, /* Fd */ |
{ NULL, TYPE_Fl }, /* Fl */ |
{ NULL, TYPE_Fl, 0 }, /* Fl */ |
{ parse_mdoc_Fn, 0 }, /* Fn */ |
{ parse_mdoc_Fn, 0, 0 }, /* Fn */ |
{ NULL, TYPE_Ft }, /* Ft */ |
{ NULL, TYPE_Ft | TYPE_Vt, 0 }, /* Ft */ |
{ NULL, TYPE_Ic }, /* Ic */ |
{ NULL, TYPE_Ic, 0 }, /* Ic */ |
{ NULL, TYPE_In }, /* In */ |
{ NULL, TYPE_In, 0 }, /* In */ |
{ NULL, TYPE_Li }, /* Li */ |
{ NULL, TYPE_Li, 0 }, /* Li */ |
{ parse_mdoc_Nd, 0 }, /* Nd */ |
{ parse_mdoc_Nd, 0, 0 }, /* Nd */ |
{ parse_mdoc_Nm, 0 }, /* Nm */ |
{ parse_mdoc_Nm, 0, 0 }, /* Nm */ |
{ NULL, 0 }, /* Op */ |
{ NULL, 0, 0 }, /* Op */ |
{ NULL, 0 }, /* Ot */ |
{ NULL, 0, 0 }, /* Ot */ |
{ NULL, TYPE_Pa }, /* Pa */ |
{ NULL, TYPE_Pa, NODE_NOSRC }, /* Pa */ |
{ NULL, 0 }, /* Rv */ |
{ NULL, 0, 0 }, /* Rv */ |
{ NULL, TYPE_St }, /* St */ |
{ NULL, TYPE_St, 0 }, /* St */ |
{ NULL, TYPE_Va }, /* Va */ |
{ parse_mdoc_Va, TYPE_Va, 0 }, /* Va */ |
{ parse_mdoc_body, TYPE_Va }, /* Vt */ |
{ parse_mdoc_Va, TYPE_Vt, 0 }, /* Vt */ |
{ parse_mdoc_Xr, 0 }, /* Xr */ |
{ parse_mdoc_Xr, 0, 0 }, /* Xr */ |
{ NULL, 0 }, /* %A */ |
{ NULL, 0, 0 }, /* %A */ |
{ NULL, 0 }, /* %B */ |
{ NULL, 0, 0 }, /* %B */ |
{ NULL, 0 }, /* %D */ |
{ NULL, 0, 0 }, /* %D */ |
{ NULL, 0 }, /* %I */ |
{ NULL, 0, 0 }, /* %I */ |
{ NULL, 0 }, /* %J */ |
{ NULL, 0, 0 }, /* %J */ |
{ NULL, 0 }, /* %N */ |
{ NULL, 0, 0 }, /* %N */ |
{ NULL, 0 }, /* %O */ |
{ NULL, 0, 0 }, /* %O */ |
{ NULL, 0 }, /* %P */ |
{ NULL, 0, 0 }, /* %P */ |
{ NULL, 0 }, /* %R */ |
{ NULL, 0, 0 }, /* %R */ |
{ NULL, 0 }, /* %T */ |
{ NULL, 0, 0 }, /* %T */ |
{ NULL, 0 }, /* %V */ |
{ NULL, 0, 0 }, /* %V */ |
{ NULL, 0 }, /* Ac */ |
{ NULL, 0, 0 }, /* Ac */ |
{ NULL, 0 }, /* Ao */ |
{ NULL, 0, 0 }, /* Ao */ |
{ NULL, 0 }, /* Aq */ |
{ NULL, 0, 0 }, /* Aq */ |
{ NULL, TYPE_At }, /* At */ |
{ NULL, TYPE_At, 0 }, /* At */ |
{ NULL, 0 }, /* Bc */ |
{ NULL, 0, 0 }, /* Bc */ |
{ NULL, 0 }, /* Bf */ |
{ NULL, 0, 0 }, /* Bf */ |
{ NULL, 0 }, /* Bo */ |
{ NULL, 0, 0 }, /* Bo */ |
{ NULL, 0 }, /* Bq */ |
{ NULL, 0, 0 }, /* Bq */ |
{ NULL, TYPE_Bsx }, /* Bsx */ |
{ NULL, TYPE_Bsx, NODE_NOSRC }, /* Bsx */ |
{ NULL, TYPE_Bx }, /* Bx */ |
{ NULL, TYPE_Bx, NODE_NOSRC }, /* Bx */ |
{ NULL, 0 }, /* Db */ |
{ NULL, 0, 0 }, /* Db */ |
{ NULL, 0 }, /* Dc */ |
{ NULL, 0, 0 }, /* Dc */ |
{ NULL, 0 }, /* Do */ |
{ NULL, 0, 0 }, /* Do */ |
{ NULL, 0 }, /* Dq */ |
{ NULL, 0, 0 }, /* Dq */ |
{ NULL, 0 }, /* Ec */ |
{ NULL, 0, 0 }, /* Ec */ |
{ NULL, 0 }, /* Ef */ |
{ NULL, 0, 0 }, /* Ef */ |
{ NULL, TYPE_Em }, /* Em */ |
{ NULL, TYPE_Em, 0 }, /* Em */ |
{ NULL, 0 }, /* Eo */ |
{ NULL, 0, 0 }, /* Eo */ |
{ NULL, TYPE_Fx }, /* Fx */ |
{ NULL, TYPE_Fx, NODE_NOSRC }, /* Fx */ |
{ NULL, TYPE_Ms }, /* Ms */ |
{ NULL, TYPE_Ms, 0 }, /* Ms */ |
{ NULL, 0 }, /* No */ |
{ NULL, 0, 0 }, /* No */ |
{ NULL, 0 }, /* Ns */ |
{ NULL, 0, 0 }, /* Ns */ |
{ NULL, TYPE_Nx }, /* Nx */ |
{ NULL, TYPE_Nx, NODE_NOSRC }, /* Nx */ |
{ NULL, TYPE_Ox }, /* Ox */ |
{ NULL, TYPE_Ox, NODE_NOSRC }, /* Ox */ |
{ NULL, 0 }, /* Pc */ |
{ NULL, 0, 0 }, /* Pc */ |
{ NULL, 0 }, /* Pf */ |
{ NULL, 0, 0 }, /* Pf */ |
{ NULL, 0 }, /* Po */ |
{ NULL, 0, 0 }, /* Po */ |
{ NULL, 0 }, /* Pq */ |
{ NULL, 0, 0 }, /* Pq */ |
{ NULL, 0 }, /* Qc */ |
{ NULL, 0, 0 }, /* Qc */ |
{ NULL, 0 }, /* Ql */ |
{ NULL, 0, 0 }, /* Ql */ |
{ NULL, 0 }, /* Qo */ |
{ NULL, 0, 0 }, /* Qo */ |
{ NULL, 0 }, /* Qq */ |
{ NULL, 0, 0 }, /* Qq */ |
{ NULL, 0 }, /* Re */ |
{ NULL, 0, 0 }, /* Re */ |
{ NULL, 0 }, /* Rs */ |
{ NULL, 0, 0 }, /* Rs */ |
{ NULL, 0 }, /* Sc */ |
{ NULL, 0, 0 }, /* Sc */ |
{ NULL, 0 }, /* So */ |
{ NULL, 0, 0 }, /* So */ |
{ NULL, 0 }, /* Sq */ |
{ NULL, 0, 0 }, /* Sq */ |
{ NULL, 0 }, /* Sm */ |
{ NULL, 0, 0 }, /* Sm */ |
{ NULL, 0 }, /* Sx */ |
{ NULL, 0, 0 }, /* Sx */ |
{ NULL, TYPE_Sy }, /* Sy */ |
{ NULL, TYPE_Sy, 0 }, /* Sy */ |
{ NULL, TYPE_Tn }, /* Tn */ |
{ NULL, TYPE_Tn, 0 }, /* Tn */ |
{ NULL, 0 }, /* Ux */ |
{ NULL, 0, NODE_NOSRC }, /* Ux */ |
{ NULL, 0 }, /* Xc */ |
{ NULL, 0, 0 }, /* Xc */ |
{ NULL, 0 }, /* Xo */ |
{ NULL, 0, 0 }, /* Xo */ |
{ parse_mdoc_Fo, 0 }, /* Fo */ |
{ parse_mdoc_Fo, 0, 0 }, /* Fo */ |
{ NULL, 0 }, /* Fc */ |
{ NULL, 0, 0 }, /* Fc */ |
{ NULL, 0 }, /* Oo */ |
{ NULL, 0, 0 }, /* Oo */ |
{ NULL, 0 }, /* Oc */ |
{ NULL, 0, 0 }, /* Oc */ |
{ NULL, 0 }, /* Bk */ |
{ NULL, 0, 0 }, /* Bk */ |
{ NULL, 0 }, /* Ek */ |
{ NULL, 0, 0 }, /* Ek */ |
{ NULL, 0 }, /* Bt */ |
{ NULL, 0, 0 }, /* Bt */ |
{ NULL, 0 }, /* Hf */ |
{ NULL, 0, 0 }, /* Hf */ |
{ NULL, 0 }, /* Fr */ |
{ NULL, 0, 0 }, /* Fr */ |
{ NULL, 0 }, /* Ud */ |
{ NULL, 0, 0 }, /* Ud */ |
{ NULL, TYPE_Lb }, /* Lb */ |
{ NULL, TYPE_Lb, NODE_NOSRC }, /* Lb */ |
{ NULL, 0 }, /* Lp */ |
{ NULL, 0, 0 }, /* Lp */ |
{ NULL, TYPE_Lk }, /* Lk */ |
{ NULL, TYPE_Lk, 0 }, /* Lk */ |
{ NULL, TYPE_Mt }, /* Mt */ |
{ NULL, TYPE_Mt, NODE_NOSRC }, /* Mt */ |
{ NULL, 0 }, /* Brq */ |
{ NULL, 0, 0 }, /* Brq */ |
{ NULL, 0 }, /* Bro */ |
{ NULL, 0, 0 }, /* Bro */ |
{ NULL, 0 }, /* Brc */ |
{ NULL, 0, 0 }, /* Brc */ |
{ NULL, 0 }, /* %C */ |
{ NULL, 0, 0 }, /* %C */ |
{ NULL, 0 }, /* Es */ |
{ NULL, 0, 0 }, /* Es */ |
{ NULL, 0 }, /* En */ |
{ NULL, 0, 0 }, /* En */ |
{ NULL, TYPE_Dx }, /* Dx */ |
{ NULL, TYPE_Dx, NODE_NOSRC }, /* Dx */ |
{ NULL, 0 }, /* %Q */ |
{ NULL, 0, 0 }, /* %Q */ |
{ NULL, 0 }, /* br */ |
{ NULL, 0, 0 }, /* %U */ |
{ NULL, 0 }, /* sp */ |
{ NULL, 0, 0 }, /* Ta */ |
{ NULL, 0 }, /* %U */ |
|
{ NULL, 0 }, /* Ta */ |
|
{ NULL, 0 }, /* ll */ |
|
}; |
}; |
|
|
|
|
int |
int |
mandocdb(int argc, char *argv[]) |
mandocdb(int argc, char *argv[]) |
{ |
{ |
int ch, i; |
struct manconf conf; |
size_t j, sz; |
|
const char *path_arg; |
|
struct manpaths dirs; |
|
struct mparse *mp; |
struct mparse *mp; |
struct ohash_info mpages_info, mlinks_info; |
struct dba *dba; |
|
const char *path_arg, *progname; |
|
size_t j, sz; |
|
int ch, i; |
|
|
memset(stmts, 0, STMT__MAX * sizeof(sqlite3_stmt *)); |
#if HAVE_PLEDGE |
memset(&dirs, 0, sizeof(struct manpaths)); |
if (pledge("stdio rpath wpath cpath", NULL) == -1) { |
|
warn("pledge"); |
|
return (int)MANDOCLEVEL_SYSERR; |
|
} |
|
#endif |
|
|
mpages_info.alloc = mlinks_info.alloc = hash_alloc; |
#if HAVE_SANDBOX_INIT |
mpages_info.calloc = mlinks_info.calloc = hash_calloc; |
if (sandbox_init(kSBXProfileNoInternet, SANDBOX_NAMED, NULL) == -1) { |
mpages_info.free = mlinks_info.free = hash_free; |
warnx("sandbox_init"); |
|
return (int)MANDOCLEVEL_SYSERR; |
|
} |
|
#endif |
|
|
mpages_info.key_offset = offsetof(struct mpage, inodev); |
memset(&conf, 0, sizeof(conf)); |
mlinks_info.key_offset = offsetof(struct mlink, file); |
|
|
|
progname = strrchr(argv[0], '/'); |
|
if (progname == NULL) |
|
progname = argv[0]; |
|
else |
|
++progname; |
|
|
|
/* |
/* |
* We accept a few different invocations. |
* We accept a few different invocations. |
* The CHECKOP macro makes sure that invocation styles don't |
* The CHECKOP macro makes sure that invocation styles don't |
Line 368 mandocdb(int argc, char *argv[]) |
|
Line 343 mandocdb(int argc, char *argv[]) |
|
*/ |
*/ |
#define CHECKOP(_op, _ch) do \ |
#define CHECKOP(_op, _ch) do \ |
if (OP_DEFAULT != (_op)) { \ |
if (OP_DEFAULT != (_op)) { \ |
fprintf(stderr, "%s: -%c: Conflicting option\n", \ |
warnx("-%c: Conflicting option", (_ch)); \ |
progname, (_ch)); \ |
|
goto usage; \ |
goto usage; \ |
} while (/*CONSTCOND*/0) |
} while (/*CONSTCOND*/0) |
|
|
|
mparse_options = MPARSE_VALIDATE; |
path_arg = NULL; |
path_arg = NULL; |
op = OP_DEFAULT; |
op = OP_DEFAULT; |
|
|
Line 405 mandocdb(int argc, char *argv[]) |
|
Line 380 mandocdb(int argc, char *argv[]) |
|
break; |
break; |
case 'T': |
case 'T': |
if (strcmp(optarg, "utf8")) { |
if (strcmp(optarg, "utf8")) { |
fprintf(stderr, "%s: -T%s: " |
warnx("-T%s: Unsupported output format", |
"Unsupported output format\n", |
optarg); |
progname, optarg); |
|
goto usage; |
goto usage; |
} |
} |
write_utf8 = 1; |
write_utf8 = 1; |
Line 433 mandocdb(int argc, char *argv[]) |
|
Line 407 mandocdb(int argc, char *argv[]) |
|
argc -= optind; |
argc -= optind; |
argv += optind; |
argv += optind; |
|
|
|
#if HAVE_PLEDGE |
|
if (nodb) { |
|
if (pledge("stdio rpath", NULL) == -1) { |
|
warn("pledge"); |
|
return (int)MANDOCLEVEL_SYSERR; |
|
} |
|
} |
|
#endif |
|
|
if (OP_CONFFILE == op && argc > 0) { |
if (OP_CONFFILE == op && argc > 0) { |
fprintf(stderr, "%s: -C: Too many arguments\n", |
warnx("-C: Too many arguments"); |
progname); |
|
goto usage; |
goto usage; |
} |
} |
|
|
exitcode = (int)MANDOCLEVEL_OK; |
exitcode = (int)MANDOCLEVEL_OK; |
mchars = mchars_alloc(); |
mchars_alloc(); |
mp = mparse_alloc(mparse_options, MANDOCLEVEL_FATAL, NULL, |
mp = mparse_alloc(mparse_options, MANDOC_OS_OTHER, NULL); |
mchars, NULL); |
mandoc_ohash_init(&mpages, 6, offsetof(struct mpage, inodev)); |
ohash_init(&mpages, 6, &mpages_info); |
mandoc_ohash_init(&mlinks, 6, offsetof(struct mlink, file)); |
ohash_init(&mlinks, 6, &mlinks_info); |
|
|
|
if (OP_UPDATE == op || OP_DELETE == op || OP_TEST == op) { |
if (OP_UPDATE == op || OP_DELETE == op || OP_TEST == op) { |
|
|
Line 455 mandocdb(int argc, char *argv[]) |
|
Line 436 mandocdb(int argc, char *argv[]) |
|
if (OP_TEST != op && 0 == set_basedir(path_arg, 1)) |
if (OP_TEST != op && 0 == set_basedir(path_arg, 1)) |
goto out; |
goto out; |
|
|
if (dbopen(1)) { |
dba = nodb ? dba_new(128) : dba_read(MANDOC_DB); |
|
if (dba != NULL) { |
/* |
/* |
* The existing database is usable. Process |
* The existing database is usable. Process |
* all files specified on the command-line. |
* all files specified on the command-line. |
Line 463 mandocdb(int argc, char *argv[]) |
|
Line 445 mandocdb(int argc, char *argv[]) |
|
use_all = 1; |
use_all = 1; |
for (i = 0; i < argc; i++) |
for (i = 0; i < argc; i++) |
filescan(argv[i]); |
filescan(argv[i]); |
if (OP_TEST != op) |
if (nodb == 0) |
dbprune(); |
dbprune(dba); |
} else { |
} else { |
/* |
/* Database missing or corrupt. */ |
* Database missing or corrupt. |
if (op != OP_UPDATE || errno != ENOENT) |
* Recreate from scratch. |
say(MANDOC_DB, "%s: Automatically recreating" |
*/ |
" from scratch", strerror(errno)); |
exitcode = (int)MANDOCLEVEL_OK; |
exitcode = (int)MANDOCLEVEL_OK; |
op = OP_DEFAULT; |
op = OP_DEFAULT; |
if (0 == treescan()) |
if (0 == treescan()) |
goto out; |
goto out; |
if (0 == dbopen(0)) |
dba = dba_new(128); |
goto out; |
|
} |
} |
if (OP_DELETE != op) |
if (OP_DELETE != op) |
mpages_merge(mp); |
mpages_merge(dba, mp); |
dbclose(OP_DEFAULT == op ? 0 : 1); |
if (nodb == 0) |
|
dbwrite(dba); |
|
dba_free(dba); |
} else { |
} else { |
/* |
/* |
* If we have arguments, use them as our manpaths. |
* If we have arguments, use them as our manpaths. |
* If we don't, grok from manpath(1) or however else |
* If we don't, use man.conf(5). |
* manpath_parse() wants to do it. |
|
*/ |
*/ |
if (argc > 0) { |
if (argc > 0) { |
dirs.paths = mandoc_reallocarray(NULL, |
conf.manpath.paths = mandoc_reallocarray(NULL, |
argc, sizeof(char *)); |
argc, sizeof(char *)); |
dirs.sz = (size_t)argc; |
conf.manpath.sz = (size_t)argc; |
for (i = 0; i < argc; i++) |
for (i = 0; i < argc; i++) |
dirs.paths[i] = mandoc_strdup(argv[i]); |
conf.manpath.paths[i] = mandoc_strdup(argv[i]); |
} else |
} else |
manpath_parse(&dirs, path_arg, NULL, NULL); |
manconf_parse(&conf, path_arg, NULL, NULL); |
|
|
if (0 == dirs.sz) { |
if (conf.manpath.sz == 0) { |
exitcode = (int)MANDOCLEVEL_BADARG; |
exitcode = (int)MANDOCLEVEL_BADARG; |
say("", "Empty manpath"); |
say("", "Empty manpath"); |
} |
} |
Line 506 mandocdb(int argc, char *argv[]) |
|
Line 488 mandocdb(int argc, char *argv[]) |
|
* Ignore zero-length directories and strip trailing |
* Ignore zero-length directories and strip trailing |
* slashes. |
* slashes. |
*/ |
*/ |
for (j = 0; j < dirs.sz; j++) { |
for (j = 0; j < conf.manpath.sz; j++) { |
sz = strlen(dirs.paths[j]); |
sz = strlen(conf.manpath.paths[j]); |
if (sz && '/' == dirs.paths[j][sz - 1]) |
if (sz && conf.manpath.paths[j][sz - 1] == '/') |
dirs.paths[j][--sz] = '\0'; |
conf.manpath.paths[j][--sz] = '\0'; |
if (0 == sz) |
if (0 == sz) |
continue; |
continue; |
|
|
if (j) { |
if (j) { |
ohash_init(&mpages, 6, &mpages_info); |
mandoc_ohash_init(&mpages, 6, |
ohash_init(&mlinks, 6, &mlinks_info); |
offsetof(struct mpage, inodev)); |
|
mandoc_ohash_init(&mlinks, 6, |
|
offsetof(struct mlink, file)); |
} |
} |
|
|
if (0 == set_basedir(dirs.paths[j], argc > 0)) |
if ( ! set_basedir(conf.manpath.paths[j], argc > 0)) |
continue; |
continue; |
if (0 == treescan()) |
if (0 == treescan()) |
continue; |
continue; |
if (0 == dbopen(0)) |
dba = dba_new(128); |
continue; |
mpages_merge(dba, mp); |
|
if (nodb == 0) |
|
dbwrite(dba); |
|
dba_free(dba); |
|
|
mpages_merge(mp); |
if (j + 1 < conf.manpath.sz) { |
if (warnings && !nodb && |
|
! (MPARSE_QUICK & mparse_options)) |
|
names_check(); |
|
dbclose(0); |
|
|
|
if (j + 1 < dirs.sz) { |
|
mpages_free(); |
mpages_free(); |
ohash_delete(&mpages); |
ohash_delete(&mpages); |
ohash_delete(&mlinks); |
ohash_delete(&mlinks); |
Line 539 mandocdb(int argc, char *argv[]) |
|
Line 520 mandocdb(int argc, char *argv[]) |
|
} |
} |
} |
} |
out: |
out: |
manpath_free(&dirs); |
manconf_free(&conf); |
mparse_free(mp); |
mparse_free(mp); |
mchars_free(mchars); |
mchars_free(); |
mpages_free(); |
mpages_free(); |
ohash_delete(&mpages); |
ohash_delete(&mpages); |
ohash_delete(&mlinks); |
ohash_delete(&mlinks); |
return(exitcode); |
return exitcode; |
usage: |
usage: |
|
progname = getprogname(); |
fprintf(stderr, "usage: %s [-aDnpQ] [-C file] [-Tutf8]\n" |
fprintf(stderr, "usage: %s [-aDnpQ] [-C file] [-Tutf8]\n" |
" %s [-aDnpQ] [-Tutf8] dir ...\n" |
" %s [-aDnpQ] [-Tutf8] dir ...\n" |
" %s [-DnpQ] [-Tutf8] -d dir [file ...]\n" |
" %s [-DnpQ] [-Tutf8] -d dir [file ...]\n" |
" %s [-Dnp] -u dir [file ...]\n" |
" %s [-Dnp] -u dir [file ...]\n" |
" %s [-Q] -t file ...\n", |
" %s [-Q] -t file ...\n", |
progname, progname, progname, |
progname, progname, progname, progname, progname); |
progname, progname); |
|
|
|
return((int)MANDOCLEVEL_BADARG); |
return (int)MANDOCLEVEL_BADARG; |
} |
} |
|
|
/* |
/* |
|
* To get a singly linked list in alpha order while inserting entries |
|
* at the beginning, process directory entries in reverse alpha order. |
|
*/ |
|
static int |
|
#if HAVE_FTS_COMPARE_CONST |
|
fts_compare(const FTSENT *const *a, const FTSENT *const *b) |
|
#else |
|
fts_compare(const FTSENT **a, const FTSENT **b) |
|
#endif |
|
{ |
|
return -strcmp((*a)->fts_name, (*b)->fts_name); |
|
} |
|
|
|
/* |
* Scan a directory tree rooted at "basedir" for manpages. |
* Scan a directory tree rooted at "basedir" for manpages. |
* We use fts(), scanning directory parts along the way for clues to our |
* We use fts(), scanning directory parts along the way for clues to our |
* section and architecture. |
* section and architecture. |
|
|
* or |
* or |
* [./]cat<section>[/<arch>]/<name>.0 |
* [./]cat<section>[/<arch>]/<name>.0 |
* |
* |
* TODO: accomodate for multi-language directories. |
* TODO: accommodate for multi-language directories. |
*/ |
*/ |
static int |
static int |
treescan(void) |
treescan(void) |
|
|
FTS *f; |
FTS *f; |
FTSENT *ff; |
FTSENT *ff; |
struct mlink *mlink; |
struct mlink *mlink; |
int dform, gzip; |
int gzip; |
|
enum form dform; |
char *dsec, *arch, *fsec, *cp; |
char *dsec, *arch, *fsec, *cp; |
const char *path; |
const char *path; |
const char *argv[2]; |
const char *argv[2]; |
|
|
argv[0] = "."; |
argv[0] = "."; |
argv[1] = (char *)NULL; |
argv[1] = NULL; |
|
|
f = fts_open((char * const *)argv, |
f = fts_open((char * const *)argv, FTS_PHYSICAL | FTS_NOCHDIR, |
FTS_PHYSICAL | FTS_NOCHDIR, NULL); |
fts_compare); |
if (NULL == f) { |
if (f == NULL) { |
exitcode = (int)MANDOCLEVEL_SYSERR; |
exitcode = (int)MANDOCLEVEL_SYSERR; |
say("", "&fts_open"); |
say("", "&fts_open"); |
return(0); |
return 0; |
} |
} |
|
|
dsec = arch = NULL; |
dsec = arch = NULL; |
dform = FORM_NONE; |
dform = FORM_NONE; |
|
|
while (NULL != (ff = fts_read(f))) { |
while ((ff = fts_read(f)) != NULL) { |
path = ff->fts_path + 2; |
path = ff->fts_path + 2; |
switch (ff->fts_info) { |
switch (ff->fts_info) { |
|
|
|
|
* then get handled just like regular files. |
* then get handled just like regular files. |
*/ |
*/ |
case FTS_SL: |
case FTS_SL: |
if (NULL == realpath(path, buf)) { |
if (realpath(path, buf) == NULL) { |
if (warnings) |
if (warnings) |
say(path, "&realpath"); |
say(path, "&realpath"); |
continue; |
continue; |
} |
} |
if (strstr(buf, basedir) != buf) { |
if (strstr(buf, basedir) != buf |
|
#ifdef HOMEBREWDIR |
|
&& strstr(buf, HOMEBREWDIR) != buf |
|
#endif |
|
) { |
if (warnings) say("", |
if (warnings) say("", |
"%s: outside base directory", buf); |
"%s: outside base directory", buf); |
continue; |
continue; |
} |
} |
/* Use logical inode to avoid mpages dupe. */ |
/* Use logical inode to avoid mpages dupe. */ |
if (-1 == stat(path, ff->fts_statp)) { |
if (stat(path, ff->fts_statp) == -1) { |
if (warnings) |
if (warnings) |
say(path, "&stat"); |
say(path, "&stat"); |
continue; |
continue; |
|
|
* stored directory data and handling the filename. |
* stored directory data and handling the filename. |
*/ |
*/ |
case FTS_F: |
case FTS_F: |
if (0 == strcmp(path, MANDOC_DB)) |
if ( ! strcmp(path, MANDOC_DB)) |
continue; |
continue; |
if ( ! use_all && ff->fts_level < 2) { |
if ( ! use_all && ff->fts_level < 2) { |
if (warnings) |
if (warnings) |
|
|
} |
} |
gzip = 0; |
gzip = 0; |
fsec = NULL; |
fsec = NULL; |
while (NULL == fsec) { |
while (fsec == NULL) { |
fsec = strrchr(ff->fts_name, '.'); |
fsec = strrchr(ff->fts_name, '.'); |
if (NULL == fsec || strcmp(fsec+1, "gz")) |
if (fsec == NULL || strcmp(fsec+1, "gz")) |
break; |
break; |
gzip = 1; |
gzip = 1; |
*fsec = '\0'; |
*fsec = '\0'; |
fsec = NULL; |
fsec = NULL; |
} |
} |
if (NULL == fsec) { |
if (fsec == NULL) { |
if ( ! use_all) { |
if ( ! use_all) { |
if (warnings) |
if (warnings) |
say(path, |
say(path, |
"No filename suffix"); |
"No filename suffix"); |
continue; |
continue; |
} |
} |
} else if (0 == strcmp(++fsec, "html")) { |
} else if ( ! strcmp(++fsec, "html")) { |
if (warnings) |
if (warnings) |
say(path, "Skip html"); |
say(path, "Skip html"); |
continue; |
continue; |
} else if (0 == strcmp(fsec, "ps")) { |
} else if ( ! strcmp(fsec, "ps")) { |
if (warnings) |
if (warnings) |
say(path, "Skip ps"); |
say(path, "Skip ps"); |
continue; |
continue; |
} else if (0 == strcmp(fsec, "pdf")) { |
} else if ( ! strcmp(fsec, "pdf")) { |
if (warnings) |
if (warnings) |
say(path, "Skip pdf"); |
say(path, "Skip pdf"); |
continue; |
continue; |
} else if ( ! use_all && |
} else if ( ! use_all && |
((FORM_SRC == dform && strcmp(fsec, dsec)) || |
((dform == FORM_SRC && |
(FORM_CAT == dform && strcmp(fsec, "0")))) { |
strncmp(fsec, dsec, strlen(dsec))) || |
|
(dform == FORM_CAT && strcmp(fsec, "0")))) { |
if (warnings) |
if (warnings) |
say(path, "Wrong filename suffix"); |
say(path, "Wrong filename suffix"); |
continue; |
continue; |
|
|
continue; |
continue; |
|
|
case FTS_D: |
case FTS_D: |
/* FALLTHROUGH */ |
|
case FTS_DP: |
case FTS_DP: |
break; |
break; |
|
|
|
|
* If we're not in use_all, enforce it. |
* If we're not in use_all, enforce it. |
*/ |
*/ |
cp = ff->fts_name; |
cp = ff->fts_name; |
if (FTS_DP == ff->fts_info) |
if (ff->fts_info == FTS_DP) { |
|
dform = FORM_NONE; |
|
dsec = NULL; |
break; |
break; |
|
} |
|
|
if (0 == strncmp(cp, "man", 3)) { |
if ( ! strncmp(cp, "man", 3)) { |
dform = FORM_SRC; |
dform = FORM_SRC; |
dsec = cp + 3; |
dsec = cp + 3; |
} else if (0 == strncmp(cp, "cat", 3)) { |
} else if ( ! strncmp(cp, "cat", 3)) { |
dform = FORM_CAT; |
dform = FORM_CAT; |
dsec = cp + 3; |
dsec = cp + 3; |
} else { |
} else { |
|
|
dsec = NULL; |
dsec = NULL; |
} |
} |
|
|
if (NULL != dsec || use_all) |
if (dsec != NULL || use_all) |
break; |
break; |
|
|
if (warnings) |
if (warnings) |
|
|
* Possibly our architecture. |
* Possibly our architecture. |
* If we're descending, keep tabs on it. |
* If we're descending, keep tabs on it. |
*/ |
*/ |
if (FTS_DP != ff->fts_info && NULL != dsec) |
if (ff->fts_info != FTS_DP && dsec != NULL) |
arch = ff->fts_name; |
arch = ff->fts_name; |
else |
else |
arch = NULL; |
arch = NULL; |
break; |
break; |
default: |
default: |
if (FTS_DP == ff->fts_info || use_all) |
if (ff->fts_info == FTS_DP || use_all) |
break; |
break; |
if (warnings) |
if (warnings) |
say(path, "Extraneous directory part"); |
say(path, "Extraneous directory part"); |
|
|
} |
} |
|
|
fts_close(f); |
fts_close(f); |
return(1); |
return 1; |
} |
} |
|
|
/* |
/* |
Line 817 filescan(const char *file) |
|
Line 820 filescan(const char *file) |
|
start = buf; |
start = buf; |
else if (strstr(buf, basedir) == buf) |
else if (strstr(buf, basedir) == buf) |
start = buf + strlen(basedir); |
start = buf + strlen(basedir); |
|
#ifdef HOMEBREWDIR |
|
else if (strstr(buf, HOMEBREWDIR) == buf) |
|
start = buf; |
|
#endif |
else { |
else { |
exitcode = (int)MANDOCLEVEL_BADARG; |
exitcode = (int)MANDOCLEVEL_BADARG; |
say("", "%s: outside base directory", buf); |
say("", "%s: outside base directory", buf); |
Line 852 filescan(const char *file) |
|
Line 859 filescan(const char *file) |
|
if (strlcpy(mlink->file, start, sizeof(mlink->file)) >= |
if (strlcpy(mlink->file, start, sizeof(mlink->file)) >= |
sizeof(mlink->file)) { |
sizeof(mlink->file)) { |
say(start, "Filename too long"); |
say(start, "Filename too long"); |
|
free(mlink); |
return; |
return; |
} |
} |
|
|
/* |
/* |
|
* In test mode or when the original name is absolute |
|
* but outside our tree, guess the base directory. |
|
*/ |
|
|
|
if (op == OP_TEST || (start == buf && *start == '/')) { |
|
if (strncmp(buf, "man/", 4) == 0) |
|
start = buf + 4; |
|
else if ((start = strstr(buf, "/man/")) != NULL) |
|
start += 5; |
|
else |
|
start = buf; |
|
} |
|
|
|
/* |
* First try to guess our directory structure. |
* First try to guess our directory structure. |
* If we find a separator, try to look for man* or cat*. |
* If we find a separator, try to look for man* or cat*. |
* If we find one of these and what's underneath is a directory, |
* If we find one of these and what's underneath is a directory, |
Line 931 mlink_add(struct mlink *mlink, const struct stat *st) |
|
Line 953 mlink_add(struct mlink *mlink, const struct stat *st) |
|
assert(NULL == ohash_find(&mlinks, slot)); |
assert(NULL == ohash_find(&mlinks, slot)); |
ohash_insert(&mlinks, slot, mlink); |
ohash_insert(&mlinks, slot, mlink); |
|
|
|
memset(&inodev, 0, sizeof(inodev)); /* Clear padding. */ |
inodev.st_ino = st->st_ino; |
inodev.st_ino = st->st_ino; |
inodev.st_dev = st->st_dev; |
inodev.st_dev = st->st_dev; |
slot = ohash_lookup_memory(&mpages, (char *)&inodev, |
slot = ohash_lookup_memory(&mpages, (char *)&inodev, |
Line 940 mlink_add(struct mlink *mlink, const struct stat *st) |
|
Line 963 mlink_add(struct mlink *mlink, const struct stat *st) |
|
mpage = mandoc_calloc(1, sizeof(struct mpage)); |
mpage = mandoc_calloc(1, sizeof(struct mpage)); |
mpage->inodev.st_ino = inodev.st_ino; |
mpage->inodev.st_ino = inodev.st_ino; |
mpage->inodev.st_dev = inodev.st_dev; |
mpage->inodev.st_dev = inodev.st_dev; |
|
mpage->form = FORM_NONE; |
|
mpage->next = mpage_head; |
|
mpage_head = mpage; |
ohash_insert(&mpages, slot, mpage); |
ohash_insert(&mpages, slot, mpage); |
} else |
} else |
mlink->next = mpage->mlinks; |
mlink->next = mpage->mlinks; |
Line 963 mpages_free(void) |
|
Line 989 mpages_free(void) |
|
{ |
{ |
struct mpage *mpage; |
struct mpage *mpage; |
struct mlink *mlink; |
struct mlink *mlink; |
unsigned int slot; |
|
|
|
mpage = ohash_first(&mpages, &slot); |
while ((mpage = mpage_head) != NULL) { |
while (NULL != mpage) { |
while ((mlink = mpage->mlinks) != NULL) { |
while (NULL != (mlink = mpage->mlinks)) { |
|
mpage->mlinks = mlink->next; |
mpage->mlinks = mlink->next; |
mlink_free(mlink); |
mlink_free(mlink); |
} |
} |
|
mpage_head = mpage->next; |
free(mpage->sec); |
free(mpage->sec); |
free(mpage->arch); |
free(mpage->arch); |
free(mpage->title); |
free(mpage->title); |
free(mpage->desc); |
free(mpage->desc); |
free(mpage); |
free(mpage); |
mpage = ohash_next(&mpages, &slot); |
|
} |
} |
} |
} |
|
|
Line 1053 mlink_check(struct mpage *mpage, struct mlink *mlink) |
|
Line 1077 mlink_check(struct mpage *mpage, struct mlink *mlink) |
|
* architectures. |
* architectures. |
* A few manuals are even shared across completely |
* A few manuals are even shared across completely |
* different architectures, for example fdformat(1) |
* different architectures, for example fdformat(1) |
* on amd64, i386, sparc, and sparc64. |
* on amd64, i386, and sparc64. |
*/ |
*/ |
|
|
if (strcasecmp(mpage->arch, mlink->arch)) |
if (strcasecmp(mpage->arch, mlink->arch)) |
Line 1088 mlink_check(struct mpage *mpage, struct mlink *mlink) |
|
Line 1112 mlink_check(struct mpage *mpage, struct mlink *mlink) |
|
* and filename to determine whether the file is parsable or not. |
* and filename to determine whether the file is parsable or not. |
*/ |
*/ |
static void |
static void |
mpages_merge(struct mparse *mp) |
mpages_merge(struct dba *dba, struct mparse *mp) |
{ |
{ |
char any[] = "any"; |
|
struct ohash_info str_info; |
|
struct mpage *mpage, *mpage_dest; |
struct mpage *mpage, *mpage_dest; |
struct mlink *mlink, *mlink_dest; |
struct mlink *mlink, *mlink_dest; |
struct mdoc *mdoc; |
struct roff_meta *meta; |
struct man *man; |
|
char *sodest; |
|
char *cp; |
char *cp; |
int fd; |
int fd; |
unsigned int pslot; |
|
enum mandoclevel lvl; |
|
|
|
str_info.alloc = hash_alloc; |
for (mpage = mpage_head; mpage != NULL; mpage = mpage->next) { |
str_info.calloc = hash_calloc; |
|
str_info.free = hash_free; |
|
str_info.key_offset = offsetof(struct str, key); |
|
|
|
if ( ! nodb) |
|
SQL_EXEC("BEGIN TRANSACTION"); |
|
|
|
mpage = ohash_first(&mpages, &pslot); |
|
while (mpage != NULL) { |
|
mlinks_undupe(mpage); |
mlinks_undupe(mpage); |
if (mpage->mlinks == NULL) { |
if ((mlink = mpage->mlinks) == NULL) |
mpage = ohash_next(&mpages, &pslot); |
|
continue; |
continue; |
} |
|
|
|
name_mask = NAME_MASK; |
name_mask = NAME_MASK; |
ohash_init(&names, 4, &str_info); |
mandoc_ohash_init(&names, 4, offsetof(struct str, key)); |
ohash_init(&strings, 6, &str_info); |
mandoc_ohash_init(&strings, 6, offsetof(struct str, key)); |
mparse_reset(mp); |
mparse_reset(mp); |
mdoc = NULL; |
meta = NULL; |
man = NULL; |
|
sodest = NULL; |
|
|
|
mparse_open(mp, &fd, mpage->mlinks->file); |
if ((fd = mparse_open(mp, mlink->file)) == -1) { |
if (fd == -1) { |
say(mlink->file, "&open"); |
say(mpage->mlinks->file, "&open"); |
|
goto nextpage; |
goto nextpage; |
} |
} |
|
|
/* |
/* |
* Try interpreting the file as mdoc(7) or man(7) |
* Interpret the file as mdoc(7) or man(7) source |
* source code, unless it is already known to be |
* code, unless it is known to be formatted. |
* formatted. Fall back to formatted mode. |
|
*/ |
*/ |
if (mpage->mlinks->dform != FORM_CAT || |
if (mlink->dform != FORM_CAT || mlink->fform != FORM_CAT) { |
mpage->mlinks->fform != FORM_CAT) { |
mparse_readfd(mp, fd, mlink->file); |
lvl = mparse_readfd(mp, fd, mpage->mlinks->file); |
close(fd); |
if (lvl < MANDOCLEVEL_FATAL) |
fd = -1; |
mparse_result(mp, &mdoc, &man, &sodest); |
meta = mparse_result(mp); |
} |
} |
|
|
if (sodest != NULL) { |
if (meta != NULL && meta->sodest != NULL) { |
mlink_dest = ohash_find(&mlinks, |
mlink_dest = ohash_find(&mlinks, |
ohash_qlookup(&mlinks, sodest)); |
ohash_qlookup(&mlinks, meta->sodest)); |
if (mlink_dest == NULL) { |
if (mlink_dest == NULL) { |
mandoc_asprintf(&cp, "%s.gz", sodest); |
mandoc_asprintf(&cp, "%s.gz", meta->sodest); |
mlink_dest = ohash_find(&mlinks, |
mlink_dest = ohash_find(&mlinks, |
ohash_qlookup(&mlinks, cp)); |
ohash_qlookup(&mlinks, cp)); |
free(cp); |
free(cp); |
Line 1158 mpages_merge(struct mparse *mp) |
|
Line 1161 mpages_merge(struct mparse *mp) |
|
/* The .so target exists. */ |
/* The .so target exists. */ |
|
|
mpage_dest = mlink_dest->mpage; |
mpage_dest = mlink_dest->mpage; |
mlink = mpage->mlinks; |
|
while (1) { |
while (1) { |
mlink->mpage = mpage_dest; |
mlink->mpage = mpage_dest; |
|
|
Line 1171 mpages_merge(struct mparse *mp) |
|
Line 1173 mpages_merge(struct mparse *mp) |
|
* to the target. |
* to the target. |
*/ |
*/ |
|
|
if (mpage_dest->pageid) |
if (mpage_dest->dba != NULL) |
dbadd_mlink_name(mlink); |
dbadd_mlink(mlink); |
|
|
if (mlink->next == NULL) |
if (mlink->next == NULL) |
break; |
break; |
Line 1186 mpages_merge(struct mparse *mp) |
|
Line 1188 mpages_merge(struct mparse *mp) |
|
mpage->mlinks = NULL; |
mpage->mlinks = NULL; |
} |
} |
goto nextpage; |
goto nextpage; |
} else if (mdoc != NULL) { |
} else if (meta != NULL && meta->macroset == MACROSET_MDOC) { |
mpage->form = FORM_SRC; |
mpage->form = FORM_SRC; |
mpage->sec = mdoc_meta(mdoc)->msec; |
mpage->sec = meta->msec; |
mpage->sec = mandoc_strdup( |
mpage->sec = mandoc_strdup( |
mpage->sec == NULL ? "" : mpage->sec); |
mpage->sec == NULL ? "" : mpage->sec); |
mpage->arch = mdoc_meta(mdoc)->arch; |
mpage->arch = meta->arch; |
mpage->arch = mandoc_strdup( |
mpage->arch = mandoc_strdup( |
mpage->arch == NULL ? "" : mpage->arch); |
mpage->arch == NULL ? "" : mpage->arch); |
mpage->title = |
mpage->title = mandoc_strdup(meta->title); |
mandoc_strdup(mdoc_meta(mdoc)->title); |
} else if (meta != NULL && meta->macroset == MACROSET_MAN) { |
} else if (man != NULL) { |
if (*meta->msec != '\0' || *meta->title != '\0') { |
mpage->form = FORM_SRC; |
mpage->form = FORM_SRC; |
mpage->sec = |
mpage->sec = mandoc_strdup(meta->msec); |
mandoc_strdup(man_meta(man)->msec); |
mpage->arch = mandoc_strdup(mlink->arch); |
mpage->arch = |
mpage->title = mandoc_strdup(meta->title); |
mandoc_strdup(mpage->mlinks->arch); |
} else |
mpage->title = |
meta = NULL; |
mandoc_strdup(man_meta(man)->title); |
|
} else { |
|
mpage->form = FORM_CAT; |
|
mpage->sec = |
|
mandoc_strdup(mpage->mlinks->dsec); |
|
mpage->arch = |
|
mandoc_strdup(mpage->mlinks->arch); |
|
mpage->title = |
|
mandoc_strdup(mpage->mlinks->name); |
|
} |
} |
putkey(mpage, mpage->sec, TYPE_sec); |
|
if (*mpage->arch != '\0') |
|
putkey(mpage, mpage->arch, TYPE_arch); |
|
|
|
for (mlink = mpage->mlinks; mlink; mlink = mlink->next) { |
|
if ('\0' != *mlink->dsec) |
|
putkey(mpage, mlink->dsec, TYPE_sec); |
|
if ('\0' != *mlink->fsec) |
|
putkey(mpage, mlink->fsec, TYPE_sec); |
|
putkey(mpage, '\0' == *mlink->arch ? |
|
any : mlink->arch, TYPE_arch); |
|
putkey(mpage, mlink->name, NAME_FILE); |
|
} |
|
|
|
assert(mpage->desc == NULL); |
assert(mpage->desc == NULL); |
if (mdoc != NULL) |
if (meta == NULL) { |
parse_mdoc(mpage, mdoc_meta(mdoc), mdoc_node(mdoc)); |
mpage->form = FORM_CAT; |
else if (man != NULL) |
mpage->sec = mandoc_strdup(mlink->dsec); |
parse_man(mpage, man_meta(man), man_node(man)); |
mpage->arch = mandoc_strdup(mlink->arch); |
else |
mpage->title = mandoc_strdup(mlink->name); |
parse_cat(mpage, fd); |
parse_cat(mpage, fd); |
if (mpage->desc == NULL) |
} else if (meta->macroset == MACROSET_MDOC) |
mpage->desc = mandoc_strdup(mpage->mlinks->name); |
parse_mdoc(mpage, meta, meta->first); |
|
else |
|
parse_man(mpage, meta, meta->first); |
|
if (mpage->desc == NULL) { |
|
mpage->desc = mandoc_strdup(mlink->name); |
|
if (warnings) |
|
say(mlink->file, "No one-line description, " |
|
"using filename \"%s\"", mlink->name); |
|
} |
|
|
if (warnings && !use_all) |
for (mlink = mpage->mlinks; |
for (mlink = mpage->mlinks; mlink; |
mlink != NULL; |
mlink = mlink->next) |
mlink = mlink->next) { |
|
putkey(mpage, mlink->name, NAME_FILE); |
|
if (warnings && !use_all) |
mlink_check(mpage, mlink); |
mlink_check(mpage, mlink); |
|
} |
|
|
dbadd(mpage); |
dbadd(dba, mpage); |
|
|
nextpage: |
nextpage: |
if (mparse_wait(mp) != MANDOCLEVEL_OK) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say(mpage->mlinks->file, "&wait gunzip"); |
|
} |
|
ohash_delete(&strings); |
ohash_delete(&strings); |
ohash_delete(&names); |
ohash_delete(&names); |
mpage = ohash_next(&mpages, &pslot); |
|
} |
} |
|
|
if (0 == nodb) |
|
SQL_EXEC("END TRANSACTION"); |
|
} |
} |
|
|
static void |
static void |
names_check(void) |
|
{ |
|
sqlite3_stmt *stmt; |
|
const char *name, *sec, *arch, *key; |
|
int irc; |
|
|
|
sqlite3_prepare_v2(db, |
|
"SELECT name, sec, arch, key FROM (" |
|
"SELECT name AS key, pageid FROM names " |
|
"WHERE bits & ? AND NOT EXISTS (" |
|
"SELECT pageid FROM mlinks " |
|
"WHERE mlinks.pageid == names.pageid " |
|
"AND mlinks.name == names.name" |
|
")" |
|
") JOIN (" |
|
"SELECT sec, arch, name, pageid FROM mlinks " |
|
"GROUP BY pageid" |
|
") USING (pageid);", |
|
-1, &stmt, NULL); |
|
|
|
if (SQLITE_OK != sqlite3_bind_int64(stmt, 1, NAME_TITLE)) |
|
say("", "%s", sqlite3_errmsg(db)); |
|
|
|
while (SQLITE_ROW == (irc = sqlite3_step(stmt))) { |
|
name = (const char *)sqlite3_column_text(stmt, 0); |
|
sec = (const char *)sqlite3_column_text(stmt, 1); |
|
arch = (const char *)sqlite3_column_text(stmt, 2); |
|
key = (const char *)sqlite3_column_text(stmt, 3); |
|
say("", "%s(%s%s%s) lacks mlink \"%s\"", name, sec, |
|
'\0' == *arch ? "" : "/", |
|
'\0' == *arch ? "" : arch, key); |
|
} |
|
sqlite3_finalize(stmt); |
|
} |
|
|
|
static void |
|
parse_cat(struct mpage *mpage, int fd) |
parse_cat(struct mpage *mpage, int fd) |
{ |
{ |
FILE *stream; |
FILE *stream; |
char *line, *p, *title; |
struct mlink *mlink; |
size_t len, plen, titlesz; |
char *line, *p, *title, *sec; |
|
size_t linesz, plen, titlesz; |
|
ssize_t len; |
|
int offs; |
|
|
stream = (-1 == fd) ? |
mlink = mpage->mlinks; |
fopen(mpage->mlinks->file, "r") : |
stream = fd == -1 ? fopen(mlink->file, "r") : fdopen(fd, "r"); |
fdopen(fd, "r"); |
if (stream == NULL) { |
if (NULL == stream) { |
if (fd != -1) |
if (-1 != fd) |
|
close(fd); |
close(fd); |
if (warnings) |
if (warnings) |
say(mpage->mlinks->file, "&fopen"); |
say(mlink->file, "&fopen"); |
return; |
return; |
} |
} |
|
|
|
line = NULL; |
|
linesz = 0; |
|
|
|
/* Parse the section number from the header line. */ |
|
|
|
while (getline(&line, &linesz, stream) != -1) { |
|
if (*line == '\n') |
|
continue; |
|
if ((sec = strchr(line, '(')) == NULL) |
|
break; |
|
if ((p = strchr(++sec, ')')) == NULL) |
|
break; |
|
free(mpage->sec); |
|
mpage->sec = mandoc_strndup(sec, p - sec); |
|
if (warnings && *mlink->dsec != '\0' && |
|
strcasecmp(mpage->sec, mlink->dsec)) |
|
say(mlink->file, |
|
"Section \"%s\" manual in %s directory", |
|
mpage->sec, mlink->dsec); |
|
break; |
|
} |
|
|
/* Skip to first blank line. */ |
/* Skip to first blank line. */ |
|
|
while (NULL != (line = fgetln(stream, &len))) |
while (line == NULL || *line != '\n') |
if ('\n' == *line) |
if (getline(&line, &linesz, stream) == -1) |
break; |
break; |
|
|
/* |
/* |
Line 1323 parse_cat(struct mpage *mpage, int fd) |
|
Line 1294 parse_cat(struct mpage *mpage, int fd) |
|
* is the first section header. Skip to it. |
* is the first section header. Skip to it. |
*/ |
*/ |
|
|
while (NULL != (line = fgetln(stream, &len))) |
while (getline(&line, &linesz, stream) != -1) |
if ('\n' != *line && ' ' != *line) |
if (*line != '\n' && *line != ' ') |
break; |
break; |
|
|
/* |
/* |
Line 1337 parse_cat(struct mpage *mpage, int fd) |
|
Line 1308 parse_cat(struct mpage *mpage, int fd) |
|
titlesz = 0; |
titlesz = 0; |
title = NULL; |
title = NULL; |
|
|
while (NULL != (line = fgetln(stream, &len))) { |
while ((len = getline(&line, &linesz, stream)) != -1) { |
if (' ' != *line || '\n' != line[len - 1]) |
if (*line != ' ') |
break; |
break; |
while (len > 0 && isspace((unsigned char)*line)) { |
offs = 0; |
line++; |
while (isspace((unsigned char)line[offs])) |
len--; |
offs++; |
} |
if (line[offs] == '\0') |
if (1 == len) |
|
continue; |
continue; |
title = mandoc_realloc(title, titlesz + len); |
title = mandoc_realloc(title, titlesz + len - offs); |
memcpy(title + titlesz, line, len); |
memcpy(title + titlesz, line + offs, len - offs); |
titlesz += len; |
titlesz += len - offs; |
title[titlesz - 1] = ' '; |
title[titlesz - 1] = ' '; |
} |
} |
|
free(line); |
|
|
/* |
/* |
* If no page content can be found, or the input line |
* If no page content can be found, or the input line |
Line 1361 parse_cat(struct mpage *mpage, int fd) |
|
Line 1332 parse_cat(struct mpage *mpage, int fd) |
|
|
|
if (NULL == title || '\0' == *title) { |
if (NULL == title || '\0' == *title) { |
if (warnings) |
if (warnings) |
say(mpage->mlinks->file, |
say(mlink->file, "Cannot find NAME section"); |
"Cannot find NAME section"); |
|
fclose(stream); |
fclose(stream); |
free(title); |
free(title); |
return; |
return; |
} |
} |
|
|
title = mandoc_realloc(title, titlesz + 1); |
title[titlesz - 1] = '\0'; |
title[titlesz] = '\0'; |
|
|
|
/* |
/* |
* Skip to the first dash. |
* Skip to the first dash. |
Line 1382 parse_cat(struct mpage *mpage, int fd) |
|
Line 1351 parse_cat(struct mpage *mpage, int fd) |
|
/* Skip to next word. */ ; |
/* Skip to next word. */ ; |
} else { |
} else { |
if (warnings) |
if (warnings) |
say(mpage->mlinks->file, |
say(mlink->file, "No dash in title line, " |
"No dash in title line"); |
"reusing \"%s\" as one-line description", title); |
p = title; |
p = title; |
} |
} |
|
|
Line 1401 parse_cat(struct mpage *mpage, int fd) |
|
Line 1370 parse_cat(struct mpage *mpage, int fd) |
|
plen -= 2; |
plen -= 2; |
} |
} |
|
|
mpage->desc = mandoc_strdup(p); |
/* |
|
* Cut off excessive one-line descriptions. |
|
* Bad pages are not worth better heuristics. |
|
*/ |
|
|
|
mpage->desc = mandoc_strndup(p, 150); |
fclose(stream); |
fclose(stream); |
free(title); |
free(title); |
} |
} |
Line 1412 parse_cat(struct mpage *mpage, int fd) |
|
Line 1386 parse_cat(struct mpage *mpage, int fd) |
|
static void |
static void |
putkey(const struct mpage *mpage, char *value, uint64_t type) |
putkey(const struct mpage *mpage, char *value, uint64_t type) |
{ |
{ |
char *cp; |
|
|
|
assert(NULL != value); |
|
if (TYPE_arch == type) |
|
for (cp = value; *cp; cp++) |
|
if (isupper((unsigned char)*cp)) |
|
*cp = _tolower((unsigned char)*cp); |
|
putkeys(mpage, value, strlen(value), type); |
putkeys(mpage, value, strlen(value), type); |
} |
} |
|
|
Line 1427 putkey(const struct mpage *mpage, char *value, uint64_ |
|
Line 1394 putkey(const struct mpage *mpage, char *value, uint64_ |
|
*/ |
*/ |
static void |
static void |
putmdockey(const struct mpage *mpage, |
putmdockey(const struct mpage *mpage, |
const struct mdoc_node *n, uint64_t m) |
const struct roff_node *n, uint64_t m, int taboo) |
{ |
{ |
|
|
for ( ; NULL != n; n = n->next) { |
for ( ; NULL != n; n = n->next) { |
|
if (n->flags & taboo) |
|
continue; |
if (NULL != n->child) |
if (NULL != n->child) |
putmdockey(mpage, n->child, m); |
putmdockey(mpage, n->child, m, taboo); |
if (MDOC_TEXT == n->type) |
if (n->type == ROFFT_TEXT) |
putkey(mpage, n->string, m); |
putkey(mpage, n->string, m); |
} |
} |
} |
} |
|
|
static void |
static void |
parse_man(struct mpage *mpage, const struct man_meta *meta, |
parse_man(struct mpage *mpage, const struct roff_meta *meta, |
const struct man_node *n) |
const struct roff_node *n) |
{ |
{ |
const struct man_node *head, *body; |
const struct roff_node *head, *body; |
char *start, *title; |
char *start, *title; |
char byte; |
char byte; |
size_t sz; |
size_t sz; |
|
|
if (NULL == n) |
if (n == NULL) |
return; |
return; |
|
|
/* |
/* |
Line 1457 parse_man(struct mpage *mpage, const struct man_meta * |
|
Line 1426 parse_man(struct mpage *mpage, const struct man_meta * |
|
* the correct section or not. |
* the correct section or not. |
*/ |
*/ |
|
|
if (MAN_BODY == n->type && MAN_SH == n->tok) { |
if (n->type == ROFFT_BODY && n->tok == MAN_SH) { |
body = n; |
body = n; |
assert(body->parent); |
if ((head = body->parent->head) != NULL && |
if (NULL != (head = body->parent->head) && |
(head = head->child) != NULL && |
1 == head->nchild && |
head->next == NULL && |
NULL != (head = (head->child)) && |
head->type == ROFFT_TEXT && |
MAN_TEXT == head->type && |
strcmp(head->string, "NAME") == 0 && |
0 == strcmp(head->string, "NAME") && |
body->child != NULL) { |
NULL != body->child) { |
|
|
|
/* |
/* |
* Suck the entire NAME section into memory. |
* Suck the entire NAME section into memory. |
Line 1475 parse_man(struct mpage *mpage, const struct man_meta * |
|
Line 1443 parse_man(struct mpage *mpage, const struct man_meta * |
|
*/ |
*/ |
|
|
title = NULL; |
title = NULL; |
man_deroff(&title, body); |
deroff(&title, body); |
if (NULL == title) |
if (NULL == title) |
return; |
return; |
|
|
Line 1551 parse_man(struct mpage *mpage, const struct man_meta * |
|
Line 1519 parse_man(struct mpage *mpage, const struct man_meta * |
|
while (' ' == *start) |
while (' ' == *start) |
start++; |
start++; |
|
|
mpage->desc = mandoc_strdup(start); |
/* |
|
* Cut off excessive one-line descriptions. |
|
* Bad pages are not worth better heuristics. |
|
*/ |
|
|
|
mpage->desc = mandoc_strndup(start, 150); |
free(title); |
free(title); |
return; |
return; |
} |
} |
Line 1565 parse_man(struct mpage *mpage, const struct man_meta * |
|
Line 1538 parse_man(struct mpage *mpage, const struct man_meta * |
|
} |
} |
|
|
static void |
static void |
parse_mdoc(struct mpage *mpage, const struct mdoc_meta *meta, |
parse_mdoc(struct mpage *mpage, const struct roff_meta *meta, |
const struct mdoc_node *n) |
const struct roff_node *n) |
{ |
{ |
|
const struct mdoc_handler *handler; |
|
|
assert(NULL != n); |
for (n = n->child; n != NULL; n = n->next) { |
for (n = n->child; NULL != n; n = n->next) { |
if (n->tok == TOKEN_NONE || n->tok < ROFF_MAX) |
|
continue; |
|
assert(n->tok >= MDOC_Dd && n->tok < MDOC_MAX); |
|
handler = mdoc_handlers + (n->tok - MDOC_Dd); |
|
if (n->flags & handler->taboo) |
|
continue; |
|
|
switch (n->type) { |
switch (n->type) { |
case MDOC_ELEM: |
case ROFFT_ELEM: |
/* FALLTHROUGH */ |
case ROFFT_BLOCK: |
case MDOC_BLOCK: |
case ROFFT_HEAD: |
/* FALLTHROUGH */ |
case ROFFT_BODY: |
case MDOC_HEAD: |
case ROFFT_TAIL: |
/* FALLTHROUGH */ |
if (handler->fp != NULL && |
case MDOC_BODY: |
(*handler->fp)(mpage, meta, n) == 0) |
/* FALLTHROUGH */ |
break; |
case MDOC_TAIL: |
if (handler->mask) |
if (NULL != mdocs[n->tok].fp) |
|
if (0 == (*mdocs[n->tok].fp)(mpage, meta, n)) |
|
break; |
|
if (mdocs[n->tok].mask) |
|
putmdockey(mpage, n->child, |
putmdockey(mpage, n->child, |
mdocs[n->tok].mask); |
handler->mask, handler->taboo); |
break; |
break; |
default: |
default: |
assert(MDOC_ROOT != n->type); |
|
continue; |
continue; |
} |
} |
if (NULL != n->child) |
if (NULL != n->child) |
Line 1598 parse_mdoc(struct mpage *mpage, const struct mdoc_meta |
|
Line 1573 parse_mdoc(struct mpage *mpage, const struct mdoc_meta |
|
} |
} |
|
|
static int |
static int |
parse_mdoc_Fd(struct mpage *mpage, const struct mdoc_meta *meta, |
parse_mdoc_Fa(struct mpage *mpage, const struct roff_meta *meta, |
const struct mdoc_node *n) |
const struct roff_node *n) |
{ |
{ |
|
uint64_t mask; |
|
|
|
mask = TYPE_Fa; |
|
if (n->sec == SEC_SYNOPSIS) |
|
mask |= TYPE_Vt; |
|
|
|
putmdockey(mpage, n->child, mask, 0); |
|
return 0; |
|
} |
|
|
|
static int |
|
parse_mdoc_Fd(struct mpage *mpage, const struct roff_meta *meta, |
|
const struct roff_node *n) |
|
{ |
char *start, *end; |
char *start, *end; |
size_t sz; |
size_t sz; |
|
|
if (SEC_SYNOPSIS != n->sec || |
if (SEC_SYNOPSIS != n->sec || |
NULL == (n = n->child) || |
NULL == (n = n->child) || |
MDOC_TEXT != n->type) |
n->type != ROFFT_TEXT) |
return(0); |
return 0; |
|
|
/* |
/* |
* Only consider those `Fd' macro fields that begin with an |
* Only consider those `Fd' macro fields that begin with an |
Line 1615 parse_mdoc_Fd(struct mpage *mpage, const struct mdoc_m |
|
Line 1604 parse_mdoc_Fd(struct mpage *mpage, const struct mdoc_m |
|
*/ |
*/ |
|
|
if (strcmp("#include", n->string)) |
if (strcmp("#include", n->string)) |
return(0); |
return 0; |
|
|
if (NULL == (n = n->next) || MDOC_TEXT != n->type) |
if ((n = n->next) == NULL || n->type != ROFFT_TEXT) |
return(0); |
return 0; |
|
|
/* |
/* |
* Strip away the enclosing angle brackets and make sure we're |
* Strip away the enclosing angle brackets and make sure we're |
Line 1630 parse_mdoc_Fd(struct mpage *mpage, const struct mdoc_m |
|
Line 1619 parse_mdoc_Fd(struct mpage *mpage, const struct mdoc_m |
|
start++; |
start++; |
|
|
if (0 == (sz = strlen(start))) |
if (0 == (sz = strlen(start))) |
return(0); |
return 0; |
|
|
end = &start[(int)sz - 1]; |
end = &start[(int)sz - 1]; |
if ('>' == *end || '"' == *end) |
if ('>' == *end || '"' == *end) |
Line 1638 parse_mdoc_Fd(struct mpage *mpage, const struct mdoc_m |
|
Line 1627 parse_mdoc_Fd(struct mpage *mpage, const struct mdoc_m |
|
|
|
if (end > start) |
if (end > start) |
putkeys(mpage, start, end - start + 1, TYPE_In); |
putkeys(mpage, start, end - start + 1, TYPE_In); |
return(0); |
return 0; |
} |
} |
|
|
static void |
static void |
parse_mdoc_fname(struct mpage *mpage, const struct mdoc_node *n) |
parse_mdoc_fname(struct mpage *mpage, const struct roff_node *n) |
{ |
{ |
char *cp; |
char *cp; |
size_t sz; |
size_t sz; |
|
|
if (n->type != MDOC_TEXT) |
if (n->type != ROFFT_TEXT) |
return; |
return; |
|
|
/* Skip function pointer punctuation. */ |
/* Skip function pointer punctuation. */ |
Line 1663 parse_mdoc_fname(struct mpage *mpage, const struct mdo |
|
Line 1652 parse_mdoc_fname(struct mpage *mpage, const struct mdo |
|
} |
} |
|
|
static int |
static int |
parse_mdoc_Fn(struct mpage *mpage, const struct mdoc_meta *meta, |
parse_mdoc_Fn(struct mpage *mpage, const struct roff_meta *meta, |
const struct mdoc_node *n) |
const struct roff_node *n) |
{ |
{ |
|
uint64_t mask; |
|
|
if (n->child == NULL) |
if (n->child == NULL) |
return(0); |
return 0; |
|
|
parse_mdoc_fname(mpage, n->child); |
parse_mdoc_fname(mpage, n->child); |
|
|
for (n = n->child->next; n != NULL; n = n->next) |
n = n->child->next; |
if (n->type == MDOC_TEXT) |
if (n != NULL && n->type == ROFFT_TEXT) { |
putkey(mpage, n->string, TYPE_Fa); |
mask = TYPE_Fa; |
|
if (n->sec == SEC_SYNOPSIS) |
|
mask |= TYPE_Vt; |
|
putmdockey(mpage, n, mask, 0); |
|
} |
|
|
return(0); |
return 0; |
} |
} |
|
|
static int |
static int |
parse_mdoc_Fo(struct mpage *mpage, const struct mdoc_meta *meta, |
parse_mdoc_Fo(struct mpage *mpage, const struct roff_meta *meta, |
const struct mdoc_node *n) |
const struct roff_node *n) |
{ |
{ |
|
|
if (n->type != MDOC_HEAD) |
if (n->type != ROFFT_HEAD) |
return(1); |
return 1; |
|
|
if (n->child != NULL) |
if (n->child != NULL) |
parse_mdoc_fname(mpage, n->child); |
parse_mdoc_fname(mpage, n->child); |
|
|
return(0); |
return 0; |
} |
} |
|
|
static int |
static int |
parse_mdoc_Xr(struct mpage *mpage, const struct mdoc_meta *meta, |
parse_mdoc_Va(struct mpage *mpage, const struct roff_meta *meta, |
const struct mdoc_node *n) |
const struct roff_node *n) |
{ |
{ |
|
char *cp; |
|
|
|
if (n->type != ROFFT_ELEM && n->type != ROFFT_BODY) |
|
return 0; |
|
|
|
if (n->child != NULL && |
|
n->child->next == NULL && |
|
n->child->type == ROFFT_TEXT) |
|
return 1; |
|
|
|
cp = NULL; |
|
deroff(&cp, n); |
|
if (cp != NULL) { |
|
putkey(mpage, cp, TYPE_Vt | (n->tok == MDOC_Va || |
|
n->type == ROFFT_BODY ? TYPE_Va : 0)); |
|
free(cp); |
|
} |
|
|
|
return 0; |
|
} |
|
|
|
static int |
|
parse_mdoc_Xr(struct mpage *mpage, const struct roff_meta *meta, |
|
const struct roff_node *n) |
|
{ |
char *cp; |
char *cp; |
|
|
if (NULL == (n = n->child)) |
if (NULL == (n = n->child)) |
return(0); |
return 0; |
|
|
if (NULL == n->next) { |
if (NULL == n->next) { |
putkey(mpage, n->string, TYPE_Xr); |
putkey(mpage, n->string, TYPE_Xr); |
return(0); |
return 0; |
} |
} |
|
|
mandoc_asprintf(&cp, "%s(%s)", n->string, n->next->string); |
mandoc_asprintf(&cp, "%s(%s)", n->string, n->next->string); |
putkey(mpage, cp, TYPE_Xr); |
putkey(mpage, cp, TYPE_Xr); |
free(cp); |
free(cp); |
return(0); |
return 0; |
} |
} |
|
|
static int |
static int |
parse_mdoc_Nd(struct mpage *mpage, const struct mdoc_meta *meta, |
parse_mdoc_Nd(struct mpage *mpage, const struct roff_meta *meta, |
const struct mdoc_node *n) |
const struct roff_node *n) |
{ |
{ |
|
|
if (MDOC_BODY == n->type) |
if (n->type == ROFFT_BODY) |
mdoc_deroff(&mpage->desc, n); |
deroff(&mpage->desc, n); |
return(0); |
return 0; |
} |
} |
|
|
static int |
static int |
parse_mdoc_Nm(struct mpage *mpage, const struct mdoc_meta *meta, |
parse_mdoc_Nm(struct mpage *mpage, const struct roff_meta *meta, |
const struct mdoc_node *n) |
const struct roff_node *n) |
{ |
{ |
|
|
if (SEC_NAME == n->sec) |
if (SEC_NAME == n->sec) |
putmdockey(mpage, n->child, NAME_TITLE); |
putmdockey(mpage, n->child, NAME_TITLE, 0); |
else if (SEC_SYNOPSIS == n->sec && MDOC_HEAD == n->type) { |
else if (n->sec == SEC_SYNOPSIS && n->type == ROFFT_HEAD) { |
if (n->child == NULL) |
if (n->child == NULL) |
putkey(mpage, meta->name, NAME_SYN); |
putkey(mpage, meta->name, NAME_SYN); |
else |
else |
putmdockey(mpage, n->child, NAME_SYN); |
putmdockey(mpage, n->child, NAME_SYN, 0); |
} |
} |
if ( ! (mpage->name_head_done || |
if ( ! (mpage->name_head_done || |
n->child == NULL || n->child->string == NULL || |
n->child == NULL || n->child->string == NULL || |
Line 1742 parse_mdoc_Nm(struct mpage *mpage, const struct mdoc_m |
|
Line 1761 parse_mdoc_Nm(struct mpage *mpage, const struct mdoc_m |
|
putkey(mpage, n->child->string, NAME_HEAD); |
putkey(mpage, n->child->string, NAME_HEAD); |
mpage->name_head_done = 1; |
mpage->name_head_done = 1; |
} |
} |
return(0); |
return 0; |
} |
} |
|
|
static int |
static int |
parse_mdoc_Sh(struct mpage *mpage, const struct mdoc_meta *meta, |
parse_mdoc_Sh(struct mpage *mpage, const struct roff_meta *meta, |
const struct mdoc_node *n) |
const struct roff_node *n) |
{ |
{ |
|
|
return(SEC_CUSTOM == n->sec && MDOC_HEAD == n->type); |
return n->sec == SEC_CUSTOM && n->type == ROFFT_HEAD; |
} |
} |
|
|
static int |
static int |
parse_mdoc_head(struct mpage *mpage, const struct mdoc_meta *meta, |
parse_mdoc_head(struct mpage *mpage, const struct roff_meta *meta, |
const struct mdoc_node *n) |
const struct roff_node *n) |
{ |
{ |
|
|
return(MDOC_HEAD == n->type); |
return n->type == ROFFT_HEAD; |
} |
} |
|
|
static int |
|
parse_mdoc_body(struct mpage *mpage, const struct mdoc_meta *meta, |
|
const struct mdoc_node *n) |
|
{ |
|
|
|
return(MDOC_BODY == n->type); |
|
} |
|
|
|
/* |
/* |
* Add a string to the hash table for the current manual. |
* Add a string to the hash table for the current manual. |
* Each string has a bitmask telling which macros it belongs to. |
* Each string has a bitmask telling which macros it belongs to. |
Line 1795 putkeys(const struct mpage *mpage, char *cp, size_t sz |
|
Line 1806 putkeys(const struct mpage *mpage, char *cp, size_t sz |
|
name_mask &= ~NAME_FIRST; |
name_mask &= ~NAME_FIRST; |
if (debug > 1) |
if (debug > 1) |
say(mpage->mlinks->file, |
say(mpage->mlinks->file, |
"Adding name %*s, bits=%d", sz, cp, v); |
"Adding name %*s, bits=0x%llx", (int)sz, cp, |
|
(unsigned long long)v); |
} else { |
} else { |
htab = &strings; |
htab = &strings; |
if (debug > 1) |
if (debug > 1) |
for (i = 0; i < mansearch_keymax; i++) |
for (i = 0; i < KEY_MAX; i++) |
if ((uint64_t)1 << i & v) |
if ((uint64_t)1 << i & v) |
say(mpage->mlinks->file, |
say(mpage->mlinks->file, |
"Adding key %s=%*s", |
"Adding key %s=%*s", |
mansearch_keynames[i], sz, cp); |
mansearch_keynames[i], (int)sz, cp); |
} |
} |
|
|
end = cp + sz; |
end = cp + sz; |
Line 1871 utf8(unsigned int cp, char out[7]) |
|
Line 1883 utf8(unsigned int cp, char out[7]) |
|
out[4] = (cp >> 6 & 63) | 128; |
out[4] = (cp >> 6 & 63) | 128; |
out[5] = (cp & 63) | 128; |
out[5] = (cp & 63) | 128; |
} else |
} else |
return(0); |
return 0; |
|
|
out[rc] = '\0'; |
out[rc] = '\0'; |
return(rc); |
return rc; |
} |
} |
|
|
/* |
/* |
Line 1932 render_string(char **public, size_t *psz) |
|
Line 1944 render_string(char **public, size_t *psz) |
|
case '\\': |
case '\\': |
break; |
break; |
case '\t': |
case '\t': |
/* FALLTHROUGH */ |
|
case ASCII_NBRSP: |
case ASCII_NBRSP: |
dst[dsz++] = ' '; |
dst[dsz++] = ' '; |
scp++; |
scp++; |
Line 1963 render_string(char **public, size_t *psz) |
|
Line 1974 render_string(char **public, size_t *psz) |
|
*/ |
*/ |
|
|
if (write_utf8) { |
if (write_utf8) { |
unicode = mchars_spec2cp(mchars, seq, seqlen); |
unicode = mchars_spec2cp(seq, seqlen); |
if (unicode <= 0) |
if (unicode <= 0) |
continue; |
continue; |
addsz = utf8(unicode, utfbuf); |
addsz = utf8(unicode, utfbuf); |
Line 1971 render_string(char **public, size_t *psz) |
|
Line 1982 render_string(char **public, size_t *psz) |
|
continue; |
continue; |
addcp = utfbuf; |
addcp = utfbuf; |
} else { |
} else { |
addcp = mchars_spec2str(mchars, seq, seqlen, &addsz); |
addcp = mchars_spec2str(seq, seqlen, &addsz); |
if (addcp == NULL) |
if (addcp == NULL) |
continue; |
continue; |
if (*addcp == ASCII_NBRSP) { |
if (*addcp == ASCII_NBRSP) { |
Line 1998 render_string(char **public, size_t *psz) |
|
Line 2009 render_string(char **public, size_t *psz) |
|
--*psz; |
--*psz; |
if (dst != NULL) { |
if (dst != NULL) { |
(*public)[*psz] = '\0'; |
(*public)[*psz] = '\0'; |
return(1); |
return 1; |
} else |
} else |
return(0); |
return 0; |
} |
} |
|
|
static void |
static void |
dbadd_mlink(const struct mlink *mlink) |
dbadd_mlink(const struct mlink *mlink) |
{ |
{ |
size_t i; |
dba_page_alias(mlink->mpage->dba, mlink->name, NAME_FILE); |
|
dba_page_add(mlink->mpage->dba, DBP_SECT, mlink->dsec); |
i = 1; |
dba_page_add(mlink->mpage->dba, DBP_SECT, mlink->fsec); |
SQL_BIND_TEXT(stmts[STMT_INSERT_LINK], i, mlink->dsec); |
dba_page_add(mlink->mpage->dba, DBP_ARCH, mlink->arch); |
SQL_BIND_TEXT(stmts[STMT_INSERT_LINK], i, mlink->arch); |
dba_page_add(mlink->mpage->dba, DBP_FILE, mlink->file); |
SQL_BIND_TEXT(stmts[STMT_INSERT_LINK], i, mlink->name); |
|
SQL_BIND_INT64(stmts[STMT_INSERT_LINK], i, mlink->mpage->pageid); |
|
SQL_STEP(stmts[STMT_INSERT_LINK]); |
|
sqlite3_reset(stmts[STMT_INSERT_LINK]); |
|
} |
} |
|
|
static void |
|
dbadd_mlink_name(const struct mlink *mlink) |
|
{ |
|
uint64_t bits; |
|
size_t i; |
|
|
|
dbadd_mlink(mlink); |
|
|
|
i = 1; |
|
SQL_BIND_INT64(stmts[STMT_SELECT_NAME], i, mlink->mpage->pageid); |
|
bits = NAME_FILE & NAME_MASK; |
|
if (sqlite3_step(stmts[STMT_SELECT_NAME]) == SQLITE_ROW) { |
|
bits |= sqlite3_column_int64(stmts[STMT_SELECT_NAME], 0); |
|
sqlite3_reset(stmts[STMT_SELECT_NAME]); |
|
} |
|
|
|
i = 1; |
|
SQL_BIND_INT64(stmts[STMT_INSERT_NAME], i, bits); |
|
SQL_BIND_TEXT(stmts[STMT_INSERT_NAME], i, mlink->name); |
|
SQL_BIND_INT64(stmts[STMT_INSERT_NAME], i, mlink->mpage->pageid); |
|
SQL_STEP(stmts[STMT_INSERT_NAME]); |
|
sqlite3_reset(stmts[STMT_INSERT_NAME]); |
|
} |
|
|
|
/* |
/* |
* Flush the current page's terms (and their bits) into the database. |
* Flush the current page's terms (and their bits) into the database. |
* Wrap the entire set of additions in a transaction to make sqlite be a |
|
* little faster. |
|
* Also, handle escape sequences at the last possible moment. |
* Also, handle escape sequences at the last possible moment. |
*/ |
*/ |
static void |
static void |
dbadd(struct mpage *mpage) |
dbadd(struct dba *dba, struct mpage *mpage) |
{ |
{ |
struct mlink *mlink; |
struct mlink *mlink; |
struct str *key; |
struct str *key; |
char *cp; |
char *cp; |
|
uint64_t mask; |
size_t i; |
size_t i; |
unsigned int slot; |
unsigned int slot; |
int mustfree; |
int mustfree; |
Line 2097 dbadd(struct mpage *mpage) |
|
Line 2079 dbadd(struct mpage *mpage) |
|
cp = mpage->desc; |
cp = mpage->desc; |
i = strlen(cp); |
i = strlen(cp); |
mustfree = render_string(&cp, &i); |
mustfree = render_string(&cp, &i); |
i = 1; |
mpage->dba = dba_page_new(dba->pages, |
SQL_BIND_TEXT(stmts[STMT_INSERT_PAGE], i, cp); |
*mpage->arch == '\0' ? mlink->arch : mpage->arch, |
SQL_BIND_INT(stmts[STMT_INSERT_PAGE], i, mpage->form); |
cp, mlink->file, mpage->form); |
SQL_STEP(stmts[STMT_INSERT_PAGE]); |
|
mpage->pageid = sqlite3_last_insert_rowid(db); |
|
sqlite3_reset(stmts[STMT_INSERT_PAGE]); |
|
if (mustfree) |
if (mustfree) |
free(cp); |
free(cp); |
|
dba_page_add(mpage->dba, DBP_SECT, mpage->sec); |
|
|
while (NULL != mlink) { |
while (mlink != NULL) { |
dbadd_mlink(mlink); |
dbadd_mlink(mlink); |
mlink = mlink->next; |
mlink = mlink->next; |
} |
} |
mlink = mpage->mlinks; |
|
|
|
for (key = ohash_first(&names, &slot); NULL != key; |
for (key = ohash_first(&names, &slot); NULL != key; |
key = ohash_next(&names, &slot)) { |
key = ohash_next(&names, &slot)) { |
assert(key->mpage == mpage); |
assert(key->mpage == mpage); |
i = 1; |
dba_page_alias(mpage->dba, key->key, key->mask); |
SQL_BIND_INT64(stmts[STMT_INSERT_NAME], i, key->mask); |
|
SQL_BIND_TEXT(stmts[STMT_INSERT_NAME], i, key->key); |
|
SQL_BIND_INT64(stmts[STMT_INSERT_NAME], i, mpage->pageid); |
|
SQL_STEP(stmts[STMT_INSERT_NAME]); |
|
sqlite3_reset(stmts[STMT_INSERT_NAME]); |
|
free(key); |
free(key); |
} |
} |
for (key = ohash_first(&strings, &slot); NULL != key; |
for (key = ohash_first(&strings, &slot); NULL != key; |
key = ohash_next(&strings, &slot)) { |
key = ohash_next(&strings, &slot)) { |
assert(key->mpage == mpage); |
assert(key->mpage == mpage); |
i = 1; |
i = 0; |
SQL_BIND_INT64(stmts[STMT_INSERT_KEY], i, key->mask); |
for (mask = TYPE_Xr; mask <= TYPE_Lb; mask *= 2) { |
SQL_BIND_TEXT(stmts[STMT_INSERT_KEY], i, key->key); |
if (key->mask & mask) |
SQL_BIND_INT64(stmts[STMT_INSERT_KEY], i, mpage->pageid); |
dba_macro_add(dba->macros, i, |
SQL_STEP(stmts[STMT_INSERT_KEY]); |
key->key, mpage->dba); |
sqlite3_reset(stmts[STMT_INSERT_KEY]); |
i++; |
|
} |
free(key); |
free(key); |
} |
} |
} |
} |
|
|
static void |
static void |
dbprune(void) |
dbprune(struct dba *dba) |
{ |
{ |
struct mpage *mpage; |
struct dba_array *page, *files; |
struct mlink *mlink; |
char *file; |
size_t i; |
|
unsigned int slot; |
|
|
|
if (0 == nodb) |
dba_array_FOREACH(dba->pages, page) { |
SQL_EXEC("BEGIN TRANSACTION"); |
files = dba_array_get(page, DBP_FILE); |
|
dba_array_FOREACH(files, file) { |
for (mpage = ohash_first(&mpages, &slot); NULL != mpage; |
if (*file < ' ') |
mpage = ohash_next(&mpages, &slot)) { |
file++; |
mlink = mpage->mlinks; |
if (ohash_find(&mlinks, ohash_qlookup(&mlinks, |
if (debug) |
file)) != NULL) { |
say(mlink->file, "Deleting from database"); |
if (debug) |
if (nodb) |
say(file, "Deleting from database"); |
continue; |
dba_array_del(dba->pages); |
for ( ; NULL != mlink; mlink = mlink->next) { |
break; |
i = 1; |
} |
SQL_BIND_TEXT(stmts[STMT_DELETE_PAGE], |
|
i, mlink->dsec); |
|
SQL_BIND_TEXT(stmts[STMT_DELETE_PAGE], |
|
i, mlink->arch); |
|
SQL_BIND_TEXT(stmts[STMT_DELETE_PAGE], |
|
i, mlink->name); |
|
SQL_STEP(stmts[STMT_DELETE_PAGE]); |
|
sqlite3_reset(stmts[STMT_DELETE_PAGE]); |
|
} |
} |
} |
} |
|
|
if (0 == nodb) |
|
SQL_EXEC("END TRANSACTION"); |
|
} |
} |
|
|
/* |
/* |
* Close an existing database and its prepared statements. |
* Write the database from memory to disk. |
* If "real" is not set, rename the temporary file into the real one. |
|
*/ |
*/ |
static void |
static void |
dbclose(int real) |
dbwrite(struct dba *dba) |
{ |
{ |
size_t i; |
struct stat sb1, sb2; |
int status; |
char tfn[33], *cp1, *cp2; |
pid_t child; |
off_t i; |
|
int fd1, fd2; |
|
|
if (nodb) |
/* |
return; |
* Do not write empty databases, and delete existing ones |
|
* when makewhatis -u causes them to become empty. |
|
*/ |
|
|
for (i = 0; i < STMT__MAX; i++) { |
dba_array_start(dba->pages); |
sqlite3_finalize(stmts[i]); |
if (dba_array_next(dba->pages) == NULL) { |
stmts[i] = NULL; |
if (unlink(MANDOC_DB) == -1 && errno != ENOENT) |
|
say(MANDOC_DB, "&unlink"); |
|
return; |
} |
} |
|
|
sqlite3_close(db); |
/* |
db = NULL; |
* Build the database in a temporary file, |
|
* then atomically move it into place. |
|
*/ |
|
|
if (real) |
if (dba_write(MANDOC_DB "~", dba) != -1) { |
return; |
if (rename(MANDOC_DB "~", MANDOC_DB) == -1) { |
|
|
if ('\0' == *tempfilename) { |
|
if (-1 == rename(MANDOC_DB "~", MANDOC_DB)) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
exitcode = (int)MANDOCLEVEL_SYSERR; |
say(MANDOC_DB, "&rename"); |
say(MANDOC_DB, "&rename"); |
|
unlink(MANDOC_DB "~"); |
} |
} |
return; |
return; |
} |
} |
|
|
switch (child = fork()) { |
/* |
case -1: |
* We lack write permission and cannot replace the database |
exitcode = (int)MANDOCLEVEL_SYSERR; |
* file, but let's at least check whether the data changed. |
say("", "&fork cmp"); |
*/ |
return; |
|
case 0: |
|
execlp("cmp", "cmp", "-s", |
|
tempfilename, MANDOC_DB, NULL); |
|
say("", "&exec cmp"); |
|
exit(0); |
|
default: |
|
break; |
|
} |
|
if (-1 == waitpid(child, &status, 0)) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say("", "&wait cmp"); |
|
} else if (WIFSIGNALED(status)) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say("", "cmp died from signal %d", WTERMSIG(status)); |
|
} else if (WEXITSTATUS(status)) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say(MANDOC_DB, |
|
"Data changed, but cannot replace database"); |
|
} |
|
|
|
*strrchr(tempfilename, '/') = '\0'; |
(void)strlcpy(tfn, "/tmp/mandocdb.XXXXXXXX", sizeof(tfn)); |
switch (child = fork()) { |
if (mkdtemp(tfn) == NULL) { |
case -1: |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
exitcode = (int)MANDOCLEVEL_SYSERR; |
say("", "&fork rm"); |
say("", "&%s", tfn); |
return; |
return; |
case 0: |
|
execlp("rm", "rm", "-rf", tempfilename, NULL); |
|
say("", "&exec rm"); |
|
exit((int)MANDOCLEVEL_SYSERR); |
|
default: |
|
break; |
|
} |
} |
if (-1 == waitpid(child, &status, 0)) { |
cp1 = cp2 = MAP_FAILED; |
exitcode = (int)MANDOCLEVEL_SYSERR; |
fd1 = fd2 = -1; |
say("", "&wait rm"); |
(void)strlcat(tfn, "/" MANDOC_DB, sizeof(tfn)); |
} else if (WIFSIGNALED(status) || WEXITSTATUS(status)) { |
if (dba_write(tfn, dba) == -1) { |
exitcode = (int)MANDOCLEVEL_SYSERR; |
say(tfn, "&dba_write"); |
say("", "%s: Cannot remove temporary directory", |
goto err; |
tempfilename); |
|
} |
} |
} |
if ((fd1 = open(MANDOC_DB, O_RDONLY, 0)) == -1) { |
|
say(MANDOC_DB, "&open"); |
/* |
goto err; |
* This is straightforward stuff. |
|
* Open a database connection to a "temporary" database, then open a set |
|
* of prepared statements we'll use over and over again. |
|
* If "real" is set, we use the existing database; if not, we truncate a |
|
* temporary one. |
|
* Must be matched by dbclose(). |
|
*/ |
|
static int |
|
dbopen(int real) |
|
{ |
|
const char *sql; |
|
int rc, ofl; |
|
|
|
if (nodb) |
|
return(1); |
|
|
|
*tempfilename = '\0'; |
|
ofl = SQLITE_OPEN_READWRITE; |
|
|
|
if (real) { |
|
rc = sqlite3_open_v2(MANDOC_DB, &db, ofl, NULL); |
|
if (SQLITE_OK != rc) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
if (SQLITE_CANTOPEN != rc) |
|
say(MANDOC_DB, "%s", sqlite3_errstr(rc)); |
|
return(0); |
|
} |
|
goto prepare_statements; |
|
} |
} |
|
if ((fd2 = open(tfn, O_RDONLY, 0)) == -1) { |
ofl |= SQLITE_OPEN_CREATE | SQLITE_OPEN_EXCLUSIVE; |
say(tfn, "&open"); |
|
goto err; |
remove(MANDOC_DB "~"); |
|
rc = sqlite3_open_v2(MANDOC_DB "~", &db, ofl, NULL); |
|
if (SQLITE_OK == rc) |
|
goto create_tables; |
|
if (MPARSE_QUICK & mparse_options) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say(MANDOC_DB "~", "%s", sqlite3_errstr(rc)); |
|
return(0); |
|
} |
} |
|
if (fstat(fd1, &sb1) == -1) { |
(void)strlcpy(tempfilename, "/tmp/mandocdb.XXXXXX", |
say(MANDOC_DB, "&fstat"); |
sizeof(tempfilename)); |
goto err; |
if (NULL == mkdtemp(tempfilename)) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say("", "&%s", tempfilename); |
|
return(0); |
|
} |
} |
(void)strlcat(tempfilename, "/" MANDOC_DB, |
if (fstat(fd2, &sb2) == -1) { |
sizeof(tempfilename)); |
say(tfn, "&fstat"); |
rc = sqlite3_open_v2(tempfilename, &db, ofl, NULL); |
goto err; |
if (SQLITE_OK != rc) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say("", "%s: %s", tempfilename, sqlite3_errstr(rc)); |
|
return(0); |
|
} |
} |
|
if (sb1.st_size != sb2.st_size) |
create_tables: |
goto err; |
sql = "CREATE TABLE \"mpages\" (\n" |
if ((cp1 = mmap(NULL, sb1.st_size, PROT_READ, MAP_PRIVATE, |
" \"desc\" TEXT NOT NULL,\n" |
fd1, 0)) == MAP_FAILED) { |
" \"form\" INTEGER NOT NULL,\n" |
say(MANDOC_DB, "&mmap"); |
" \"pageid\" INTEGER PRIMARY KEY AUTOINCREMENT NOT NULL\n" |
goto err; |
");\n" |
|
"\n" |
|
"CREATE TABLE \"mlinks\" (\n" |
|
" \"sec\" TEXT NOT NULL,\n" |
|
" \"arch\" TEXT NOT NULL,\n" |
|
" \"name\" TEXT NOT NULL,\n" |
|
" \"pageid\" INTEGER NOT NULL REFERENCES mpages(pageid) " |
|
"ON DELETE CASCADE\n" |
|
");\n" |
|
"CREATE INDEX mlinks_pageid_idx ON mlinks (pageid);\n" |
|
"\n" |
|
"CREATE TABLE \"names\" (\n" |
|
" \"bits\" INTEGER NOT NULL,\n" |
|
" \"name\" TEXT NOT NULL,\n" |
|
" \"pageid\" INTEGER NOT NULL REFERENCES mpages(pageid) " |
|
"ON DELETE CASCADE,\n" |
|
" UNIQUE (\"name\", \"pageid\") ON CONFLICT REPLACE\n" |
|
");\n" |
|
"\n" |
|
"CREATE TABLE \"keys\" (\n" |
|
" \"bits\" INTEGER NOT NULL,\n" |
|
" \"key\" TEXT NOT NULL,\n" |
|
" \"pageid\" INTEGER NOT NULL REFERENCES mpages(pageid) " |
|
"ON DELETE CASCADE\n" |
|
");\n" |
|
"CREATE INDEX keys_pageid_idx ON keys (pageid);\n"; |
|
|
|
if (SQLITE_OK != sqlite3_exec(db, sql, NULL, NULL, NULL)) { |
|
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say(MANDOC_DB, "%s", sqlite3_errmsg(db)); |
|
sqlite3_close(db); |
|
return(0); |
|
} |
} |
|
if ((cp2 = mmap(NULL, sb2.st_size, PROT_READ, MAP_PRIVATE, |
prepare_statements: |
fd2, 0)) == MAP_FAILED) { |
if (SQLITE_OK != sqlite3_exec(db, |
say(tfn, "&mmap"); |
"PRAGMA foreign_keys = ON", NULL, NULL, NULL)) { |
goto err; |
exitcode = (int)MANDOCLEVEL_SYSERR; |
|
say(MANDOC_DB, "PRAGMA foreign_keys: %s", |
|
sqlite3_errmsg(db)); |
|
sqlite3_close(db); |
|
return(0); |
|
} |
} |
|
for (i = 0; i < sb1.st_size; i++) |
|
if (cp1[i] != cp2[i]) |
|
goto err; |
|
goto out; |
|
|
sql = "DELETE FROM mpages WHERE pageid IN " |
err: |
"(SELECT pageid FROM mlinks WHERE " |
exitcode = (int)MANDOCLEVEL_SYSERR; |
"sec=? AND arch=? AND name=?)"; |
say(MANDOC_DB, "Data changed, but cannot replace database"); |
sqlite3_prepare_v2(db, sql, -1, &stmts[STMT_DELETE_PAGE], NULL); |
|
sql = "INSERT INTO mpages " |
|
"(desc,form) VALUES (?,?)"; |
|
sqlite3_prepare_v2(db, sql, -1, &stmts[STMT_INSERT_PAGE], NULL); |
|
sql = "INSERT INTO mlinks " |
|
"(sec,arch,name,pageid) VALUES (?,?,?,?)"; |
|
sqlite3_prepare_v2(db, sql, -1, &stmts[STMT_INSERT_LINK], NULL); |
|
sql = "SELECT bits FROM names where pageid = ?"; |
|
sqlite3_prepare_v2(db, sql, -1, &stmts[STMT_SELECT_NAME], NULL); |
|
sql = "INSERT INTO names " |
|
"(bits,name,pageid) VALUES (?,?,?)"; |
|
sqlite3_prepare_v2(db, sql, -1, &stmts[STMT_INSERT_NAME], NULL); |
|
sql = "INSERT INTO keys " |
|
"(bits,key,pageid) VALUES (?,?,?)"; |
|
sqlite3_prepare_v2(db, sql, -1, &stmts[STMT_INSERT_KEY], NULL); |
|
|
|
#ifndef __APPLE__ |
out: |
/* |
if (cp1 != MAP_FAILED) |
* When opening a new database, we can turn off |
munmap(cp1, sb1.st_size); |
* synchronous mode for much better performance. |
if (cp2 != MAP_FAILED) |
*/ |
munmap(cp2, sb2.st_size); |
|
if (fd1 != -1) |
if (real && SQLITE_OK != sqlite3_exec(db, |
close(fd1); |
"PRAGMA synchronous = OFF", NULL, NULL, NULL)) { |
if (fd2 != -1) |
exitcode = (int)MANDOCLEVEL_SYSERR; |
close(fd2); |
say(MANDOC_DB, "PRAGMA synchronous: %s", |
unlink(tfn); |
sqlite3_errmsg(db)); |
*strrchr(tfn, '/') = '\0'; |
sqlite3_close(db); |
rmdir(tfn); |
return(0); |
|
} |
|
#endif |
|
|
|
return(1); |
|
} |
} |
|
|
static void * |
|
hash_calloc(size_t n, size_t sz, void *arg) |
|
{ |
|
|
|
return(mandoc_calloc(n, sz)); |
|
} |
|
|
|
static void * |
|
hash_alloc(size_t sz, void *arg) |
|
{ |
|
|
|
return(mandoc_malloc(sz)); |
|
} |
|
|
|
static void |
|
hash_free(void *p, void *arg) |
|
{ |
|
|
|
free(p); |
|
} |
|
|
|
static int |
static int |
set_basedir(const char *targetdir, int report_baddir) |
set_basedir(const char *targetdir, int report_baddir) |
{ |
{ |
Line 2458 set_basedir(const char *targetdir, int report_baddir) |
|
Line 2278 set_basedir(const char *targetdir, int report_baddir) |
|
if (2 == getcwd_status) { |
if (2 == getcwd_status) { |
exitcode = (int)MANDOCLEVEL_SYSERR; |
exitcode = (int)MANDOCLEVEL_SYSERR; |
say("", "getcwd: %s", startdir); |
say("", "getcwd: %s", startdir); |
return(0); |
return 0; |
} |
} |
if (-1 == chdir(startdir)) { |
if (-1 == chdir(startdir)) { |
exitcode = (int)MANDOCLEVEL_SYSERR; |
exitcode = (int)MANDOCLEVEL_SYSERR; |
say("", "&chdir %s", startdir); |
say("", "&chdir %s", startdir); |
return(0); |
return 0; |
} |
} |
} |
} |
|
|
Line 2477 set_basedir(const char *targetdir, int report_baddir) |
|
Line 2297 set_basedir(const char *targetdir, int report_baddir) |
|
exitcode = (int)MANDOCLEVEL_BADARG; |
exitcode = (int)MANDOCLEVEL_BADARG; |
say("", "&%s: realpath", targetdir); |
say("", "&%s: realpath", targetdir); |
} |
} |
return(0); |
return 0; |
} else if (-1 == chdir(basedir)) { |
} else if (-1 == chdir(basedir)) { |
if (report_baddir || errno != ENOENT) { |
if (report_baddir || errno != ENOENT) { |
exitcode = (int)MANDOCLEVEL_BADARG; |
exitcode = (int)MANDOCLEVEL_BADARG; |
say("", "&chdir"); |
say("", "&chdir"); |
} |
} |
return(0); |
return 0; |
} |
} |
chdir_status = 1; |
chdir_status = 1; |
cp = strchr(basedir, '\0'); |
cp = strchr(basedir, '\0'); |
Line 2491 set_basedir(const char *targetdir, int report_baddir) |
|
Line 2311 set_basedir(const char *targetdir, int report_baddir) |
|
if (cp - basedir >= PATH_MAX - 1) { |
if (cp - basedir >= PATH_MAX - 1) { |
exitcode = (int)MANDOCLEVEL_SYSERR; |
exitcode = (int)MANDOCLEVEL_SYSERR; |
say("", "Filename too long"); |
say("", "Filename too long"); |
return(0); |
return 0; |
} |
} |
*cp++ = '/'; |
*cp++ = '/'; |
*cp = '\0'; |
*cp = '\0'; |
} |
} |
return(1); |
return 1; |
} |
} |
|
|
static void |
static void |