You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
610 lines
13 KiB
610 lines
13 KiB
// Part of the ht://Dig package <http://www.htdig.org/>
|
|
// Copyright (c) 1999-2004 The ht://Dig Group
|
|
// For copyright details, see the file COPYING in your distribution
|
|
// or the GNU Library General Public License (LGPL) version 2 or later
|
|
// <http://www.gnu.org/copyleft/lgpl.html>
|
|
//
|
|
|
|
/*-
|
|
* See the file LICENSE for redistribution information.
|
|
*
|
|
* Copyright (c) 1996, 1997, 1998, 1999
|
|
* Sleepycat Software. All rights reserved.
|
|
*/
|
|
|
|
#include "db_config.h"
|
|
#include "htconfig.h"
|
|
|
|
#ifndef lint
|
|
static const char copyright[] =
|
|
"@(#) Copyright (c) 1996, 1997, 1998, 1999\n\
|
|
Sleepycat Software Inc. All rights reserved.\n";
|
|
static const char sccsid[] = "@(#)db_dump.c 11.12 (Sleepycat) 11/10/99";
|
|
#endif
|
|
|
|
#ifndef NO_SYSTEM_INCLUDES
|
|
#include <sys/types.h>
|
|
|
|
#include <errno.h>
|
|
#include <signal.h>
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <unistd.h>
|
|
#ifdef HAVE_GETOPT_H
|
|
#include <getopt.h>
|
|
#endif /* HAVE_GETOPT_H */
|
|
#endif
|
|
|
|
extern "C" {
|
|
#include "db_int.h"
|
|
#include "db_page.h"
|
|
#include "db_shash.h"
|
|
#include "btree.h"
|
|
#include "hash.h"
|
|
#include "lock.h"
|
|
}
|
|
|
|
#include "WordContext.h"
|
|
#include "WordDBCompress.h"
|
|
|
|
void configure __P((char *));
|
|
int db_init __P((char *, int));
|
|
int dump __P((DB *, int, int));
|
|
int dump_sub __P((DB *, char *, int, int));
|
|
int is_sub __P((DB *, int *));
|
|
int main __P((int, char *[]));
|
|
void onint __P((int));
|
|
int pheader __P((DB *, char *, int, int));
|
|
int show_subs __P((DB *));
|
|
void siginit __P((void));
|
|
void usage __P((void));
|
|
|
|
DB_ENV *dbenv;
|
|
int interrupted;
|
|
const char
|
|
*progname = "htdb_dump"; /* Program name. */
|
|
|
|
int
|
|
main(int argc, char *argv[])
|
|
{
|
|
extern char *optarg;
|
|
extern int optind;
|
|
DB *dbp;
|
|
int ch, d_close;
|
|
int e_close, exitval, lflag, Nflag, pflag, ret, subs, keyflag;
|
|
char *dopt, *home, *subname;
|
|
int compress = 0;
|
|
int wordlist = 0;
|
|
u_int32_t cachesize = 0;
|
|
Configuration *config = 0;
|
|
|
|
dbp = NULL;
|
|
d_close = e_close = exitval = lflag = Nflag = pflag = 0;
|
|
keyflag = 0;
|
|
dopt = home = subname = NULL;
|
|
while ((ch = getopt(argc, argv, "d:f:h:klNps:C:zW")) != EOF)
|
|
switch (ch) {
|
|
case 'd':
|
|
dopt = optarg;
|
|
break;
|
|
case 'f':
|
|
if (freopen(optarg, "w", stdout) == NULL) {
|
|
fprintf(stderr, "%s: %s: reopen: %s\n",
|
|
progname, optarg, strerror(errno));
|
|
exit (1);
|
|
}
|
|
break;
|
|
case 'h':
|
|
home = optarg;
|
|
break;
|
|
case 'k':
|
|
keyflag = 1;
|
|
break;
|
|
case 'l':
|
|
lflag = 1;
|
|
break;
|
|
case 'N':
|
|
Nflag = 1;
|
|
break;
|
|
case 'p':
|
|
pflag = 1;
|
|
break;
|
|
case 's':
|
|
subname = optarg;
|
|
break;
|
|
case 'C':
|
|
cachesize = atoi(optarg);
|
|
break;
|
|
case 'z':
|
|
compress = DB_COMPRESS;
|
|
break;
|
|
case 'W':
|
|
wordlist = 1;
|
|
break;
|
|
case '?':
|
|
default:
|
|
usage();
|
|
}
|
|
argc -= optind;
|
|
argv += optind;
|
|
|
|
if (argc != 1)
|
|
usage();
|
|
|
|
if (dopt != NULL && pflag) {
|
|
fprintf(stderr,
|
|
"%s: the -d and -p options may not both be specified\n",
|
|
progname);
|
|
exit (1);
|
|
}
|
|
if (lflag && subname != NULL) {
|
|
fprintf(stderr,
|
|
"%s: the -l and -s options may not both be specified\n",
|
|
progname);
|
|
exit (1);
|
|
}
|
|
|
|
/* Handle possible interruptions. */
|
|
siginit();
|
|
|
|
if(wordlist && compress) {
|
|
static ConfigDefaults defaults[] = {
|
|
{ "wordlist_wordkey_description", "Word/DocID 32/Flag 8/Location 16"},
|
|
{ "wordlist_env_skip", "true"},
|
|
{ 0, 0, 0 }
|
|
};
|
|
config = WordContext::Initialize(defaults);
|
|
}
|
|
|
|
/*
|
|
* Create an environment object and initialize it for error
|
|
* reporting.
|
|
*/
|
|
if ((ret = CDB_db_env_create(&dbenv, 0)) != 0) {
|
|
fprintf(stderr,
|
|
"%s: CDB_db_env_create: %s\n", progname, CDB_db_strerror(ret));
|
|
exit (1);
|
|
}
|
|
|
|
e_close = 1;
|
|
dbenv->set_errfile(dbenv, stderr);
|
|
dbenv->set_errpfx(dbenv, progname);
|
|
if(compress && wordlist) dbenv->mp_cmpr_info = (new WordDBCompress)->CmprInfo();
|
|
|
|
/* Initialize the environment. */
|
|
if (db_init(home, Nflag) != 0)
|
|
goto err;
|
|
|
|
/* Create the DB object and open the file. */
|
|
if ((ret = CDB_db_create(&dbp, dbenv, 0)) != 0) {
|
|
dbenv->err(dbenv, ret, "CDB_db_create");
|
|
goto err;
|
|
}
|
|
if(cachesize > 0) dbp->set_cachesize(dbp, 0, cachesize, 1);
|
|
d_close = 1;
|
|
if ((ret = dbp->open(dbp,
|
|
argv[0], subname, DB_UNKNOWN, (DB_RDONLY | compress), 0)) != 0) {
|
|
dbp->err(dbp, ret, "open: %s", argv[0]);
|
|
goto err;
|
|
}
|
|
|
|
if (dopt != NULL) {
|
|
if (CDB___db_dump(dbp, dopt, NULL)) {
|
|
dbp->err(dbp, ret, "CDB___db_dump: %s", argv[0]);
|
|
goto err;
|
|
}
|
|
} else if (lflag) {
|
|
if (is_sub(dbp, &subs))
|
|
goto err;
|
|
if (subs == 0) {
|
|
dbp->errx(dbp,
|
|
"%s: does not contain subdatabases", argv[0]);
|
|
goto err;
|
|
}
|
|
if (show_subs(dbp))
|
|
goto err;
|
|
} else {
|
|
subs = 0;
|
|
if (subname == NULL && is_sub(dbp, &subs))
|
|
goto err;
|
|
if (subs) {
|
|
if (dump_sub(dbp, argv[0], pflag, keyflag))
|
|
goto err;
|
|
} else
|
|
if (pheader(dbp, NULL, pflag, keyflag)
|
|
|| dump(dbp, pflag, keyflag))
|
|
goto err;
|
|
}
|
|
|
|
if (0) {
|
|
err: exitval = 1;
|
|
}
|
|
if (d_close && (ret = dbp->close(dbp, 0)) != 0) {
|
|
exitval = 1;
|
|
dbp->err(dbp, ret, "close");
|
|
}
|
|
if (e_close && (ret = dbenv->close(dbenv, 0)) != 0) {
|
|
exitval = 1;
|
|
fprintf(stderr,
|
|
"%s: dbenv->close: %s\n", progname, CDB_db_strerror(ret));
|
|
}
|
|
|
|
if (interrupted) {
|
|
(void)signal(interrupted, SIG_DFL);
|
|
(void)raise(interrupted);
|
|
/* NOTREACHED */
|
|
}
|
|
|
|
if(config) {
|
|
WordContext::Finish();
|
|
delete config;
|
|
}
|
|
|
|
return (exitval);
|
|
}
|
|
|
|
/*
|
|
* db_init --
|
|
* Initialize the environment.
|
|
*/
|
|
int
|
|
db_init(char *home, int Nflag)
|
|
{
|
|
u_int32_t flags;
|
|
int ret;
|
|
|
|
/* Optionally turn mutexes off. */
|
|
if (Nflag) {
|
|
if ((ret = dbenv->set_mutexlocks(dbenv, 0)) != 0) {
|
|
dbenv->err(dbenv, ret, "set_mutexlocks");
|
|
return (1);
|
|
}
|
|
if ((ret = dbenv->set_panic(dbenv, 0)) != 0) {
|
|
dbenv->err(dbenv, ret, "set_panic");
|
|
return (1);
|
|
}
|
|
}
|
|
|
|
/*
|
|
* Try and use the shared memory pool region when dumping a database,
|
|
* so our information is as up-to-date as possible, even if the mpool
|
|
* cache hasn't been flushed.
|
|
*/
|
|
flags = DB_USE_ENVIRON | DB_INIT_MPOOL | DB_INIT_LOCK;
|
|
if (dbenv->open(dbenv, home, NULL, flags, 0) == 0)
|
|
return (0);
|
|
|
|
/*
|
|
* An environment is required because we may be trying to look at
|
|
* databases in directories other than the current one. We could
|
|
* avoid using an environment iff the -h option wasn't specified,
|
|
* but that seems like more work than it's worth.
|
|
*
|
|
* No environment exists (or, at least no environment that includes
|
|
* an mpool region exists). Create one, but make it private so that
|
|
* no files are actually created.
|
|
*/
|
|
LF_SET(DB_CREATE | DB_PRIVATE);
|
|
if ((ret = dbenv->open(dbenv, home, NULL, flags, 0)) == 0)
|
|
return (0);
|
|
|
|
/* An environment is required. */
|
|
dbenv->err(dbenv, ret, "open");
|
|
return (1);
|
|
}
|
|
|
|
/*
|
|
* pheader --
|
|
* Write out the header information.
|
|
*/
|
|
int
|
|
pheader(DB *dbp, char *subname, int pflag, int keyflag)
|
|
{
|
|
DB_BTREE_STAT *btsp;
|
|
DB_HASH_STAT *hsp;
|
|
DB_QUEUE_STAT *qsp;
|
|
int ret;
|
|
|
|
printf("VERSION=2\n");
|
|
printf("format=%s\n", pflag ? "print" : "bytevalue");
|
|
if (subname != NULL)
|
|
printf("subdatabase=%s\n", subname);
|
|
switch (dbp->type) {
|
|
case DB_BTREE:
|
|
printf("type=btree\n");
|
|
if ((ret = dbp->stat(dbp, &btsp, NULL, 0)) != 0) {
|
|
dbp->err(dbp, ret, "DB->stat");
|
|
return (1);
|
|
}
|
|
if (F_ISSET(dbp, BTM_RECNUM))
|
|
printf("recnum=1\n");
|
|
if (btsp->bt_maxkey != 0)
|
|
printf("bt_maxkey=%lu\n", (u_long)btsp->bt_maxkey);
|
|
if (btsp->bt_minkey != 0 && btsp->bt_minkey != DEFMINKEYPAGE)
|
|
printf("bt_minkey=%lu\n", (u_long)btsp->bt_minkey);
|
|
break;
|
|
case DB_HASH:
|
|
printf("type=hash\n");
|
|
if ((ret = dbp->stat(dbp, &hsp, NULL, 0)) != 0) {
|
|
dbp->err(dbp, ret, "DB->stat");
|
|
return (1);
|
|
}
|
|
if (hsp->hash_ffactor != 0)
|
|
printf("h_ffactor=%lu\n", (u_long)hsp->hash_ffactor);
|
|
if (hsp->hash_nelem != 0 || hsp->hash_nrecs != 0)
|
|
printf("h_nelem=%lu\n",
|
|
hsp->hash_nelem > hsp->hash_nrecs ?
|
|
(u_long)hsp->hash_nelem : (u_long)hsp->hash_nrecs);
|
|
break;
|
|
case DB_QUEUE:
|
|
printf("type=queue\n");
|
|
if ((ret = dbp->stat(dbp, &qsp, NULL, 0)) != 0) {
|
|
dbp->err(dbp, ret, "DB->stat");
|
|
return (1);
|
|
}
|
|
printf("re_len=%lu\n", (u_long)qsp->qs_re_len);
|
|
if (qsp->qs_re_pad != 0 && qsp->qs_re_pad != ' ')
|
|
printf("re_pad=%#x\n", qsp->qs_re_pad);
|
|
break;
|
|
case DB_RECNO:
|
|
printf("type=recno\n");
|
|
if ((ret = dbp->stat(dbp, &btsp, NULL, 0)) != 0) {
|
|
dbp->err(dbp, ret, "DB->stat");
|
|
return (1);
|
|
}
|
|
if (F_ISSET(dbp, BTM_RENUMBER))
|
|
printf("renumber=1\n");
|
|
if (F_ISSET(dbp, BTM_FIXEDLEN))
|
|
printf("re_len=%lu\n", (u_long)btsp->bt_re_len);
|
|
if (btsp->bt_re_pad != 0 && btsp->bt_re_pad != ' ')
|
|
printf("re_pad=%#x\n", btsp->bt_re_pad);
|
|
break;
|
|
case DB_UNKNOWN:
|
|
abort(); /* Impossible. */
|
|
/* NOTREACHED */
|
|
}
|
|
|
|
if (F_ISSET(dbp, DB_AM_DUP))
|
|
printf("duplicates=1\n");
|
|
|
|
if (!F_ISSET(dbp, DB_AM_PGDEF))
|
|
printf("db_pagesize=%lu\n", (u_long)dbp->pgsize);
|
|
|
|
if (keyflag)
|
|
printf("keys=1\n");
|
|
|
|
printf("HEADER=END\n");
|
|
return (0);
|
|
}
|
|
|
|
/*
|
|
* is_sub --
|
|
* Return if the database contains subdatabases.
|
|
*/
|
|
int
|
|
is_sub(DB *dbp, int *yesno)
|
|
{
|
|
DB_BTREE_STAT *btsp;
|
|
DB_HASH_STAT *hsp;
|
|
int ret;
|
|
|
|
switch (dbp->type) {
|
|
case DB_BTREE:
|
|
case DB_RECNO:
|
|
if ((ret = dbp->stat(dbp, &btsp, NULL, 0)) != 0) {
|
|
dbp->err(dbp, ret, "DB->stat");
|
|
break;
|
|
}
|
|
*yesno = btsp->bt_metaflags & BTM_SUBDB ? 1 : 0;
|
|
free(btsp);
|
|
break;
|
|
case DB_HASH:
|
|
if ((ret = dbp->stat(dbp, &hsp, NULL, 0)) != 0) {
|
|
dbp->err(dbp, ret, "DB->stat");
|
|
break;
|
|
}
|
|
*yesno = hsp->hash_metaflags & DB_HASH_SUBDB ? 1 : 0;
|
|
free(hsp);
|
|
break;
|
|
case DB_QUEUE:
|
|
return (0);
|
|
default:
|
|
abort();
|
|
/* NOTREACHED */
|
|
}
|
|
return (ret);
|
|
}
|
|
|
|
/*
|
|
* dump_sub --
|
|
* Dump out the records for a DB containing subdatabases.
|
|
*/
|
|
int
|
|
dump_sub(DB *parent_dbp, char *parent_name, int pflag, int keyflag)
|
|
{
|
|
DB *dbp;
|
|
DBC *dbcp;
|
|
DBT key, data;
|
|
int ret;
|
|
char *subdb;
|
|
|
|
/*
|
|
* Get a cursor and step through the database, dumping out each
|
|
* subdatabase.
|
|
*/
|
|
if ((ret = parent_dbp->cursor(parent_dbp, NULL, &dbcp, 0)) != 0) {
|
|
dbenv->err(dbenv, ret, "DB->cursor");
|
|
return (1);
|
|
}
|
|
|
|
memset(&key, 0, sizeof(key));
|
|
memset(&data, 0, sizeof(data));
|
|
while ((ret = dbcp->c_get(dbcp, &key, &data, DB_NEXT)) == 0) {
|
|
/* Nul terminate the subdatabase name. */
|
|
if ((subdb = (char*)malloc(key.size + 1)) == NULL) {
|
|
dbenv->err(dbenv, ENOMEM, NULL);
|
|
return (1);
|
|
}
|
|
memcpy(subdb, key.data, key.size);
|
|
subdb[key.size] = '\0';
|
|
|
|
/* Create the DB object and open the file. */
|
|
if ((ret = CDB_db_create(&dbp, dbenv, 0)) != 0) {
|
|
dbenv->err(dbenv, ret, "CDB_db_create");
|
|
free(subdb);
|
|
return (1);
|
|
}
|
|
if ((ret = dbp->open(dbp,
|
|
parent_name, subdb, DB_UNKNOWN, DB_RDONLY, 0)) != 0)
|
|
dbp->err(dbp, ret,
|
|
"DB->open: %s:%s", parent_name, subdb);
|
|
if (ret == 0 &&
|
|
(pheader(dbp, subdb, pflag, keyflag) ||
|
|
dump(dbp, pflag, keyflag)))
|
|
ret = 1;
|
|
(void)dbp->close(dbp, 0);
|
|
free(subdb);
|
|
if (ret != 0)
|
|
return (1);
|
|
}
|
|
if (ret != DB_NOTFOUND) {
|
|
dbp->err(dbp, ret, "DBcursor->get");
|
|
return (1);
|
|
}
|
|
|
|
if ((ret = dbcp->c_close(dbcp)) != 0) {
|
|
dbp->err(dbp, ret, "DBcursor->close");
|
|
return (1);
|
|
}
|
|
|
|
return (0);
|
|
}
|
|
|
|
/*
|
|
* show_subs --
|
|
* Display the subdatabases for a database.
|
|
*/
|
|
int
|
|
show_subs(DB *dbp)
|
|
{
|
|
DBC *dbcp;
|
|
DBT key, data;
|
|
int ret;
|
|
|
|
/*
|
|
* Get a cursor and step through the database, printing out the key
|
|
* of each key/data pair.
|
|
*/
|
|
if ((ret = dbp->cursor(dbp, NULL, &dbcp, 0)) != 0) {
|
|
dbp->err(dbp, ret, "DB->cursor");
|
|
return (1);
|
|
}
|
|
|
|
memset(&key, 0, sizeof(key));
|
|
memset(&data, 0, sizeof(data));
|
|
while ((ret = dbcp->c_get(dbcp, &key, &data, DB_NEXT)) == 0) {
|
|
if ((ret = CDB___db_prdbt(&key, 1, NULL, stdout, 0)) != 0) {
|
|
dbp->errx(dbp, NULL);
|
|
return (1);
|
|
}
|
|
}
|
|
if (ret != DB_NOTFOUND) {
|
|
dbp->err(dbp, ret, "DBcursor->get");
|
|
return (1);
|
|
}
|
|
|
|
if ((ret = dbcp->c_close(dbcp)) != 0) {
|
|
dbp->err(dbp, ret, "DBcursor->close");
|
|
return (1);
|
|
}
|
|
return (0);
|
|
}
|
|
|
|
/*
|
|
* dump --
|
|
* Dump out the records for a DB.
|
|
*/
|
|
int
|
|
dump(DB *dbp, int pflag, int keyflag)
|
|
{
|
|
DBC *dbcp;
|
|
DBT key, data;
|
|
int ret, is_recno;
|
|
|
|
/*
|
|
* Get a cursor and step through the database, printing out each
|
|
* key/data pair.
|
|
*/
|
|
if ((ret = dbp->cursor(dbp, NULL, &dbcp, 0)) != 0) {
|
|
dbp->err(dbp, ret, "DB->cursor");
|
|
return (1);
|
|
}
|
|
|
|
memset(&key, 0, sizeof(key));
|
|
memset(&data, 0, sizeof(data));
|
|
is_recno = (dbp->type == DB_RECNO || dbp->type == DB_QUEUE);
|
|
keyflag = is_recno ? keyflag : 1;
|
|
while ((ret = dbcp->c_get(dbcp, &key, &data, DB_NEXT)) == 0)
|
|
if ((keyflag && (ret =
|
|
CDB___db_prdbt(&key, pflag, " ", stdout, is_recno)) != 0) ||
|
|
(ret = CDB___db_prdbt(&data, pflag, " ", stdout, 0)) != 0) {
|
|
dbp->errx(dbp, NULL);
|
|
return (1);
|
|
}
|
|
if (ret != DB_NOTFOUND) {
|
|
dbp->err(dbp, ret, "DBcursor->get");
|
|
return (1);
|
|
}
|
|
|
|
if ((ret = dbcp->c_close(dbcp)) != 0) {
|
|
dbp->err(dbp, ret, "DBcursor->close");
|
|
return (1);
|
|
}
|
|
|
|
printf("DATA=END\n");
|
|
return (0);
|
|
}
|
|
|
|
/*
|
|
* siginit --
|
|
* Initialize the set of signals for which we want to clean up.
|
|
* Generally, we try not to leave the shared regions locked if
|
|
* we can.
|
|
*/
|
|
void
|
|
siginit()
|
|
{
|
|
#ifdef SIGHUP
|
|
(void)signal(SIGHUP, onint);
|
|
#endif
|
|
(void)signal(SIGINT, onint);
|
|
#ifdef SIGPIPE
|
|
(void)signal(SIGPIPE, onint);
|
|
#endif
|
|
(void)signal(SIGTERM, onint);
|
|
}
|
|
|
|
/*
|
|
* onint --
|
|
* Interrupt signal handler.
|
|
*/
|
|
void
|
|
onint(int signo)
|
|
{
|
|
if ((interrupted = signo) == 0)
|
|
interrupted = SIGINT;
|
|
}
|
|
|
|
/*
 * usage --
 *	Print the usage message on stderr and exit with status 1.
 */
void
usage()
{
	static const char message[] =
	    "usage: htdb_dump [-klNpWz] [-C cachesize] [-d ahr] [-f file] [-h home] [-s subdb] db_file\n";

	(void)fputs(message, stderr);
	exit(1);
}
|