You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
97 lines
2.7 KiB
97 lines
2.7 KiB
#! /bin/sh
|
|
|
|
# rundig.sh
|
|
# a script to drive ht://Dig updates
|
|
# Copyright (c) 1998 Colin Viebrock <cmv@shmooze.net>
|
|
# Copyright (c) 1998-1999 Geoff Hutchison <ghutchis@wso.williams.edu>
|
|
# Updated for ht://Dig 3.2.0b3 Feb 2001, Copyright (c) 2001 Geoff Hutchison
|
|
# Distributed under the GNU GPL version 2 or later
|
|
|
|
if [ "$1" = "-v" ]; then
|
|
verbose="-v"
|
|
fi
|
|
|
|
# This is the directory where htdig lives
|
|
BASEDIR=/export/htdig
|
|
|
|
# This is the db dir
|
|
DBDIR=$BASEDIR/db/
|
|
|
|
# This is the name of a temporary report file
|
|
REPORT=/tmp/htdig.report
|
|
|
|
# This is who gets the report
|
|
REPORT_DEST="webmaster@yourdomain.com"
|
|
export REPORT_DEST
|
|
|
|
# This is the subject line of the report
|
|
SUBJECT="cron: htdig report for domain"
|
|
|
|
# This is the name of the conf file to use
|
|
CONF=htdig.conf
|
|
|
|
# This is the directory htdig will use for temporary sort files
|
|
TMPDIR=$DBDIR
|
|
export TMPDIR
|
|
|
|
# This is the PATH used by this script. Change it if you have problems
|
|
# with not finding wc or grep.
|
|
PATH=/usr/local/bin:/usr/bin:/bin
|
|
|
|
##### Dig phase
|
|
STARTTIME=`date`
|
|
echo Start time: $STARTTIME
|
|
echo rundig: Start time: $STARTTIME > $REPORT
|
|
$BASEDIR/bin/htdig $verbose -s -a -c $BASEDIR/conf/$CONF >> $REPORT
|
|
TIME=`date`
|
|
echo Done Digging: $TIME
|
|
echo rundig: Done Digging: $TIME >> $REPORT
|
|
|
|
##### Purge Phase
|
|
# (clean out broken links, etc.)
|
|
$BASEDIR/bin/htpurge $verbose -a -c $BASEDIR/conf/$CONF >> $REPORT
|
|
TIME=`date`
|
|
echo Done Purging: $TIME
|
|
echo rundig: Done Purging: $TIME >> $REPORT
|
|
|
|
##### Cleanup Phase
|
|
# To enable htnotify or the soundex search, uncomment the following lines
|
|
# $BASEDIR/bin/htnotify $verbose >>$REPORT
|
|
# $BASEDIR/bin/htfuzzy $verbose soundex
|
|
# To get additional statistics, uncomment the following line
|
|
# $BASEDIR/bin/htstat $verbose >>$REPORT
|
|
|
|
# Move 'em into place. Since these are only used by htdig for update digs
|
|
# and we always use -a, we just leave them as .work
|
|
# mv $DBDIR/db.docs.index.work $DBDIR/db.docs.index
|
|
# (this is just a mapping from a URL to a DocID)
|
|
# We need the .work for next time as an update dig, plus the copy for searching
|
|
cp $DBDIR/db.docdb.work $DBDIR/db.docdb
|
|
cp $DBDIR/db.excerpts.work $DBDIR/db.excerpts
|
|
cp $DBDIR/db.words.db.work $DBDIR/db.words.db
|
|
test -f $DBDIR/db.words.db.work_weakcmpr &&
|
|
cp $DBDIR/db.words.db.work_weakcmpr $DBDIR/db.words.db_weakcmpr
|
|
|
|
END=`date`
|
|
echo End time: $END
|
|
echo rundig: End time: $END >> $REPORT
|
|
echo
|
|
|
|
# Grab the important statistics from the report file
|
|
# All lines begin with htdig: or htmerge:
|
|
fgrep "htdig:" $REPORT
|
|
echo
|
|
fgrep "htmerge:" $REPORT
|
|
echo
|
|
fgrep "rundig:" $REPORT
|
|
echo
|
|
|
|
WC=`wc -l $REPORT`
|
|
echo Total lines in $REPORT: $WC
|
|
|
|
# Send out the report ...
|
|
mail -s "$SUBJECT - $STARTTIME" $REPORT_DEST < $REPORT
|
|
|
|
# ... and clean up
|
|
rm $REPORT
|