#! /bin/sh # rundig.sh # a script to drive ht://Dig updates # Copyright (c) 1998 Colin Viebrock # Copyright (c) 1998-1999 Geoff Hutchison # Updated for ht://Dig 3.2.0b3 Feb 2001, Copyright (c) 2001 Geoff Hutchison # Distributed under the GNU GPL version 2 or later if [ "$1" = "-v" ]; then verbose="-v" fi # This is the directory where htdig lives BASEDIR=/export/htdig # This is the db dir DBDIR=$BASEDIR/db/ # This is the name of a temporary report file REPORT=/tmp/htdig.report # This is who gets the report REPORT_DEST="webmaster@yourdomain.com" export REPORT_DEST # This is the subject line of the report SUBJECT="cron: htdig report for domain" # This is the name of the conf file to use CONF=htdig.conf # This is the directory htdig will use for temporary sort files TMPDIR=$DBDIR export TMPDIR # This is the PATH used by this script. Change it if you have problems # with not finding wc or grep. PATH=/usr/local/bin:/usr/bin:/bin ##### Dig phase STARTTIME=`date` echo Start time: $STARTTIME echo rundig: Start time: $STARTTIME > $REPORT $BASEDIR/bin/htdig $verbose -s -a -c $BASEDIR/conf/$CONF >> $REPORT TIME=`date` echo Done Digging: $TIME echo rundig: Done Digging: $TIME >> $REPORT ##### Purge Phase # (clean out broken links, etc.) $BASEDIR/bin/htpurge $verbose -a -c $BASEDIR/conf/$CONF >> $REPORT TIME=`date` echo Done Purging: $TIME echo rundig: Done Purging: $TIME >> $REPORT ##### Cleanup Phase # To enable htnotify or the soundex search, uncomment the following lines # $BASEDIR/bin/htnotify $verbose >>$REPORT # $BASEDIR/bin/htfuzzy $verbose soundex # To get additional statistics, uncomment the following line # $BASEDIR/bin/htstat $verbose >>$REPORT # Move 'em into place. Since these are only used by htdig for update digs # and we always use -a, we just leave them as .work # mv $DBDIR/db.docs.index.work $DBDIR/db.docs.index # (this is just a mapping from a URL to a DocID) # We need the .work for next time as an update dig, plus the copy for searching cp $DBDIR/db.docdb.work $DBDIR/db.docdb cp $DBDIR/db.excerpts.work $DBDIR/db.excerpts cp $DBDIR/db.words.db.work $DBDIR/db.words.db test -f $DBDIR/db.words.db.work_weakcmpr && cp $DBDIR/db.words.db.work_weakcmpr $DBDIR/db.words.db_weakcmpr END=`date` echo End time: $END echo rundig: End time: $END >> $REPORT echo # Grab the important statistics from the report file # All lines begin with htdig: or htmerge: fgrep "htdig:" $REPORT echo fgrep "htmerge:" $REPORT echo fgrep "rundig:" $REPORT echo WC=`wc -l $REPORT` echo Total lines in $REPORT: $WC # Send out the report ... mail -s "$SUBJECT - $STARTTIME" $REPORT_DEST < $REPORT # ... and clean up rm $REPORT