Bogofilter FAQ

insicura · sa

    bogofilter -s < spam.mbox
    bogofilter -n < ham.mbox
    bogominitrain.pl -fnv ~/.bogofilter ham.mbox spam.mbox '-o 0.9,0.3'
    randomtrain -s spam.mbox -n ham.mbox
    #! /bin/sh
    #  class3 -- classify one message as bad, good or unsure
    #
    #  Reads a single message on stdin, runs bogofilter on it with the
    #  options given on the command line, and appends the message to
    #  corpus.bad, corpus.good or corpus.unsure in the current directory
    #  when bogofilter exits with status 0, 1 or 2 respectively.  Any other
    #  exit status leaves the corpus files untouched.
    msg=msg.$$
    cat >"$msg"
    # "$@" rather than $*: every option reaches bogofilter as exactly the
    # word the caller supplied, even if it contains whitespace.
    bogofilter "$@" <"$msg"
    case $? in
	0) cat "$msg" >>corpus.bad ;;
	1) cat "$msg" >>corpus.good ;;
	2) cat "$msg" >>corpus.unsure ;;
    esac
    rm "$msg"
    #! /bin/sh
    # classify -- put all messages in mbox through class3
    #
    # Usage: classify MBOX [bogofilter options]
    #
    # The first argument is the mbox file to read; every remaining argument
    # is handed on to class3 unchanged.
    src=$1
    shift
    # Quote both expansions so that an mbox path or an option containing
    # whitespace or glob characters is not split or expanded by the shell.
    formail -s class3 "$@" <"$src"
    classify spam.mbox [bogofilter options]
    bogofilter -s < corpus.good
    rm -f corpus.*
    classify ham.mbox [bogofilter options]
    bogofilter -n < corpus.bad
    rm -f corpus.*
    mailtool copy /percorso/completo/di/mail.mbox '#driver.unix//percorso/completo/di//mbox'
    # Append every file found in the maildir directory to a single mbox file,
    # passing each message through formail on the way.
    for MSG in /full/path/to/maildir/* ; do 
	    formail -I Status: < "$MSG" >> /full/path/to/mbox
    done
    X-Bogosity: Ham, tests=bogofilter, spamicity=0.500000
    X-Bogosity: Ham, tests=bogofilter, spamicity=0.500000
      int  cnt    prob   spamicity  histogram
     0.00   29  0.000209  0.000052  #############################
     0.10    2  0.179065  0.003425  ##
     0.20    2  0.276880  0.008870  ##
     0.30   18  0.363295  0.069245  ##################
     0.40    0  0.000000  0.069245
     0.50    0  0.000000  0.069245
     0.60   37  0.667823  0.257307  #####################################
     0.70    5  0.767436  0.278892  #####
     0.80   13  0.836789  0.334980  #############
     0.90   32  0.984903  0.499835  ################################
    X-Bogosity: Ham, tests=bogofilter, spamicity=0.500000
			      n    pgood     pbad      fw     U
    "which"              10  0.208333  0.000000  0.000041 +
    "own"                 7  0.145833  0.000000  0.000059 +
    "having"              6  0.125000  0.000000  0.000069 +
    ...
    "unsubscribe.asp"     2  0.000000  0.095238  0.999708 +
    "million"             4  0.000000  0.190476  0.999854 +
    "copy"                5  0.000000  0.238095  0.999883 +
    N_P_Q_S_s_x_md      138  0.00e+00  0.00e+00  5.00e-01
			     1.00e-03  4.15e-01  0.100
    #### CUTOFF Values
    #
    #    both ham_cutoff and spam_cutoff are allowed.
    #    setting ham_cutoff to a non-zero value will
    #    enable tri-state results (Spam/Ham/Unsure).
    #
    #ham_cutoff  = 0.45
    #spam_cutoff = 0.99
    #
    #    for two-state classification:
    #
    ## ham_cutoff = 0.00
    ## spam_cutoff= 0.99
    ## spamicity_tags = Yes, No, Unsure
    Se l'intestazione contiene "X-Bogosity: Spam", metti il messaggio nella cartella Spam
    Se l'intestazione contiene "X-Bogosity: Unsure", metti il messaggio nella cartella Incerti
    #### SPAM_SUBJECT_TAG
    #
    #    dicitura aggiunta alla linea "Oggetto:" per identificare spam o gli incerti
    #    l'impostazione predefinita non aggiunge nulla
    #
    ##spam_subject_tag=***SPAM***
    ##unsure_subject_tag=???UNSURE???
    Se l'oggetto contiene "***SPAM***" metti il messaggio nella cartella Spam
    Se l'oggetto contiene "???UNSURE???" metti il messaggio nella cartella Incerti
    BOGOFILTER     = "/usr/bin/bogofilter"
    BOGOFILTER_DIR = "training"
    SPAMASSASSIN  = "/usr/bin/spamassassin"

    :0 HBc
    * ? $SPAMASSASSIN -e
    #spam yields non-zero
    #non-spam yields zero
    | $BOGOFILTER -n -d $BOGOFILTER_DIR
    #else (E)
    :0Ec
    | $BOGOFILTER -s -d $BOGOFILTER_DIR

    :0fw
    | $BOGOFILTER -p -e

    :0:
    * ^X-Bogosity:.Spam
    spam

    :0:
    * ^X-Bogosity:.Ham
    non-spam
    ## Silently drop all Asian language mail
    UNREADABLE='[^?"]*big5|iso-2022-jp|ISO-2022-KR|euc-kr|gb2312|ks_c_5601-1987'
    :0:
    * 1^0 $ ^Subject:.*=\?($UNREADABLE)
    * 1^0 $ ^Content-Type:.*charset="?($UNREADABLE)
    spam-unreadable

    :0:
    * ^Content-Type:.*multipart
    * B ?? $ ^Content-Type:.*^?.*charset="?($UNREADABLE)
    spam-unreadable
    bf_compact ~/.bogofilter wordlist.db
    cd ~/.bogofilter
    bogoutil -d wordlist.db | bogoutil -l wordlist.db.new
    mv wordlist.db wordlist.db.prv
    mv wordlist.db.new wordlist.db
    wordlist R,user,~/wordlist.db,1
    wordlist R,system,/var/spool/bogofilter/wordlist.db,1
    wordlist R,user,~/wordlist.db,2
    wordlist R,system,/var/spool/bogofilter/wordlist.db,3
    wordlist R,user,~/wordlist.db,5
    wordlist R,system,/var/spool/bogofilter/wordlist.db,4
 wordlist I,ignore,~/ignorelist.db,7
      wordlist R,system,/var/spool/bogofilter/wordlist.db,8
  echo ignore.me | bogoutil -l ~/ignorelist.db
    db_verify wordlist.db
    bogoutil -d wordlist.db | bogoutil -l wordlist.new.db
    db_dump -r wordlist.db > wordlist.txt
    db_load wordlist.new.db < wordlist.txt
    bogoutil -d wordlist.db > wordlist.txt
    bogoutil -l wordlist.db.new < wordlist.txt
    bogoutil -d wordlist.db > wordlist.raw.txt
    iconv -f iso-8859-1 -t utf-8 < wordlist.raw.txt > wordlist.utf8.txt
    bogoutil -l wordlist.db.new < wordlist.utf8.txt
    bogoutil --unicode=yes -m wordlist.db
    bogoutil -d wordlist.db > wordlist.utf8.txt
    iconv -f utf-8  -t iso-8859-1 < wordlist.utf8.txt > wordlist.raw.txt
    bogoutil -l wordlist.db.new < wordlist.raw.txt
    bogoutil --unicode=no -m wordlist.db
    cd ~/.bogofilter
    bogoutil -d wordlist.db > wordlist.txt
    mv wordlist.db wordlist.db.old
    bogoutil --db-transaction=yes -l wordlist.db < wordlist.txt
    rm wordlist.db.old wordlist.txt
    cd ~/.bogofilter
    bogoutil -d wordlist.db > wordlist.txt
    mv wordlist.db wordlist.db.old
    rm -f log.?????????? __db.???
    bogoutil --db-transaction=no -l wordlist.db < wordlist.txt
 bogoutil --db-recover /your/bogofilter/directory
    ls -lh $BOGOFILTER_DIR/wordlist.db
    postconf | grep mailbox_size_limit
    postconf -e mailbox_size_limit=73000000
    bogoutil -d wordlist.db | \
    awk '{print $1 " " $2 " 0"}' | grep -v " 0 0" | \
    bogoutil -l wordlist.new.db
    bogoutil -d wordlist.db | \
    awk '{print $1 " 0 " $3}' | grep -v " 0 0" | \
    bogoutil -l wordlist.new.db
    $ cd build_unix
    $ sh ../dist/configure
    $ make
    # make install
    $ ./configure --with-libdb-prefix=/usr/local/BerkeleyDB.4.4
    $ make
    # make install-strip
    $ LD_LIBRARY_PATH=/usr/lib:/usr/local/lib:/usr/local/BerkeleyDB.4.4
    $ export LD_LIBRARY_PATH
    # pkg_add -r portupgrade
    # pkg_add -r portsnap
    # portupgrade -N bogofilter
    $ env CPPFLAGS=-I/usr/local/include/db3 LIBS=-ldb3 LDFLAGS=-L/usr/local/lib ./configure
    macro index S "|bogofilter -s\ns=junkmail"  "Ricorda come spam e cestinalo"
    macro pager S "|bogofilter -s\ns=junkmail"  "Ricorda come spam e cestinalo"
    macro index H "|bogofilter -n\ns="          "Ricorda come ham e salvalo"
    macro pager H "|bogofilter -n\ns="          "Ricorda come ham e salvalo"
    condition:
    * test "bogofilter < %F"
    action:
    * move "#mh/YOUR_SPAM_BOX"
    Mark as ham / spam:
    * bogofilter -n -v -B "%f" (mark ham)
    * bogofilter -s -v -B "%f" (mark spam)
    #!/bin/sh
    # Feed bogofilter every message file that has appeared in the listed
    # spam folders since the previous run of this script.
    #
    #   $CONFIGDIR/spamdirs     whitespace-separated list of folders to scan
    #   $CONFIGDIR/lastbogorun  marker file; only files newer than it are used
    CONFIGDIR=~/.bogofilter
    SPAMDIRS="$CONFIGDIR/spamdirs"
    MARKFILE="$CONFIGDIR/lastbogorun"
    # The command substitution is deliberately unquoted: each folder named in
    # $SPAMDIRS must become its own loop word.
    for D in $(cat "$SPAMDIRS"); do
	# '!' is the POSIX spelling of the non-standard '-not' primary.
	find "$D" -type f -newer "$MARKFILE" ! -name ".sylpheed*"
    done | bogofilter -bNsv
    # Move the marker forward so the next run skips what was just processed.
    touch "$MARKFILE"
    Condition:
	header "X-Bogosity" matchcase "Spam"
    Action:
	move "#mh/Mailbox/Spam"
    Condition:
	header "X-Bogosity" matchcase "Unsure"
    Action:
	move "#mh/Mailbox/Unsure"
    Register Spam:
	bogofilter -s < "%f"

    Register Ham:
	bogofilter -n < "%f"

    Unregister Spam:
	bogofilter -S < "%f"

    Unregister Ham:
	bogofilter -N < "%f"
    BogoTest -vv:
	bogofilter -vv < "%f"

    BogoTest -vvv:
	bogofilter -vvv < "%f"
;; load bogofilter capabilities (spam)
;;
(require 'vm-bogofilter)

;; short-key for bogofilter
;; K (shift-k) marks the message as spam
;; C (shift-c) marks the message as clean (ham)
(define-key vm-mode-map "K" 'vm-bogofilter-is-spam)
(define-key vm-mode-map "C" 'vm-bogofilter-is-clean)

Bogofilter FAQ

Convenzioni tipografiche

Domande poste frequentemente e loro risposte

Che cos'è bogofilter?

Bogo-che?

Come funziona bogofilter?

Liste di discussione

Come avvio l'apprendimento di bogofilter?

Confronto tra i metodi

Come posso mantenere alta l'accuratezza nell'assegnazione del punteggio?

Quali formati di posta sono supportati da bogofilter?

Cosa significa l'output verboso di bogofilter?

Che cos'è la modalità insicura?

Cosa sono l'"apprendimento dagli errori" e l'"apprendimento per esaurimento"?

Cosa fa l'opzione '-u' (autoaggiornamento)?

Come posso utilizzare SpamAssassin per istruire bogofilter?

Cosa posso fare contro lo spam asiatico?

Come posso compattare il database?

Come si fa una ricerca manuale sul database?

Posso usare liste di termini multiple?

Posso dire a bogofilter di ignorare certi termini?

Come faccio ad aggiornare da un database di termini separati al formato con liste di termini combinate?

Come faccio a capire se le mie liste di termini sono corrotte?

Come converto la mia lista di termini in/da unicode?

Come passo dalla modalità non-transaction a quella transaction?

Come passo dalla modalità transaction a quella non-transaction?

Perché bogofilter muore dopo aver stampato "Lock table is out of available locks" oppure "Lock table is out of available object entries"?

Perché ottengo messaggi DB_PAGE_NOTFOUND?

Perché ottengo "Berkeley DB library configured to support only DB_PRIVATE environments" o "Berkeley DB library configured to support only private environments"?

Bogofilter può essere usato in un ambiente multiutente?

Posso condividere le liste di termini attraverso NFS?

Perché bogofilter restituisce codici come 0 e 256 quando viene lanciato dall'interno di un programma?

Ora che ho aggiornato perché si sono corrotti i miei script?

Ora che ho aggiornato perché bogofilter sta lavorando peggio?

Come posso eliminare tutti i token dello spam (o quelli non-spam)?

Come faccio a far funzionare bogofilter su Solaris, BSD, ecc?

Su Solaris

Su FreeBSD

Su NetBSD e altri sistemi che usano "pkgsrc"

Su HP-UX

Posso usare il comando make sul mio sistema operativo?

Come compilo bogofilter come utente non-root per installarlo in una directory non standard?

Come compilo bogofilter con le patch?

Come rendo gli eseguibili più piccoli?

datastore_db.c non compila!

Con quali programmi di posta funziona bogofilter?

Come uso bogofilter con mutt?

Come uso bogofilter con Sylpheed Claws?

Come uso bogofilter con VM (uno strumento di Emacs per la posta)?

Come uso bogofilter con MH-E (l'interfaccia Emacs al sistema di posta MH)?