X-Git-Url: https://git.donarmstrong.com/?a=blobdiff_plain;f=bin%2Fdebbugs-spam;h=ba026da4547af6a1ac3b79d07df1e9af9c5b940f;hb=64267ddd252ea24e5aeb4bb999a22a1b1f0f2d85;hp=d3cb29d9d872ce3fbff3e0ed88437283a4f304c7;hpb=813e992044d2be62428d9288751ba599ebfa4a46;p=debbugs.git

diff --git a/bin/debbugs-spam b/bin/debbugs-spam
index d3cb29d..ba026da 100755
--- a/bin/debbugs-spam
+++ b/bin/debbugs-spam
@@ -78,11 +78,25 @@ id
 Mark messages as ham if there is a regex match to subject or message
 id
 
+=item B<learn>
+
+Learn from messages which are ham/spam
+
 =back
 
 
 =head1 EXAMPLES
 
+Start spamd:
+
+    /usr/sbin/spamd --socketpath=/home/debbugs/spamd_socket \
+        --nouser-config --cf='include /home/debbugs/.spamassassin/user_prefs' \
+        --cf='allow_user_rules 1' --allow-tell;
+
+Then score bugs:
+
+    debbugs-spam --spamc-opts '-U' --spamc-opts '/home/debbugs/spamd_socket' \
+        score 859123;
 
 =cut
 
@@ -130,6 +144,8 @@ my %subcommands =
      },
      'mark-ham' => {function => \&mark_ham,
      },
+     'learn' => {function => \&learn,
+     },
      'help' => {function => sub {pod2usage({verbose => 2});}}
     );
 
@@ -192,11 +208,52 @@ sub mark_it {
                        if ($mid =~ /\Q$regex\E/) {
                            $is_match = 1;
                        }
-                       if ($spam_ham eq 'spam') {
-                           $spam->add_spam($mid);
+                       if ($is_match) {
+                           print STDERR "it's a match" if $DEBUG;
+                           if ($spam_ham eq 'spam') {
+                               $spam->add_spam($mid);
+                           } else {
+                               $spam->add_ham($mid);
+                           }
+                       }
+                   },
+                   $bug_num
+                  );
+        $spam->save();
+    }
+}
+
+# Teach the spam filter from messages already classified in each bug's
+# spam log: spam_score() is run with spamc's '-L spam' or '-L ham'
+# appended to the configured spamc options; unmarked messages are skipped.
+sub learn {
+    my ($options,$opts,$config,$argv) = @_;
+    for my $bug_num (@{$argv}) {
+        my $spam = Debbugs::Log::Spam->new(bug_num => $bug_num) or
+            die "Unable to open bug log spam for $bug_num";
+        foreachmsg(sub {
+                       my ($bn,$rec,$mid) = @_;
+                       my $score;
+                       if ($spam->is_spam($mid)) {
+                           $score //=
+                               spam_score($rec,$options->{spamc},
+                                          [@{$options->{spamc_opts}},
+                                           '-L','spam'
+                                          ]
+                                         );
+                           print STDERR "learning spam" if $DEBUG;
+                       } elsif ($spam->is_ham($mid)) {
+                           $score //=
+                               spam_score($rec,$options->{spamc},
+                                          [@{$options->{spamc_opts}},
+                                           '-L','ham'
+                                          ]
+                                         );
+                           print STDERR "learning ham" if $DEBUG;
                        } else {
-                           $spam->add_ham($mid);
+                           print STDERR "not learning" if $DEBUG;
                        }
+                       print STDERR " from $mid" if $DEBUG;
                    },
                    $bug_num
                   );
@@ -344,17 +401,18 @@ sub foreachmsg {
         my ($msg_id) = record_regex($record,
                                     qr/^Message-Id:\s+<(.+)>/mi);
         next unless defined $msg_id;
+        print STDERR "examining $msg_id: " if $DEBUG;
         if ($msg_id =~ /$config{email_domain}$/) {
-            print STDERR "skipping $msg_id\n" if $DEBUG;
+            print STDERR "skipping\n" if $DEBUG;
             next;
         }
-        print STDERR "examining $msg_id: " if $DEBUG;
         if ($seen_msgids{$msg_id}) {
             print STDERR "already seen\n" if $DEBUG;
             next;
         }
         $seen_msgids{$msg_id}=1;
         $sub->($bug_num,$record,$msg_id);
+        print STDERR "\n" if $DEBUG;
     }
 }
 