]> git.donarmstrong.com Git - bin.git/blob - learn_from_spam
abstract out run through spam
[bin.git] / learn_from_spam
1 #!/bin/bash
2
3 # these are for non-spamc setups
4 SPAM_REPORT="spamassassin --report"
5 HAM_REPORT="spamassassin --revoke"
6 SPAM_CHECK="spamassassin -e"
7
8 # these are for spamc
9 SPAM_REPORT="spamc --learntype=spam -s $((100 * 1024 * 1024))"
10 HAM_REPORT="spamc --learntype=ham -s $((100 * 1024 * 1024))"
11 SPAM_CHECK="spamc -s $((100 * 1024 * 1024)) -c"
12
13 # needs rules directories
14 NEEDS_SPAM_RULES="$(echo ~/Maildir/spam/needs_rules)"
15 NEEDS_HAM_RULES="$(echo ~/Maildir/spam/needs_ham_rules)"
16
17 run_through_spamc () {
18     # destdir
19     DESTDIR="$1"
20     FILENAME="$2"
21     mkdir -p "$1"
22     TMP="$(mktemp -d)"
23     DESTFILE="$DESTDIR/$(basename "$FILENAME")"
24     DESTFILE_NO_SIZE="$DESTDIR/$(basename "$FILENAME"|sed 's/,S=.*//g')"
25     spamc -s $((100 * 1024 * 1024)) < "$FILENAME" > "$TMP/file" 2>/dev/null;
26     mv "$TMP/file" "DESTFILE"
27     mv "$DESTFILE" "$DESTFILE_NO_SIZE"
28     trap - EXIT;
29     rmdir "$TMP";
30 }
31
32 if [ "$(basename $0)" = "learn_from_spam" ]; then
33     for file in "$@"; do
34         if ! formail -c < "$file"|grep -q '^List-Id'; then
35             $SPAM_REPORT < "$file" >/dev/null 2>&1;
36         else
37             spamasssin --local --report < "$file" >/dev/null 2>&1;
38         fi
39         formail -c < "$file" | grep -e '^From ' -e 'From: ' | spamassassin --add-to-blacklist >/dev/null 2>&1;
40         formail -c < "$file" | grep -e '^From ' -e 'From: ' | spamassassin --remove-from-whitelist >/dev/null 2>&1;
41         # check to see if it's still ham
42         if $SPAM_CHECK < "$file" >/dev/null 2>&1; then
43             run_through_spamc "${NEEDS_SPAM_RULES}/cur" "$file";
44         elif [ "$(pwd)" = "${NEEDS_SPAM_RULES}" ]; then
45             rm -f "$file";
46         fi;
47     done;
48 elif [ "$(basename $0)" = "learn_from_ham" ]; then
49     for file in "$@"; do
50         $HAM_REPORT < "$file" >/dev/null 2>&1;
51         formail -c < "$file" |grep -e '^From ' -e 'From: ' -e 'To: ' -e 'Cc: '|spamassassin --add-to-whitelist >/dev/null 2>&1;
52         if ! $SPAM_CHECK < "$file" >/dev/null 2>&1; then
53             run_through_spamc "${NEEDS_HAM_RULES}/cur" "$file";
54         elif [ "$(pwd)" = "${NEEDS_HAM_RULES}" ]; then
55             rm -f "$file";
56         fi;
57     done;
58 else
59     "Called in a way this script cannot recognize";
60 fi;