46992a38834d45c3d4a3196285aa4ef2a451d375
[scripts.git] / gma.sh
1 #!/bin/bash
2
3 #########################################################################
4 # This program is free software: you can redistribute it and/or modify  #
5 # it under the terms of the version 3 of the GNU General Public License #
6 # as published by the Free Software Foundation.                         #
7 #                                                                       #
8 # This program is distributed in the hope that it will be useful, but   #
9 # WITHOUT ANY WARRANTY; without even the implied warranty of            #
10 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU      #
11 # General Public License for more details.                              #
12 #                                                                       #
13 # You should have received a copy of the GNU General Public License     #
14 # along with this program. If not, see <http://www.gnu.org/licenses/>.  #
15 #                                                                       #
16 # Written by and Copyright (C) Francois Fleuret                         #
17 # Contact <francois.fleuret@idiap.ch> for comments & bug reports        #
18 #########################################################################
19
20 set -e
21
22 function usage () {
23     echo "gma.sh [--body] [--keepspam] [--subject|--from|--to|--fromto] <pattern> [<year>]"
24 }
25
26 RESULT_MBOX="/tmp/gma"
27
28 if [[ -z "${MAIL_ARCHIVE_DIR}" ]]; then
29     echo "Undefined \$MAIL_ARCHIVE_DIR" >&2
30     exit 1
31 fi
32
33 HEADER_ONLY="-H"
34
35 while [[ $1 ]]; do
36
37     case $1 in
38
39         "--help"|"-h")
40             usage
41             exit 0
42             ;;
43
44         "--body")
45             HEADER_ONLY=""
46             ;;
47
48         "--keepspam")
49             KEEP_SPAM=1
50             ;;
51
52         "--from")
53             RE_PREFIX="^From:.*"
54             ;;
55
56         "--to")
57             RE_PREFIX="^To:.*"
58             ;;
59
60         "--fromto")
61             RE_PREFIX="^(From|To):.*"
62             ;;
63
64         "--subject")
65             RE_PREFIX="^Subject:.*"
66             ;;
67
68         *)
69             if [[ ${PATTERN} ]]; then
70                 if [[ ${FILE_PATTERN} ]]; then
71                     usage
72                     exit 1
73                 else
74                     FILE_PATTERN="${MAIL_ARCHIVE_DIR}/${1}/*/*"
75                     SIZE_FILE_PATTERN="${MAIL_ARCHIVE_DIR}/${1}"
76                 fi
77             else
78                 PATTERN=$1
79             fi
80             ;;
81     esac
82     shift
83 done
84
85 if [[ -z "${PATTERN}" ]]; then
86     usage
87     exit 1
88 fi
89
90 [[ ${FILE_PATTERN} ]] || FILE_PATTERN="${MAIL_ARCHIVE_DIR}/*/*/*"
91 [[ ${SIZE_FILE_PATTERN} ]] || SIZE_FILE_PATTERN="${MAIL_ARCHIVE_DIR}/"
92
93 SIZE=$(\dus ${SIZE_FILE_PATTERN} | cut -f 1 -d" ")
94
95 echo "Looking for ${RE_PREFIX}${PATTERN}"
96 echo "        in ${FILE_PATTERN}"
97 echo "        writing result in ${RESULT_MBOX}"
98
99 if [[ ${KEEP_SPAM} ]]; then
100
101     cat ${FILE_PATTERN} \
102         | pv -s ${SIZE} -p -t -e - \
103         | mboxgrep ${HEADER_ONLY} -i "${RE_PREFIX}${PATTERN}" > ${RESULT_MBOX}
104
105 else
106
107     cat ${FILE_PATTERN} \
108         | pv -s ${SIZE} -p -t -e - \
109         | mboxgrep ${HEADER_ONLY} -i "${RE_PREFIX}${PATTERN}" \
110         | mboxgrep ${HEADER_ONLY} -v '^Subject:.*SPAM' > ${RESULT_MBOX}
111
112 fi
113
114 echo "Found "$(grep ^"From " ${RESULT_MBOX} | wc -l)" messages."