2003 and 2006 and haven't been tracked by any SCM. The changes are the following, in reverse order: * src/mboxgrep.h, src/main.c, src/mbox.c, src/mbox.h, src/scan.c: Temporary mbox file (used for deleting messages) is now created by tmpmbox_create(); tmpp global pointer is killed; portions of code in scan.c are replaced by single call of mbox_write_message(); scan.c no longer includes zlib.h and bzlib.h. * src/mboxgrep.h, src/main.c, src/maildir.c, src/scan.c: Got rid off tmpp and maildir_count global variables (code cleanup). * src/mboxgrep.h, src/main.c, src/scan.c: Introduction of the global runtime_t structure; mailbox counter, MD5 hash and other global variables are now part of it (code cleanup). * src/mboxgrep.h, src/re.c, src/re.h, src/scan.c: Portions of scan_mailbox() have been moved to new functions, pcre_match() and regex_match() (code cleanup). * src/main.c, src/mboxgrep.h, src/re.c, src/re.h, src/scan.c: main() has been partially uncluttered by moving portions of the code to functions pcre_init() and regex_init(). * src/main.c, src/mboxgrep.h, src/misc.c, src/misc.h: Variables regex_s and haveregex are now part of the option_t structure (code cleanup). * src/main.c, src/misc.c, src/misc.h: Parts of main() have been moved to set_default_options() and get_runtime_options() (code cleanup). * src/mbox.c, src/mbox.h: File mode and ownership-altering code has been moved to a separate function, tmpfile_mod_own (code cleanup). * src/mbox.c, src/mbox.h: Portions of the code from tmpfile_open moved to a new function, tmpfile_name (code cleanup). * src/maildir.c, src/mh.c: Removed some unused variables (have_return_path). * src/mboxgrep.h, src/maildir.c, src/mh.c, src/mbox.c, src/scan.c, src/main.c: boxname, outboxname, pipecmd and tmpfilename are now a part of the config_t structure and no longer global variables. * src/scan.c, src/misc.c, src/misc.h: Created postmark_print() to unclutter scan_mailbox(). * src/misc.c, src/misc.h, src/mbox.c, src/maildir.c, src/mh.c: Some repetitive code moved to malloc_message(). * src/mbox.c: Cleanup of mbox_write_message(); use of gzwrite_loop() and bzwrite_loop(). * src/scan.c, src/wrap.h, src/wrap.c: Wrote gzwrite_loop() and bzwrite_loop() to remove some repetitive code from scan.c. * src/scan.c: md5_check_message(): array b and cast in strncmp are no longer unsigned. * src/info.c, src/mboxgrep.h: Updated copyright information, changed author's email address to the one at Panix. * src/mbox.h, src/mbox.c, src/scan.c, src/main.c: mbox_write_message(); further fixes of message deletion code. * src/scan.c: Fixed deleting messages from mbox folders compressed with bzip2. * src/main.c, src/mbox.c: Moved James P. Dugal's ownership-preserving code from main() to tmpfile_open(). * src/info.c: If bzip2 support is compiled in, `--help' command should list `bz2mbox' as a valid option to `--mailbox-format='.
285 lines
6.9 KiB
C
285 lines
6.9 KiB
C
/* -*- C -*-
|
|
mboxgrep - scan mailbox for messages matching a regular expression
|
|
Copyright (C) 2000, 2001, 2002, 2003, 2004, 2006 Daniel Spiljar
|
|
|
|
Mboxgrep is free software; you can redistribute it and/or modify it
|
|
under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; either version 2 of the License, or
|
|
(at your option) any later version.
|
|
|
|
Mboxgrep is distributed in the hope that it will be useful, but
|
|
WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with mboxgrep; if not, write to the Free Software Foundation,
|
|
Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
|
|
|
$Id: scan.c,v 1.32 2006-10-22 23:34:49 dspiljar Exp $ */
|
|
|
|
#include <config.h>
|
|
|
|
#include <unistd.h>
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include <sys/types.h>
|
|
|
|
#ifdef HAVE_DIRENT_H
|
|
# include <dirent.h>
|
|
# define NAMLEN(dirent) strlen((dirent)->d_name)
|
|
#else
|
|
# define dirent direct
|
|
# define NAMLEN(dirent) (dirent)->d_namlen
|
|
# ifdef HAVE_SYS_NDIR_H
|
|
# include <sys/ndir.h>
|
|
# endif /* HAVE_SYS_NDIR_H */
|
|
# ifdef HAVE_SYS_DIR_H
|
|
# include <sys/dir.h>
|
|
# endif /* HAVE_SYS_DIR_H */
|
|
# ifdef HAVE_NDIR_H
|
|
# include <ndir.h>
|
|
# endif /* HAVE_NDIR_H */
|
|
#endif /* HAVE_DIRENT_H */
|
|
|
|
#include <time.h>
|
|
#include <errno.h>
|
|
#include <string.h>
|
|
#define BUFLEN 16384
|
|
|
|
#include "mboxgrep.h"
|
|
#include "scan.h"
|
|
#include "mbox.h"
|
|
#include "mh.h"
|
|
#include "maildir.h"
|
|
#include "wrap.h"
|
|
#include "md5.h"
|
|
#include "misc.h"
|
|
#include "re.h"
|
|
#ifdef HAVE_FTS_OPEN
|
|
# include <sys/stat.h>
|
|
# include <fts.h>
|
|
#else
|
|
# ifdef HAVE_FTW
|
|
# include <ftw.h>
|
|
# endif /* HAVE_FTW */
|
|
#endif /* HAVE_FTS_OPEN */
|
|
|
|
#ifdef HAVE_LIBDMALLOC
|
|
#include <dmalloc.h>
|
|
#endif /* HAVE_LIBDMALLOC */
|
|
|
|
void scan_mailbox (char path[])
|
|
/* {{{ */
|
|
{
|
|
static FILE *outf;
|
|
static mbox_t *mbox, *out;
|
|
static DIR *boxd, *foo;
|
|
static maildir_t *maildird;
|
|
static message_t *msg;
|
|
int delete = 0;
|
|
int isdup = 0;
|
|
|
|
if (config.format == MAILDIR && config.action == WRITE)
|
|
{
|
|
foo = opendir (config.outboxname); /* do NOT change this to m_opendir! */
|
|
if (foo == NULL && errno == ENOENT)
|
|
maildir_create (config.outboxname);
|
|
else closedir (foo);
|
|
|
|
if (-1 == maildir_check (config.outboxname))
|
|
{
|
|
if (config.merr)
|
|
fprintf (stderr, "%s: %s: Not a maildir folder\n", APPNAME,
|
|
config.outboxname);
|
|
exit (2);
|
|
}
|
|
}
|
|
|
|
runtime.count = 0;
|
|
if (config.action == DELETE)
|
|
delete = 1;
|
|
|
|
if ((config.format == MBOX) || (config.format == ZMBOX) ||
|
|
(config.format == BZ2MBOX))
|
|
{
|
|
mbox = (mbox_t *) mbox_open (path, "r");
|
|
if (mbox == NULL) return;
|
|
}
|
|
else if ((config.format == MH) || (config.format == NNMH) ||
|
|
(config.format == NNML))
|
|
{
|
|
boxd = mh_open (path);
|
|
if (boxd == NULL) return;
|
|
}
|
|
else if (config.format == MAILDIR)
|
|
{
|
|
maildird = maildir_open (path);
|
|
if (maildird == NULL) return;
|
|
}
|
|
|
|
for (;;)
|
|
{
|
|
config.res1 = 1;
|
|
config.res2 = 1;
|
|
|
|
if ((config.format == MBOX) || (config.format == ZMBOX) ||
|
|
(config.format == BZ2MBOX))
|
|
msg = (message_t *) mbox_read_message (mbox);
|
|
else if ((config.format == MH) || (config.format == NNMH) ||
|
|
(config.format == NNML))
|
|
msg = (message_t *) mh_read_message (boxd);
|
|
else if (config.format == MAILDIR)
|
|
msg = (message_t *) maildir_read_message (maildird);
|
|
|
|
if (msg == NULL) break;
|
|
|
|
if (msg->from == NULL) msg->from = (char *) xstrdup ("nobody");
|
|
|
|
#ifdef HAVE_LIBPCRE
|
|
if (config.perl)
|
|
pcre_match (msg);
|
|
else
|
|
#endif /* HAVE_LIBPCRE */
|
|
regex_match (msg);
|
|
|
|
if (config.dedup)
|
|
isdup = md5_check_message (msg->body, runtime.cs);
|
|
|
|
if (((config.res1 == 0) | (config.res2 == 0)) ^
|
|
((config.invert ^ delete)) &&
|
|
((config.dedup && !isdup) || !config.dedup))
|
|
{
|
|
if (config.action == DISPLAY)
|
|
{
|
|
if (config.format != MBOX && config.format != ZMBOX
|
|
&& config.format != BZ2MBOX
|
|
&& 0 != strncmp ("From ", msg->headers, 5))
|
|
postmark_print (msg);
|
|
fprintf (stdout, "%s\n%s", msg->headers, msg->body);
|
|
}
|
|
else if (config.action == WRITE)
|
|
{
|
|
if (config.format == MAILDIR)
|
|
maildir_write_message (msg, config.outboxname);
|
|
else if (config.format == MH || config.format == NNMH ||
|
|
config.format == NNML)
|
|
mh_write_message (msg, config.outboxname);
|
|
else if ((config.format == MBOX) || (config.format == ZMBOX) ||
|
|
(config.format == BZ2MBOX))
|
|
{
|
|
out = mbox_open (config.outboxname, "w");
|
|
/* fprintf (out->fp, "%s\n%s", msg->headers, msg->body); */
|
|
mbox_write_message (msg, out);
|
|
mbox_close (out);
|
|
}
|
|
}
|
|
else if (config.action == PIPE)
|
|
{
|
|
outf = popen (config.pipecmd, "w");
|
|
if (outf == NULL)
|
|
{
|
|
if (config.merr)
|
|
{
|
|
fprintf (stderr, "%s: %s: ", APPNAME, config.pipecmd);
|
|
perror (NULL);
|
|
}
|
|
exit (2);
|
|
} /* if */
|
|
fprintf (outf, "%s\n%s", msg->headers, msg->body);
|
|
pclose (outf);
|
|
}
|
|
else if (config.action == COUNT)
|
|
runtime.count++;
|
|
else if (config.action == DELETE &&
|
|
((config.format == MBOX) || (config.format == ZMBOX) ||
|
|
(config.format == BZ2MBOX)))
|
|
mbox_write_message (msg, runtime.tmp_mbox);
|
|
}
|
|
|
|
else if (((((config.res1 == 0) | (config.res2 == 0)) ^
|
|
config.invert) && delete) &&
|
|
((config.format == MH) || (config.format == NNMH) ||
|
|
(config.format == NNML) || (config.format == MAILDIR)))
|
|
m_unlink(msg->filename);
|
|
|
|
free(msg->body);
|
|
free(msg->headers);
|
|
free(msg);
|
|
} /* for */
|
|
if ((config.format == MBOX) || (config.format == ZMBOX) ||
|
|
(config.format == BZ2MBOX))
|
|
mbox_close (mbox);
|
|
else if ((config.format == MH) || (config.format == NNMH) ||
|
|
(config.format == NNML))
|
|
mh_close(boxd);
|
|
}
|
|
/* }}} */
|
|
|
|
void recursive_scan (char path[])
|
|
/* {{{ */
|
|
|
|
{
|
|
#ifdef HAVE_FTS_OPEN
|
|
FTS *ftsfoo;
|
|
FTSENT *ftsbar;
|
|
#endif /* HAVE_FTS_OPEN */
|
|
|
|
#ifdef HAVE_FTS_OPEN
|
|
{
|
|
char *p[2];
|
|
|
|
p[0] = strdup (path);
|
|
p[1] = 0;
|
|
|
|
ftsfoo = fts_open (p, FTS_NOCHDIR, NULL);
|
|
|
|
if (ftsfoo == NULL)
|
|
{
|
|
/* fixme (?) */
|
|
perror(APPNAME);
|
|
exit (2);
|
|
}
|
|
|
|
while ((ftsbar = fts_read (ftsfoo)))
|
|
scan_mailbox (ftsbar->fts_path);
|
|
|
|
fts_close (ftsfoo);
|
|
}
|
|
#else
|
|
ftw (path, (void *) scan_mailbox, 1);
|
|
#endif /* HAVE_FTS_OPEN */
|
|
}
|
|
|
|
/* }}} */
|
|
|
|
int md5_check_message (char *body, checksum_t *chksum)
|
|
/* {{{ */
|
|
{
|
|
struct md5_ctx a;
|
|
char b[16];
|
|
int i;
|
|
|
|
md5_init_ctx (&a);
|
|
if (body == NULL)
|
|
md5_process_bytes ("", 0, &a);
|
|
else
|
|
md5_process_bytes (body, strlen(body), &a);
|
|
md5_finish_ctx(&a, b);
|
|
|
|
for (i = 0; i < chksum->n; i++)
|
|
{
|
|
if (0 == strncmp ((char *)chksum->md5[i], b, 16))
|
|
return 1;
|
|
}
|
|
|
|
chksum->md5 =
|
|
(char **) xrealloc (chksum->md5, (1 + chksum->n) * sizeof (char *));
|
|
chksum->md5[chksum->n] = xstrdup (b);
|
|
|
|
(chksum->n)++;
|
|
|
|
return 0;
|
|
}
|
|
/* }}} */
|