mboxgrep/src/scan.c

296 lines
8.0 KiB
C

/*
mboxgrep - scan mailbox for messages matching a regular expression
Copyright (C) 2000 - 2004, 2006, 2023 Daniel Spiljar
Mboxgrep is free software; you can redistribute it and/or modify it
under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 2 of the License, or
(at your option) any later version.
Mboxgrep is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with mboxgrep; if not, write to the Free Software Foundation,
Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
*/
#include <config.h>
#include <unistd.h>
#include <stdio.h>
#include <stdlib.h>
#include <sys/types.h>
#ifdef HAVE_DIRENT_H
# include <dirent.h>
# define NAMLEN(dirent) strlen((dirent)->d_name)
#else
# define dirent direct
# define NAMLEN(dirent) (dirent)->d_namlen
# ifdef HAVE_SYS_NDIR_H
# include <sys/ndir.h>
# endif
/* HAVE_SYS_NDIR_H */
# ifdef HAVE_SYS_DIR_H
# include <sys/dir.h>
# endif
/* HAVE_SYS_DIR_H */
# ifdef HAVE_NDIR_H
# include <ndir.h>
# endif
/* HAVE_NDIR_H */
#endif /* HAVE_DIRENT_H */
#include <time.h>
#include <errno.h>
#include <string.h>
#define BUFLEN 16384
#include "mboxgrep.h"
#include "scan.h"
#include "mbox.h"
#include "mh.h"
#include "maildir.h"
#include "wrap.h"
#include "md5.h"
#include "misc.h"
#include "re.h"
#ifdef HAVE_FTS_OPEN
# include <sys/stat.h>
# include <fts.h>
#else
# ifdef HAVE_FTW
# include <ftw.h>
# endif
/* HAVE_FTW */
#endif /* HAVE_FTS_OPEN */
#ifdef HAVE_LIBDMALLOC
# include <dmalloc.h>
#endif /* HAVE_LIBDMALLOC */
void
scan_mailbox (char path[])
{
static FILE *outf;
static mbox_t *mbox, *out;
static DIR *boxd, *foo;
static maildir_t *maildird;
static message_t *msg;
int delete = 0;
int isdup = 0;
if (config.format == FORMAT_MAILDIR && config.action == ACTION_WRITE)
{
foo = opendir (config.outboxname); /* do NOT change this to m_opendir! */
if (foo == NULL && errno == ENOENT)
maildir_create (config.outboxname);
else
closedir (foo);
if (-1 == maildir_check (config.outboxname))
{
if (config.merr)
fprintf (stderr, "%s: %s: Not a maildir folder\n", APPNAME,
config.outboxname);
exit (2);
}
}
runtime.count = 0;
if (config.action == ACTION_DELETE)
delete = 1;
if ((config.format == FORMAT_MBOX) || (config.format == FORMAT_ZMBOX)
|| (config.format == FORMAT_BZ2MBOX))
{
mbox = (mbox_t *) mbox_open (path, "r");
if (mbox == NULL)
return;
}
else if ((config.format == FORMAT_MH) || (config.format == FORMAT_NNMH)
|| (config.format == FORMAT_NNML))
{
boxd = mh_open (path);
if (boxd == NULL)
return;
}
else if (config.format == FORMAT_MAILDIR)
{
maildird = maildir_open (path);
if (maildird == NULL)
return;
}
for (;;)
{
config.res1 = 1;
config.res2 = 1;
if ((config.format == FORMAT_MBOX) || (config.format == FORMAT_ZMBOX)
|| (config.format == FORMAT_BZ2MBOX))
msg = (message_t *) mbox_read_message (mbox);
else if ((config.format == FORMAT_MH) || (config.format == FORMAT_NNMH)
|| (config.format == FORMAT_NNML))
msg = (message_t *) mh_read_message (boxd);
else if (config.format == FORMAT_MAILDIR)
msg = (message_t *) maildir_read_message (maildird);
if (msg == NULL)
break;
if (msg->from == NULL)
msg->from = (char *) xstrdup ("nobody");
#ifdef HAVE_LIBPCRE2
if (config.regextype == REGEX_PERL)
pcre_match (msg);
else
#endif /* HAVE_LIBPCRE2 */
regex_match (msg);
if (config.dedup)
isdup = md5_check_message (msg->body, runtime.cs);
if (((config.res1 == 0) | (config.res2 == 0)) ^
((config.invert ^ delete)) &&
((config.dedup && !isdup) || !config.dedup))
{
if (config.action == ACTION_DISPLAY)
{
if (config.format != FORMAT_MBOX && config.format != FORMAT_ZMBOX
&& config.format != FORMAT_BZ2MBOX
&& 0 != strncmp ("From ", msg->headers, 5))
postmark_print (msg);
fprintf (stdout, "%s\n%s", msg->headers, msg->body);
}
else if (config.action == ACTION_WRITE)
{
if (config.format == FORMAT_MAILDIR)
maildir_write_message (msg, config.outboxname);
else if (config.format == FORMAT_MH || config.format == FORMAT_NNMH
|| config.format == FORMAT_NNML)
mh_write_message (msg, config.outboxname);
else if ((config.format == FORMAT_MBOX) || (config.format == FORMAT_ZMBOX)
|| (config.format == FORMAT_BZ2MBOX))
{
out = mbox_open (config.outboxname, "w");
/* fprintf (out->fp, "%s\n%s", msg->headers, msg->body); */
mbox_write_message (msg, out);
mbox_close (out);
}
}
else if (config.action == ACTION_PIPE)
{
outf = popen (config.pipecmd, "w");
if (outf == NULL)
{
if (config.merr)
{
fprintf (stderr, "%s: %s: ", APPNAME, config.pipecmd);
perror (NULL);
}
exit (2);
} /* if */
fprintf (outf, "%s\n%s", msg->headers, msg->body);
pclose (outf);
}
else if (config.action == ACTION_COUNT)
runtime.count++;
else if (config.action == ACTION_DELETE &&
((config.format == FORMAT_MBOX) || (config.format == FORMAT_ZMBOX)
|| (config.format == FORMAT_BZ2MBOX)))
mbox_write_message (msg, runtime.tmp_mbox);
}
else
if (((((config.res1 == 0) | (config.res2 == 0)) ^ config.invert)
&& delete) && ((config.format == FORMAT_MH) || (config.format == FORMAT_NNMH)
|| (config.format == FORMAT_NNML)
|| (config.format == FORMAT_MAILDIR)))
m_unlink (msg->filename);
free (msg->body);
free (msg->headers);
free (msg);
} /* for */
if ((config.format == FORMAT_MBOX) || (config.format == FORMAT_ZMBOX)
|| (config.format == FORMAT_BZ2MBOX))
mbox_close (mbox);
else if ((config.format == FORMAT_MH) || (config.format == FORMAT_NNMH)
|| (config.format == FORMAT_NNML))
mh_close (boxd);
}
void
recursive_scan (char path[])
{
#ifdef HAVE_FTS_OPEN
FTS *ftsfoo;
FTSENT *ftsbar;
#endif /* HAVE_FTS_OPEN */
#ifdef HAVE_FTS_OPEN
{
char *p[2];
p[0] = strdup (path);
p[1] = 0;
ftsfoo = fts_open (p, FTS_NOCHDIR, NULL);
if (ftsfoo == NULL)
{
/* fixme (?) */
perror (APPNAME);
exit (2);
}
while ((ftsbar = fts_read (ftsfoo)))
scan_mailbox (ftsbar->fts_path);
fts_close (ftsfoo);
}
#else
ftw (path, (void *) scan_mailbox, 1);
#endif /* HAVE_FTS_OPEN */
}
int
md5_check_message (char *body, checksum_t * chksum)
{
struct md5_ctx a;
char b[16];
int i;
md5_init_ctx (&a);
if (body == NULL)
md5_process_bytes ("", 0, &a);
else
md5_process_bytes (body, strlen (body), &a);
md5_finish_ctx (&a, b);
for (i = 0; i < chksum->n; i++)
{
if (0 == strncmp ((char *) chksum->md5[i], b, 16))
return 1;
}
chksum->md5 =
(char **) xrealloc (chksum->md5, (1 + chksum->n) * sizeof (char *));
chksum->md5[chksum->n] = xstrdup (b);
(chksum->n)++;
return 0;
}