summaryrefslogtreecommitdiff
path: root/archives/bin/splitmbox
blob: 7f679897b6b186009c605c73b164731d0af09c05 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
#!/bin/bash
#
# Split an mbox into one file per message, and file each message under
# messages/<@domain>/<local-part>, where the Message-Id is cut at its first "@".
#
# This needs to run under bash because some of the ${} stuff is a bash-ism.
#
# $Id$

# The mailbox to split is the first (and only) argument; it may be gzipped.
mbox=$1
# Messages are filed below this directory, relative to the current directory.
# It is exported so that child processes can see it.
destdir=messages
export destdir

# Enable extended globs: the *( ) patterns used in ${} expansions need them.
shopt -s extglob

# The expansions are quoted on purpose: with no argument an unquoted test
# degenerates to `[ ! -f ]`, which is false, and the check would be skipped.
if [ ! -f "$mbox" ]; then
  echo "mbox $mbox not found" >&2
  exit 1
fi

# The destination is never created here; it has to exist beforehand.
if [ ! -d "$destdir" ]; then
  echo "destination directory $destdir does not exist" >&2
  exit 1
fi

# Print the command that reads mailbox $1 onto stdout: "zcat" when the last
# path component ends in ".gz" (and is more than just ".gz"), otherwise "cat".
# Only the final component is inspected, so directory names, including ones
# with spaces, cannot influence the choice.
mbox_reader() {
  case ${1##*/} in
    ?*.gz) echo zcat ;;
    *) echo cat ;;
  esac
}

cat=$(mbox_reader "$mbox")

# Scratch directory that receives one file per message.  Bail out if it cannot
# be created: with an empty $tempdir the splitter below would write to /msg.N.
tempdir=$(mktemp -d) || {
  echo "failed to create temporary directory" >&2
  exit 1
}
# Exported because the sh -c snippet run by formail reads it from the
# environment.
export tempdir

# Feed the (possibly decompressed) mailbox to formail -s, which runs the
# snippet once per message; each message arrives on the snippet's stdin and is
# saved as msg.$FILENO (FILENO is expected to be supplied by formail).
"$cat" "$mbox" | formail -s sh -c 'cat - > "$tempdir/msg.$FILENO"'

# Normalise one raw Message-Id value ($1) and cut it at its first "@".
# Sets these variables in the calling shell:
#   messageid - $1 without its leading run of "<"/spaces and without one
#               trailing ">", and with every "/" replaced by "_"
#   file      - the part of messageid before the first "@"
#   dir       - the rest, starting at the first "@" (empty if there is none)
# The split uses a fixed "@*" pattern and a quoted (literal) prefix removal,
# so glob characters in the id ([, *, ?, \) need no escaping.
parse_messageid() {
  messageid=$1
  # strip the initial "<" and spaces ...
  messageid=${messageid#"${messageid%%[!< ]*}"}
  # ... the trailing ">", and replace /'s with _
  messageid=${messageid%>}
  messageid=${messageid//\//_}
  file=${messageid%%@*}
  dir=${messageid#"$file"}
}

for message in "$tempdir"/msg.*; do
  # If nothing was split out the glob stays unexpanded; skip the literal.
  [ -f "$message" ] || continue
  # Fetch the Message-Id.  Note: some messages carry more than one Message-Id,
  # so every value is processed.  read -r keeps backslashes intact; leading
  # and trailing whitespace is still trimmed by read.
  formail -x Message-Id < "$message" | while read -r raw_id; do
    parse_messageid "$raw_id"
    # create the directory if needed
    if [ ! -d "$destdir/$dir" ]; then
      mkdir -v "$destdir/$dir" || echo "failed to create $destdir/$dir" >&2
    fi
    # and link the message into place, never replacing an existing file
    # NOTE(review): ln makes a hard link, so $tempdir and $destdir have to be
    # on the same filesystem -- confirm this holds where the script is run.
    if [ ! -f "$destdir/$dir/$file" ]; then
      ln "$message" "$destdir/$dir/$file" || echo "failed to link $message to $destdir/$dir/$file" >&2
    fi
  done
  # The temporary name goes away; any links made above keep the content.
  rm "$message"
done
rmdir "$tempdir" # unless something remained