Mailing List Archive

svn commit: r446790 - in /spamassassin/trunk/lib/Mail/SpamAssassin: ArchiveIterator.pm Constants.pm
Author: felicity
Date: Fri Sep 15 16:55:22 2006
New Revision: 446790

URL: http://svn.apache.org/viewvc?view=rev&rev=446790
Log:
bug 5101: fix bug in mbx parsing; also update the MBX_SEPARATOR RE to anchor at the start and end of lines, which should make things faster.

Modified:
spamassassin/trunk/lib/Mail/SpamAssassin/ArchiveIterator.pm
spamassassin/trunk/lib/Mail/SpamAssassin/Constants.pm

Modified: spamassassin/trunk/lib/Mail/SpamAssassin/ArchiveIterator.pm
URL: http://svn.apache.org/viewvc/spamassassin/trunk/lib/Mail/SpamAssassin/ArchiveIterator.pm?view=diff&rev=446790&r1=446789&r2=446790
==============================================================================
--- spamassassin/trunk/lib/Mail/SpamAssassin/ArchiveIterator.pm (original)
+++ spamassassin/trunk/lib/Mail/SpamAssassin/ArchiveIterator.pm Fri Sep 15 16:55:22 2006
@@ -849,7 +849,7 @@
}

$self->bump_scan_progress();
- $info->{"$file.$offset"} = Mail::SpamAssassin::Util::receive_date($header);
+ $info->{$offset} = Mail::SpamAssassin::Util::receive_date($header);

# go onto the next message
seek(INPUT, $offset + $size, 0);

Modified: spamassassin/trunk/lib/Mail/SpamAssassin/Constants.pm
URL: http://svn.apache.org/viewvc/spamassassin/trunk/lib/Mail/SpamAssassin/Constants.pm?view=diff&rev=446790&r1=446789&r2=446790
==============================================================================
--- spamassassin/trunk/lib/Mail/SpamAssassin/Constants.pm (original)
+++ spamassassin/trunk/lib/Mail/SpamAssassin/Constants.pm Fri Sep 15 16:55:22 2006
@@ -265,7 +265,7 @@

# regular expression that matches message separators in The University of
# Washington's MBX mailbox format
-use constant MBX_SEPARATOR => qr/([\s|\d]\d-[a-zA-Z]{3}-\d{4}\s\d{2}:\d{2}:\d{2}.*),(\d+);([\da-f]{12})-(\w{8})/;
+use constant MBX_SEPARATOR => qr/^([\s|\d]\d-[a-zA-Z]{3}-\d{4}\s\d{2}:\d{2}:\d{2}.*),(\d+);([\da-f]{12})-(\w{8})\r?$/;
# $1 = datestamp (str)
# $2 = size of message in bytes (int)
# $3 = message status - binary (hex)