about summary refs log tree commit homepage
path: root/lib/PublicInbox/SearchIdx.pm
diff options
context:
space:
mode:
authorEric Wong <e@80x24.org>2015-10-03 10:02:33 +0000
committerEric Wong <e@80x24.org>2015-10-03 10:03:59 +0000
commitc68a1fcd75f103d08f8c2dabf9b3a1db4239f59c (patch)
tree5b431709093a712719136e8f07f9cac46af85aee /lib/PublicInbox/SearchIdx.pm
parent22d8fcc3d37b9ce13a5088f1d0557078c9a84062 (diff)
downloadpublic-inbox-c68a1fcd75f103d08f8c2dabf9b3a1db4239f59c.tar.gz
Xapian has this limit for terms, and there are likely no
legitimate Message-IDs (or single header lines) this long; so
there's no need to workaround this limit.
Diffstat (limited to 'lib/PublicInbox/SearchIdx.pm')
-rw-r--r--lib/PublicInbox/SearchIdx.pm5
1 files changed, 5 insertions, 0 deletions
diff --git a/lib/PublicInbox/SearchIdx.pm b/lib/PublicInbox/SearchIdx.pm
index 8184dc71..0646cfb3 100644
--- a/lib/PublicInbox/SearchIdx.pm
+++ b/lib/PublicInbox/SearchIdx.pm
@@ -8,6 +8,7 @@ use base qw(PublicInbox::Search);
 use PublicInbox::MID qw/mid_clean id_compress/;
 *xpfx = *PublicInbox::Search::xpfx;
 
+use constant MAX_MID_SIZE => 244; # max term size - 1 in Xapian
 use constant {
         PERM_UMASK => 0,
         OLD_PERM_GROUP => 1,
@@ -52,6 +53,7 @@ sub add_message {
         my $ct_msg = $mime->header('Content-Type') || 'text/plain';
 
         eval {
+                die 'Message-ID too long' if length($mid) > MAX_MID_SIZE;
                 my $smsg = $self->lookup_message($mid);
                 my $doc;
 
@@ -230,6 +232,9 @@ sub link_message_to_parents {
 
                 # prevent circular references via References: here:
                 foreach my $ref (@orig_refs) {
+                        if (length($ref) > MAX_MID_SIZE) {
+                                warn "References: <$ref> too long, ignoring\n";
+                        }
                         next if $uniq{$ref};
                         $uniq{$ref} = 1;
                         push @refs, $ref;