From eeabb27977bca531a1918ab85a7714c91ceaee42 Mon Sep 17 00:00:00 2001 From: "Eric Wong (Contractor, The Linux Foundation)" Date: Thu, 15 Feb 2018 01:12:18 +0000 Subject: scripts/import_vger_from_mbox: use v2 layout for import Big lists are orders of magnitude more efficient with v2. --- scripts/import_vger_from_mbox | 24 ++++++------------------ 1 file changed, 6 insertions(+), 18 deletions(-) (limited to 'scripts') diff --git a/scripts/import_vger_from_mbox b/scripts/import_vger_from_mbox index 3fa5c778..6ea2ca5d 100644 --- a/scripts/import_vger_from_mbox +++ b/scripts/import_vger_from_mbox @@ -22,32 +22,20 @@ binmode STDIN; my $msg = ''; use PublicInbox::Filter::Vger; my $vger = PublicInbox::Filter::Vger->new; +if ($im) { + $im->{ssoma_lock} = 0; + $im->{path_type} = 'v2'; +} + sub do_add ($$) { my ($im, $msg) = @_; $$msg =~ s/(\r?\n)+\z/$1/s; $msg = Email::MIME->new($$msg); $msg = $vger->scrub($msg); - my $hdr = $msg->header_obj; - my $date = $hdr->header_raw('Date'); - if ($date) { - eval { str2time($date) }; - if ($@) { - warn "bad Date: $date in ", - $hdr->header_raw('Message-ID'), ": $@\n"; - } - } else { - warn "missing Date: $date in ", - $hdr->header_raw('Message-ID'), ": $@\n"; - my $n = 0; - foreach my $r ($hdr->header_raw('Received')) { - warn "$n Received: $r\n"; - } - warn(('-' x 72), "\n"); - } return unless $im; $im->add($msg) or warn "duplicate: ", - $hdr->header_raw('Message-ID'), "\n"; + $msg->header_obj->header_raw('Message-ID'), "\n"; } # asctime: From example@example.com Fri Jun 23 02:56:55 2000 -- cgit v1.2.3-24-ge0c7