#!perl -w
# Copyright (C) all contributors
# License: AGPL-3.0+
#
# Exercises PublicInbox::Import against a temporary bare git repository:
# adding messages, rejecting duplicates, removing messages, checkpointing,
# and importing a From: header containing control characters.
#
# NOTE(review): this file was recovered from a copy in which every
# "<...>" span had been stripped and all newlines collapsed.  Literals
# marked "reconstructed" below were rebuilt from the surrounding
# assertions and must be confirmed against the canonical copy.
use v5.10.1;
use strict;
use PublicInbox::Eml;
use PublicInbox::Smsg;
use PublicInbox::Git;
use PublicInbox::Import;
use Fcntl qw(:DEFAULT SEEK_SET);
use PublicInbox::TestCommon;
use MIME::Base64 3.05; # Perl 5.10.0 / 5.9.2

# $for_destroy is never read below; presumably it only needs to stay in
# scope so the temporary directory outlives the test -- TODO confirm.
my ($dir, $for_destroy) = tmpdir();

my $git = PublicInbox::Git->new($dir);
my $im = PublicInbox::Import->new($git, 'testbox', 'test@example');
$im->init_bare;

# First message.  The Message-ID value is reconstructed: the 'c'..'z'
# loop further down plus the "26 revisions" assertion imply that the
# first two messages are "a" and "b".
my $mime = PublicInbox::Eml->new(<<'EOF');
From: a@example.com
To: b@example.com
Subject: this is a subject
Message-ID: <a@example.com>
Date: Fri, 02 Oct 1993 00:00:00 +0000

hello world
EOF

# The object_id checks below only run when $v2 is true.
# NOTE(review): presumably the second argument makes require_git() return
# false instead of skipping the whole test -- confirm in TestCommon.
my $v2 = require_git(2.6, 1);
my $smsg = $v2 ? bless({}, 'PublicInbox::Smsg') : undef;
like($im->add($mime, undef, $smsg), qr/\A:[0-9]+\z/, 'added one message');

SKIP: {
	skip 'git 2.6+ required', 3 if !$v2;
	like($smsg->{blob}, qr/\A[a-f0-9]{40,64}\z/, 'got last object_id');

	# Cross-check the blob id recorded in $smsg against what
	# `git hash-object --stdin` computes for the same bytes.
	my @cmd = ('git', "--git-dir=$git->{git_dir}", qw(hash-object --stdin));

	# 3-arg open with an undef filename yields an anonymous temp file
	open my $in, '+<', undef or BAIL_OUT "open(+<): $!";
	print $in $mime->as_string or die "write failed: $!";
	$in->flush or die "flush failed: $!";
	seek($in, 0, SEEK_SET) or die "seek: $!";

	# NOTE(review): { 0 => $in } presumably redirects the child's
	# stdin to the temp file -- confirm against xqx() in TestCommon.
	chomp(my $hashed_obj = xqx(\@cmd, undef, { 0 => $in }));
	is($?, 0, 'hash-object');
	is($hashed_obj, $smsg->{blob}, "blob object_id matches exp");
}

$im->done;
my @revs = $git->qx(qw(rev-list HEAD));
is(scalar @revs, 1, 'one revision created');

# Second message, with a deliberately malformed From: header.
# NOTE(review): the tail of this literal (from "<" onward) and the
# Message-ID below are reconstructed -- confirm.
my $odd = '"=?iso-8859-1?Q?J_K=FCpper?= <usenet"@example.de';
$mime->header_set('From', $odd);
$mime->header_set('Message-ID', '<b@example.com>');
$mime->header_set('Subject', 'msg2');
like($im->add($mime, sub { $mime }), qr/\A:\d+\z/, 'added 2nd message');
$im->done;
@revs = $git->qx(qw(rev-list HEAD));
is(scalar @revs, 2, '2 revisions exist');

# Re-adding the identical message must not create another revision.
is($im->add($mime), undef, 'message only inserted once');
$im->done;
@revs = $git->qx(qw(rev-list HEAD));
is(scalar @revs, 2, '2 revisions exist');

# 24 more messages (c..z) on top of the 2 above => 26 revisions.
foreach my $c ('c'..'z') {
	$mime->header_set('Message-ID', "<$c\@example.com>");
	$mime->header_set('Subject', "msg - $c");
	like($im->add($mime), qr/\A:\d+\z/, "added $c message");
}

$im->done;
@revs = $git->qx(qw(rev-list HEAD));
is(scalar @revs, 26, '26 revisions exist after mass import');

# $mime still carries the last ("z") message from the loop above.
my ($mark, $msg) = $im->remove($mime);
like($mark, qr/\A:\d+\z/, 'got mark');
like(ref($msg), qr/\bPublicInbox::(?:Eml|MIME)\b/, 'got old message deleted');

is(undef, $im->remove($mime), 'remove is idempotent');

# mismatch on identical Message-ID
# NOTE(review): reconstructed; must name a message that is already stored
# with a different Subject, which the first message ("a") satisfies.
$mime->header_set('Message-ID', '<a@example.com>');
($mark, $msg) = $im->remove($mime);
is($mark, 'MISMATCH', 'mark == MISMATCH on mismatch');
is($msg->header('Message-ID'), '<a@example.com>', 'Message-ID matches');
isnt($msg->header('Subject'), $mime->header('Subject'), 'subject mismatch');

# A check callback returning undef must veto the add.
# NOTE(review): reconstructed; any Message-ID not yet imported works here.
$mime->header_set('Message-Id', '<failcheck@example.com>');
is($im->add($mime, sub { undef }), undef, 'check callback fails');
is($im->remove($mime), undef, 'message not added, so not removed');
is(undef, $im->checkpoint, 'checkpoint works before ->done');
$im->done;
is(undef, $im->checkpoint, 'checkpoint works after ->done');
$im->checkpoint;

# Importing into a path that does not exist must die.
my $nogit = PublicInbox::Git->new("$dir/non-existent/dir");
eval {
	my $nope = PublicInbox::Import->new($nogit, 'nope', 'no@example.com');
	$nope->add($mime);
};
ok($@, 'Import->add fails on non-existent dir');

# Run the control-character test with every available message class;
# PublicInbox::MIME is only added when Email::MIME can be loaded.
my @cls = qw(PublicInbox::Eml);
SKIP: {
	require_mods('Email::MIME', 1);
	require PublicInbox::MIME;
	push @cls, 'PublicInbox::MIME';
};

# The encoded display name contains CR, LF, NUL and the literal text
# "$main::badchars" (the "\$" keeps it from interpolating).  The package
# variable is set so that, if anything did interpolate that text, the
# author regex below would stop matching.
$main::badchars = "\n\0\r";
my $from = '=?UTF-8?B?'. encode_base64("B\ra\nd\0\$main::badchars", ''). '?=';
for my $cls (@cls) {
	# NOTE(review): the heredoc operator and the address on the From:
	# line are reconstructed -- confirm.
	my $eml = $cls->new(<<EOF);
From: $from <spammer\@example.com>
Message-ID: <$cls\@example.com>

EOF
	ok($im->add($eml), "added $cls message with nasty char in From");
}
$im->done;

# The resulting commit must carry a sanitized author line and the
# repository must still pass a strict fsck.
my $bref = $git->cat_file('HEAD');
# NOTE(review): the address portion of this pattern is reconstructed.
like($$bref, qr/^author Ba d \$main::badchars <spammer\@example\.com> /sm,
	'latest commit accepted by spammer');
$git->qx(qw(fsck --no-progress --strict));
is($?, 0, 'fsck reported no errors');
$main::badchars = undef;

done_testing();