#!perl -w # Copyright (C) 2020-2021 all contributors # License: AGPL-3.0+ use strict; use v5.10.1; use Test::More; use PublicInbox::TestCommon; use PublicInbox::Eml; use Fcntl qw(SEEK_SET); use PublicInbox::Spawn qw(popen_rd which); use List::Util qw(shuffle); require_mods(qw(DBD::SQLite)); require PublicInbox::MboxReader; use_ok 'PublicInbox::LeiToMail'; my $from = "Content-Length: 10\nSubject: x\n\nFrom hell\n"; my $noeol = "Subject: x\n\nFrom hell"; my $crlf = $noeol; $crlf =~ s/\n/\r\n/g; my $kw = [qw(seen answered flagged)]; my @MBOX = qw(mboxcl2 mboxrd mboxcl mboxo); for my $mbox (@MBOX) { my $m = "eml2$mbox"; my $cb = PublicInbox::LeiToMail->can($m); my $s = $cb->(PublicInbox::Eml->new($from), $kw); is(substr($$s, -1, 1), "\n", "trailing LF in normal $mbox"); my $eml = PublicInbox::Eml->new($s); is($eml->header('Status'), 'R', "Status: set by $m"); is($eml->header('X-Status'), 'AF', "X-Status: set by $m"); if ($mbox eq 'mboxcl2') { like($eml->body_raw, qr/^From /, "From not escaped $m"); } else { like($eml->body_raw, qr/^>From /, "From escaped once by $m"); } my @cl = $eml->header('Content-Length'); if ($mbox =~ /mboxcl/) { is(scalar(@cl), 1, "$m only has one Content-Length header"); is($cl[0] + length("\n"), length($eml->body_raw), "$m Content-Length matches"); } else { is(scalar(@cl), 0, "$m clobbered Content-Length"); } $s = $cb->(PublicInbox::Eml->new($noeol), $kw); is(substr($$s, -1, 1), "\n", "trailing LF added by $m when original lacks EOL"); $eml = PublicInbox::Eml->new($s); if ($mbox eq 'mboxcl2') { is($eml->body_raw, "From hell\n", "From not escaped by $m"); } else { is($eml->body_raw, ">From hell\n", "From escaped once by $m"); } $s = $cb->(PublicInbox::Eml->new($crlf), $kw); is(substr($$s, -2, 2), "\r\n", "trailing CRLF added $m by original lacks EOL"); $eml = PublicInbox::Eml->new($s); if ($mbox eq 'mboxcl2') { is($eml->body_raw, "From hell\r\n", "From not escaped by $m"); } else { is($eml->body_raw, ">From hell\r\n", "From escaped once by $m"); } if ($mbox =~ /mboxcl/) { is($eml->header('Content-Length') + length("\r\n"), length($eml->body_raw), "$m Content-Length matches"); } elsif ($mbox eq 'mboxrd') { $s = $cb->($eml, $kw); $eml = PublicInbox::Eml->new($s); is($eml->body_raw, ">>From hell\r\n\r\n", "From escaped again by $m"); } } my ($tmpdir, $for_destroy) = tmpdir(); local $ENV{TMPDIR} = $tmpdir; open my $err, '>>', "$tmpdir/lei.err" or BAIL_OUT $!; my $lei = { 2 => $err }; my $buf = <<'EOM'; From: x@example.com Subject: x blah EOM my $fn = "$tmpdir/x.mbox"; my ($mbox) = shuffle(@MBOX); # pick one, shouldn't matter my $orig = do { my $wcb = PublicInbox::LeiToMail->write_cb("$mbox:$fn", $lei); is(ref $wcb, 'CODE', 'write_cb returned callback'); ok(-f $fn && !-s _, 'empty file created'); $wcb->(\(my $dup = $buf), 'deadbeef', [ qw(seen) ]); undef $wcb; open my $fh, '<', $fn or BAIL_OUT $!; my $raw = do { local $/; <$fh> }; like($raw, qr/^blah\n/sm, 'wrote content'); unlink $fn or BAIL_OUT $!; local $lei->{opt} = { jobs => 2 }; $wcb = PublicInbox::LeiToMail->write_cb("$mbox:$fn", $lei); ok(-f $fn && !-s _, 'truncated mbox destination'); $lei->{dedupe}->prepare_dedupe; $wcb->(\($dup = $buf), 'deadbeef', [ qw(seen) ]); undef $wcb; open $fh, '<', $fn or BAIL_OUT $!; is($raw, do { local $/; <$fh> }, 'jobs > 1'); $raw; }; for my $zsfx (qw(gz bz2 xz)) { # XXX should we support zst, zz, lzo, lzma? my $zsfx2cmd = PublicInbox::LeiToMail->can('zsfx2cmd'); SKIP: { my $cmd = eval { $zsfx2cmd->($zsfx, 0, $lei) }; skip $@, 3 if $@; my $dc_cmd = eval { $zsfx2cmd->($zsfx, 1, $lei) }; ok($dc_cmd, "decompressor for .$zsfx"); my $f = "$fn.$zsfx"; my $dst = "$mbox:$f"; my $wcb = PublicInbox::LeiToMail->write_cb($dst, $lei); $wcb->(\(my $dup = $buf), 'deadbeef', [ qw(seen) ]); undef $wcb; my $uncompressed = xqx([@$dc_cmd, $f]); is($uncompressed, $orig, "$zsfx works unlocked"); local $lei->{opt} = { jobs => 2 }; # for atomic writes unlink $f or BAIL_OUT "unlink $!"; $wcb = PublicInbox::LeiToMail->write_cb($dst, $lei); $lei->{dedupe}->prepare_dedupe; $wcb->(\($dup = $buf), 'deadbeef', [ qw(seen) ]); undef $wcb; is(xqx([@$dc_cmd, $f]), $orig, "$zsfx matches with lock"); local $lei->{opt} = { augment => 1 }; $wcb = PublicInbox::LeiToMail->write_cb($dst, $lei); $lei->{dedupe}->prepare_dedupe; $wcb->(\($dup = $buf . "\nx\n"), 'deadbeef', [ qw(seen) ]); undef $wcb; # commit my $cat = popen_rd([@$dc_cmd, $f]); my @raw; PublicInbox::MboxReader->$mbox($cat, sub { push @raw, shift->as_string }); like($raw[1], qr/\nblah\n\nx\n\z/s, "augmented $zsfx"); like($raw[0], qr/\nblah\n\z/s, "original preserved $zsfx"); local $lei->{opt} = { augment => 1, jobs => 2 }; $wcb = PublicInbox::LeiToMail->write_cb($dst, $lei); $lei->{dedupe}->prepare_dedupe; $wcb->(\($dup = $buf . "\ny\n"), 'deadbeef', [ qw(seen) ]); undef $wcb; # commit my @raw3; $cat = popen_rd([@$dc_cmd, $f]); PublicInbox::MboxReader->$mbox($cat, sub { push @raw3, shift->as_string }); my $y = pop @raw3; is_deeply(\@raw3, \@raw, 'previous messages preserved'); like($y, qr/\nblah\n\ny\n\z/s, "augmented $zsfx (atomic)"); } } unlink $fn or BAIL_OUT $!; if ('default deduplication uses content_hash') { my $wcb = PublicInbox::LeiToMail->write_cb("mboxo:$fn", $lei); $wcb->(\(my $x = $buf), 'deadbeef', []) for (1..2); undef $wcb; # undef to commit changes my $cmp = ''; open my $fh, '<', $fn or BAIL_OUT $!; PublicInbox::MboxReader->mboxo($fh, sub { $cmp .= shift->as_string }); is($cmp, $buf, 'only one message written'); local $lei->{opt} = { augment => 1 }; $wcb = PublicInbox::LeiToMail->write_cb("mboxo:$fn", $lei); $wcb->(\($x = $buf . "\nx\n"), 'deadbeef', []) for (1..2); undef $wcb; # undef to commit changes open $fh, '<', $fn or BAIL_OUT $!; my @x; PublicInbox::MboxReader->mboxo($fh, sub { push @x, shift->as_string }); is(scalar(@x), 2, 'augmented mboxo'); is($x[0], $cmp, 'original message preserved'); is($x[1], $buf . "\nx\n", 'new message appended'); } { # stdout support open my $tmp, '+>', undef or BAIL_OUT $!; local $lei->{1} = $tmp; my $wcb = PublicInbox::LeiToMail->write_cb("mboxrd:/dev/stdout", $lei); $wcb->(\(my $x = $buf), 'deadbeef', []); undef $wcb; # commit seek($tmp, 0, SEEK_SET) or BAIL_OUT $!; my $cmp = ''; PublicInbox::MboxReader->mboxrd($tmp, sub { $cmp .= shift->as_string }); is($cmp, $buf, 'message written to stdout'); } SKIP: { # FIFO support use POSIX qw(mkfifo); my $fn = "$tmpdir/fifo"; mkfifo($fn, 0600) or skip("mkfifo not supported: $!", 1); my $cat = popen_rd([which('cat'), $fn]); my $wcb = PublicInbox::LeiToMail->write_cb("mboxo:$fn", $lei); $wcb->(\(my $x = $buf), 'deadbeef', []); undef $wcb; # commit my $cmp = ''; PublicInbox::MboxReader->mboxo($cat, sub { $cmp .= shift->as_string }); is($cmp, $buf, 'message written to FIFO'); } { # Maildir support my $md = "$tmpdir/maildir/"; my $wcb = PublicInbox::LeiToMail->write_cb("Maildir:$md", $lei); ok($wcb, 'got Maildir callback'); $lei->{dedupe}->prepare_dedupe; $wcb->(\(my $x = $buf), 'badc0ffee', []); undef $wcb; # commit my @f; PublicInbox::LeiToMail::_maildir_each_file($md, sub { push @f, shift }); is(scalar(@f), 1, 'wrote one file'); open my $fh, $f[0] or BAIL_OUT $!; is(do { local $/; <$fh> }, $buf, 'wrote to Maildir'); $wcb = PublicInbox::LeiToMail->write_cb("maildir:$md", $lei); $lei->{dedupe}->prepare_dedupe; $wcb->(\($x = $buf."\nx\n"), 'deadcafe', []); undef $wcb; # commit my @x = (); PublicInbox::LeiToMail::_maildir_each_file($md, sub { push @x, shift }); is(scalar(@x), 1, 'wrote one new file'); ok(!-f $f[0], 'old file clobbered'); open $fh, $x[0] or BAIL_OUT $!; is(do { local $/; <$fh> }, $buf."\nx\n", 'wrote new file to Maildir'); local $lei->{opt}->{augment} = 1; $wcb = PublicInbox::LeiToMail->write_cb("maildir:$md", $lei); $lei->{dedupe}->prepare_dedupe; $wcb->(\($x = $buf."\ny\n"), 'deadcafe', []); $wcb->(\($x = $buf."\ny\n"), 'b4dc0ffee', []); # skipped by dedupe undef $wcb; # commit @f = (); PublicInbox::LeiToMail::_maildir_each_file($md, sub { push @f, shift }); is(scalar grep(/\A\Q$x[0]\E\z/, @f), 1, 'old file still there'); my @new = grep(!/\A\Q$x[0]\E\z/, @f); is(scalar @new, 1, '1 new file written (b4dc0ffee skipped)'); open $fh, $x[0] or BAIL_OUT $!; is(do { local $/; <$fh> }, $buf."\nx\n", 'old file untouched'); open $fh, $new[0] or BAIL_OUT $!; is(do { local $/; <$fh> }, $buf."\ny\n", 'new file written'); } done_testing;