about summary refs log tree commit homepage
path: root/xt
diff options
context:
space:
mode:
authorEric Wong <e@80x24.org>2021-09-19 12:50:30 +0000
committerEric Wong <e@80x24.org>2021-09-19 19:53:01 +0000
commitc029c9e085ca1f1b1319e566157e04f9c972c55b (patch)
treead7b4f20990ba57b409572856e25eb9012a0aa2e /xt
parent67fe4d8d90ac77419c8fc41457c849aa7d366a9d (diff)
downloadpublic-inbox-c029c9e085ca1f1b1319e566157e04f9c972c55b.tar.gz
I'm not sure what caused it, but I've noticed two missing
messages that failed from "lei up" on an https:// external;
and I've also seen some duplicates in the past (which I
think I fixed...).
Diffstat (limited to 'xt')
-rw-r--r--xt/over-fsck.perl44
1 files changed, 44 insertions, 0 deletions
diff --git a/xt/over-fsck.perl b/xt/over-fsck.perl
new file mode 100644
index 00000000..053204fe
--- /dev/null
+++ b/xt/over-fsck.perl
@@ -0,0 +1,44 @@
+#!perl -w
+# Copyright (C) all contributors <meta@public-inbox.org>
+# License: AGPL-3.0+ <https://www.gnu.org/licenses/agpl-3.0.txt>
+# unstable dev script, chasing a bug which may be in LeiSavedSearch->is_dup
+use v5.12;
+use Data::Dumper;
+use PublicInbox::OverIdx;
+@ARGV == 1 or die "Usage: $0 /path/to/over.sqlite3\n";
+my $over = PublicInbox::OverIdx->new($ARGV[0]);
+my $dbh = $over->dbh;
+$dbh->do('PRAGMA mmap_size = '.(2 ** 48));
+my $num = 0;
+my ($err, $none, $nr, $ids);
+$Data::Dumper::Useqq = $Data::Dumper::Sortkeys = 1;
+do {
+        $ids = $over->ids_after(\$num);
+        $nr += @$ids;
+        for my $n (@$ids) {
+                my $smsg = $over->get_art($n);
+                if (!$smsg) {
+                        warn "#$n article missing\n";
+                        ++$err;
+                        next;
+                }
+                my $exp = $smsg->{blob};
+                if ($exp eq '') {
+                        ++$none if $smsg->{bytes};
+                        next;
+                }
+                my $xr3 = $over->get_xref3($n, 1);
+                my $found;
+                for my $r (@$xr3) {
+                        $r->[2] = unpack('H*', $r->[2]);
+                        $found = 1 if $r->[2] eq $exp;
+                }
+                if (!$found) {
+                        warn Dumper([$smsg, $xr3 ]);
+                        ++$err;
+                }
+        }
+} while (@$ids);
+warn "$none/$nr had no blob (external?)\n" if $none;
+warn "$err errors\n" if $err;
+exit($err ? 1 : 0);