about summary refs log tree commit homepage
path: root/lib/PublicInbox/ExtMsg.pm
diff options
context:
space:
mode:
author Eric Wong <e@80x24.org> 2020-12-04 22:03:49 +0000
committer Eric Wong <e@80x24.org> 2020-12-05 21:41:52 +0000
commit 8e0aef5068aa71e58d4a049491229f41e6bf19fb (patch)
tree adc875a52b6671cb8dd61df6b9139f584e39b4e0 /lib/PublicInbox/ExtMsg.pm
parent 629e22b8351e96a831535baa2854d0c9ca014445 (diff)
download public-inbox-8e0aef5068aa71e58d4a049491229f41e6bf19fb.tar.gz
extmsg: use ->ALL for "global" MID lookups
As with NewsWWW and NNTP, we can use ->ALL to completely
avoid trying SQLite/Xapian lookups across hundreds/thousands
of inboxes.
Diffstat (limited to 'lib/PublicInbox/ExtMsg.pm')
-rw-r--r-- lib/PublicInbox/ExtMsg.pm 36
1 files changed, 33 insertions, 3 deletions
diff --git a/lib/PublicInbox/ExtMsg.pm b/lib/PublicInbox/ExtMsg.pm
index 03faf3a1..2a0a3e46 100644
--- a/lib/PublicInbox/ExtMsg.pm
+++ b/lib/PublicInbox/ExtMsg.pm
@@ -103,9 +103,37 @@ sub ext_msg_step {
         }
 }
 
+sub ext_msg_ALL ($) {
+        my ($ctx) = @_;
+        my $ALL = $ctx->{www}->{pi_config}->ALL or return;
+        my $by_eidx_key = $ctx->{www}->{pi_config}->{-by_eidx_key};
+        my $cur_key = $ctx->{-inbox}->eidx_key;
+        my %seen = ($cur_key => 1);
+        my ($id, $prev);
+        while (my $x = $ALL->over->next_by_mid($ctx->{mid}, \$id, \$prev)) {
+                my $xr3 = $ALL->over->get_xref3($x->{num});
+                for my $k (@$xr3) {
+                        $k =~ s/:[0-9]+:$x->{blob}\z// or next;
+                        next if $k eq $cur_key;
+                        my $ibx = $by_eidx_key->{$k} // next;
+                        my $url = $ibx->base_url or next;
+                        push(@{$ctx->{found}}, $ibx) unless $seen{$k}++;
+                }
+        }
+        return exact($ctx) if $ctx->{found};
+
+        # fall back to partial MID matching
+        for my $ibxish ($ctx->{-inbox}, $ALL) {
+                my $mids = search_partial($ibxish, $ctx->{mid}) or next;
+                push @{$ctx->{partial}}, [ $ibxish, $mids ];
+                last if ($ctx->{n_partial} += scalar(@$mids)) >= PARTIAL_MAX;
+        }
+        partial_response($ctx);
+}
+
 sub ext_msg {
         my ($ctx) = @_;
-        sub {
+        ext_msg_ALL($ctx) // sub {
                 $ctx->{-wcb} = $_[0]; # HTTP server write callback
 
                 if ($ctx->{env}->{'pi-httpd.async'}) {
@@ -159,7 +187,7 @@ sub finalize_exact {
         finalize_partial($ctx);
 }
 
-sub finalize_partial {
+sub partial_response ($) {
         my ($ctx) = @_;
         my $mid = $ctx->{mid};
         my $code = 404;
@@ -192,9 +220,11 @@ sub finalize_partial {
         $ctx->{-html_tip} = $s .= '</pre>';
         $ctx->{-title_html} = $title;
         $ctx->{-upfx} = '../';
-        $ctx->{-wcb}->(html_oneshot($ctx, $code));
+        html_oneshot($ctx, $code);
 }
 
+sub finalize_partial ($) { $_[0]->{-wcb}->(partial_response($_[0])) }
+
 sub ext_urls {
         my ($ctx, $mid, $href, $html) = @_;