# Copyright (C) all contributors
# License: AGPL-3.0+
# *-external commands of lei
package PublicInbox::LeiExternal;
use strict;
use v5.10.1;
use PublicInbox::Config qw(glob2re);
sub externals_each {
my ($self, $cb, @arg) = @_;
my $cfg = $self->_lei_cfg;
my %boost;
for my $sec (grep(/\Aexternal\./, @{$cfg->{-section_order}})) {
my $loc = substr($sec, length('external.'));
$boost{$loc} = $cfg->{"$sec.boost"};
}
return \%boost if !wantarray && !$cb;
# highest boost first, but stable for alphabetic tie break
use sort 'stable';
my @order = sort { $boost{$b} <=> $boost{$a} } sort keys %boost;
if (ref($cb) eq 'CODE') {
for my $loc (@order) {
$cb->(@arg, $loc, $boost{$loc});
}
} elsif (ref($cb) eq 'HASH') {
%$cb = %boost;
}
@order; # scalar or array
}
sub ext_canonicalize {
my $location = $_[-1]; # $_[0] may be $lei
if ($location !~ m!\Ahttps?://!) {
PublicInbox::Config::rel2abs_collapsed($location);
} else {
require URI;
my $uri = URI->new($location)->canonical;
my $path = $uri->path . '/';
$path =~ tr!/!/!s; # squeeze redundant '/'
$uri->path($path);
$uri->as_string;
}
}
# get canonicalized externals list matching $loc
# $is_exclude denotes it's for --exclude
# otherwise it's for --only/--include is assumed
sub get_externals {
my ($self, $loc, $is_exclude) = @_;
return (ext_canonicalize($loc)) if -e $loc;
my @m;
my @cur = externals_each($self);
my $do_glob = !$self->{opt}->{globoff}; # glob by default
if ($do_glob && (my $re = glob2re($loc))) {
@m = grep(m!$re/?\z!, @cur);
return @m if scalar(@m);
} elsif (index($loc, '/') < 0) { # exact basename match:
@m = grep(m!/\Q$loc\E/?\z!, @cur);
return @m if scalar(@m) == 1;
} elsif ($is_exclude) { # URL, maybe:
my $canon = ext_canonicalize($loc);
@m = grep(m!\A\Q$canon\E\z!, @cur);
return @m if scalar(@m) == 1;
} else { # URL:
return (ext_canonicalize($loc));
}
if (scalar(@m) == 0) {
die "`$loc' is unknown\n";
} else {
die("`$loc' is ambiguous:\n", map { "\t$_\n" } @m, "\n");
}
}
sub canonicalize_excludes {
my ($lei, $excludes) = @_;
my %x;
for my $loc (@$excludes) {
my @l = get_externals($lei, $loc, 1);
$x{$_} = 1 for @l;
}
\%x;
}
# returns an anonymous sub which returns an array of potential results
sub complete_url_prepare {
my $argv = $_[-1]; # $_[0] may be $lei
# Workaround bash default COMP_WORDBREAKS splitting URLs to
# ['https', ':', '//', ...]. COMP_WORDBREAKS is global for all
# completions loaded, not just ours, so we can't change it.
# cf. contrib/completion/lei-completion.bash
my ($pfx, $cur) = ('', pop(@$argv) // '');
if (@$argv) {
my @x = @$argv;
if ($cur =~ /\A[:;=]\z/) { # COMP_WORDBREAKS + URL union
push @x, $cur;
$cur = '';
}
while (@x && $pfx !~ m!\A(?: (?:[\+\-]?(?:L|kw):) |
(?:(?:imap|nntp|http)s?:) |
(?:--\w?\z)|(?:-\w?\z) )!x) {
$pfx = pop(@x).$pfx;
}
}
my $re = qr!\A\Q$pfx\E(\Q$cur\E.*)!;
my $match_cb = sub {
# the "//;" here (for AUTH=ANONYMOUS) interacts badly with
# bash tab completion, strip it out for now since our commands
# work w/o it. Not sure if there's a better solution...
$_[0] =~ s!//;AUTH=ANONYMOUS\@!//!i;
# only return the part specified on the CLI
# don't duplicate if already 100% completed
$_[0] =~ $re ? ($cur eq $1 ? () : $1) : ()
};
wantarray ? ($pfx, $cur, $match_cb) : $match_cb;
}
1;