#!/usr/bin/perl -w # Copyright (C) 2015-2018 all contributors # License: AGPL-3.0+ # Basic tool to create a Xapian search index for a git repository # configured for public-inbox. # Usage with libeatmydata # highly recommended: eatmydata public-inbox-index GIT_DIR use strict; use warnings; use Getopt::Long qw(:config gnu_getopt no_ignore_case auto_abbrev); use Cwd 'abs_path'; my $usage = "public-inbox-index GIT_DIR"; use PublicInbox::Config; my $config = eval { PublicInbox::Config->new } || eval { warn "public-inbox unconfigured for serving, indexing anyways...\n"; {} }; eval { require PublicInbox::SearchIdx }; if ($@) { print STDERR "Search::Xapian required for $0\n"; exit 1; } my $reindex; my %opts = ( '--reindex' => \$reindex ); GetOptions(%opts) or die "bad command-line args\n$usage"; my @dirs; sub resolve_git_dir { my ($cd) = @_; my @cmd = qw(git rev-parse --git-dir); my $cmd = join(' ', @cmd); my $pid = open my $fh, '-|'; defined $pid or die "forking $cmd failed: $!\n"; if ($pid == 0) { if (defined $cd) { chdir $cd or die "chdir $cd failed: $!\n"; } exec @cmd; die "Failed to exec $cmd: $!\n"; } else { my $dir = eval { local $/; <$fh>; }; close $fh or die "error in $cmd: $!\n"; chomp $dir; return abs_path($cd) if ($dir eq '.' && defined $cd); abs_path($dir); } } if (@ARGV) { @dirs = map { resolve_git_dir($_) } @ARGV; } else { @dirs = (resolve_git_dir()); } sub usage { print STDERR "Usage: $usage\n"; exit 1 } usage() unless @dirs; foreach my $k (keys %$config) { $k =~ /\Apublicinbox\.([^\.]+)\.mainrepo\z/ or next; my $name = $1; my $v = $config->{$k}; for my $i (0..$#dirs) { next if $dirs[$i] ne $v; my $ibx = $config->lookup_name($name); $dirs[$i] = $ibx if $ibx; } } foreach my $dir (@dirs) { index_dir($dir); } sub index_dir { my ($git_dir) = @_; if (!ref $git_dir && ! -d $git_dir) { die "$git_dir does not appear to be a git repository\n"; } my $s = PublicInbox::SearchIdx->new($git_dir, 1); $s->index_sync({ reindex => $reindex }); }