1 # Copyright (C) 2020-2021 all contributors <meta@public-inbox.org>
2 # License: AGPL-3.0+ <https://www.gnu.org/licenses/agpl-3.0.txt>
4 # internal class used by PublicInbox::Git + PublicInbox::DS
5 # This parses the output pipe of "git cat-file --batch"
6 package PublicInbox::GitAsyncCat;
8 use parent qw(PublicInbox::DS Exporter);
10 use PublicInbox::Syscall qw(EPOLLIN EPOLLET);
11 our @EXPORT = qw(ibx_async_cat ibx_async_prefetch);
12 use PublicInbox::Git ();
14 our $GCF2C; # singleton PublicInbox::Gcf2Client
18 if (my $git = delete $self->{git}) {
21 $self->SUPER::close; # PublicInbox::DS::close
26 my $git = $self->{git} or return;
27 return $self->close if ($git->{in} // 0) != ($self->{sock} // 1);
28 my $inflight = $git->{inflight};
29 if ($inflight && @$inflight) {
30 $git->cat_async_step($inflight);
33 if (($git->{in} // 0) != ($self->{sock} // 1)) {
35 } elsif (@$inflight || exists $git->{rbuf}) {
36 # ok, more to do, requeue for fairness
39 } elsif ((my $pid = waitpid($git->{pid}, WNOHANG)) > 0) {
40 # May happen if the child process is killed by a BOFH
43 warn "E: git $pid exited with \$?=$?\n";
51 PublicInbox::DS::add_timer(3, \&git_tmp_cleanup, $git);
54 sub ibx_async_cat ($$$$) {
55 my ($ibx, $oid, $cb, $arg) = @_;
56 my $git = $ibx->{git} // $ibx->git;
57 # {topdir} means ExtSearch (likely [extindex "all"]) with potentially
58 # 100K alternates. git(1) has a proposed patch for 100K alternates:
59 # <https://lore.kernel.org/git/20210624005806.12079-1-e@80x24.org/>
60 if (!defined($ibx->{topdir}) && !defined($git->{-tmp}) &&
62 require PublicInbox::Gcf2Client;
63 PublicInbox::Gcf2Client::new();
64 } // 0)) { # 0: do not retry if libgit2 or Inline::C are missing
65 $GCF2C->gcf2_async(\"$oid $git->{git_dir}\n", $cb, $arg);
67 } else { # read-only end of git-cat-file pipe
68 $git->cat_async($oid, $cb, $arg);
69 $git->{async_cat} //= do {
70 my $self = bless { git => $git }, __PACKAGE__;
71 $git->{in}->blocking(0);
72 $git->{-tmp} and PublicInbox::DS::add_uniq_timer(
73 3, \&git_tmp_cleanup, $git);
74 $self->SUPER::new($git->{in}, EPOLLIN|EPOLLET);
75 \undef; # this is a true ref()
80 # this is safe to call inside $cb, but is not guaranteed to enqueue;
81 # it returns true if successful, undef if not.  For fairness, we only
82 # prefetch if there are no in-flight requests.
83 sub ibx_async_prefetch {
84 my ($ibx, $oid, $cb, $arg) = @_;
86 if (!defined($ibx->{topdir}) && $GCF2C) {
87 if (!@{$GCF2C->{inflight} // []}) {
88 $oid .= " $git->{git_dir}\n";
89 return $GCF2C->gcf2_async(\$oid, $cb, $arg); # true
91 } elsif ($git->{async_cat} && (my $inflight = $git->{inflight})) {
93 print { $git->{out} } $oid, "\n" or
94 $git->fail("write error: $!");
95 return push(@$inflight, $oid, $cb, $arg);