1 # Copyright (C) 2018 all contributors <meta@public-inbox.org>
2 # License: AGPL-3.0+ <https://www.gnu.org/licenses/agpl-3.0.txt>
3 package PublicInbox::SearchIdxSkeleton;
6 use base qw(PublicInbox::SearchIdx);
7 use Storable qw(freeze thaw);
10 my ($class, $v2writable) = @_;
11 my $self = $class->SUPER::new($v2writable->{-inbox}, 1, 'skel');
15 $self->spawn_worker($v2writable) if $v2writable->{parallel};
20 my ($self, $v2writable) = @_;
22 pipe($r, $w) or die "pipe failed: $!\n";
23 my ($barrier_wait, $barrier_note);
24 pipe($barrier_wait, $barrier_note) or die "pipe failed: $!\n";
25 binmode $_, ':raw' foreach ($r, $w, $barrier_wait, $barrier_note);
27 defined $pid or die "fork failed: $!\n";
29 $v2writable->atfork_child;
33 eval { skeleton_worker_loop($self, $r, $barrier_note) };
34 die "skeleton worker died: $@\n" if $@;
41 $self->{barrier_wait} = $barrier_wait;
45 # lock only exists in parent, not in worker
46 $self->{lock_path} = $self->xdir . '/pi-v2-skeleton.lock';
# Command loop of the skeleton worker process.
# Reads newline-terminated commands from $r (via getline, until it returns
# a false value) and applies them to $self.  $barrier_note is the handle on
# which "barrier_done\n" is written once every pending barrier key has been
# cleared.
# Dies on protocol errors: unexpected barrier state, a failed or short
# read, a thaw failure, or a failed write to $barrier_note.
49 sub skeleton_worker_loop {
50 my ($self, $r, $barrier_note) = @_;
# flush after every print so the "barrier_done" note is not held in a buffer
51 $barrier_note->autoflush(1);
# set the program name reported for this process
52 $0 = 'pi-v2-skeleton';
53 $self->begin_txn_lazy;
55 while (my $line = $r->getline) {
56 if ($line eq "commit\n") {
57 $self->commit_txn_lazy;
58 } elsif ($line eq "close\n") {
60 } elsif ($line =~ /\Abarrier_init (\d+)\n\z/) {
# only one barrier may be outstanding at a time
62 die "barrier in-progress\n" if defined $barrier;
# one key per integer in 0..$n; each "barrier N" command removes one key
63 $barrier = { map { $_ => 1 } (0..$n) };
64 } elsif ($line =~ /\Abarrier (\d+)\n\z/) {
66 die "no barrier in-progress\n" unless defined $barrier;
# delete returns the stored 1 for a known key, undef (=> die) otherwise
67 delete $barrier->{$1} or die "unknown barrier: $part\n";
68 if ((scalar keys %$barrier) == 0) {
# last outstanding key cleared: commit first, then notify the waiter
70 $self->commit_txn_lazy;
71 print $barrier_note "barrier_done\n" or die
72 "print failed to barrier note: $!";
# "D <oid> <mid>": oid is 40 or more lowercase hex characters; /s lets the
# second field contain newlines
74 } elsif ($line =~ /\AD ([a-f0-9]{40,}) (.*)\n\z/s) {
75 my ($oid, $mid) = ($1, $2);
76 $self->begin_txn_lazy;
77 $self->remove_by_oid($oid, $mid);
# read returns 0 at EOF and undef on error; both are fatal here
# presumably $len was parsed from the command line -- TODO confirm
80 my $n = read($r, my $msg, $len) or die "read: $!\n";
81 $n == $len or die "short read: $n != $len\n";
82 $msg = thaw($msg); # should raise on error
83 defined $msg or die "failed to thaw buffer\n";
84 $self->begin_txn_lazy;
# an indexing failure is only warned about, so the loop keeps running
85 eval { index_skeleton_real($self, $msg) };
# NOTE(review): index_skeleton_real pops elements off the array it is given,
# so $msg->[-1] here may no longer be the element it was before the call --
# confirm the warning prints the intended field
86 warn "failed to index message <$msg->[-1]>: $@\n" if $@;
92 # called by a partition worker
94 my ($self, $values) = @_;
95 if (my $w = $self->{w}) {
97 my $str = freeze($values);
98 $str = length($str) . "\n" . $str;
100 # multiple processes write to the same pipe, so use flock
101 # We can't avoid this lock for <=PIPE_BUF writes, either,
102 # because those atomic writes can break up >PIPE_BUF ones
104 print $w $str or $err = $!;
107 die "print failed: $err\n" if $err;
109 $self->begin_txn_lazy;
110 index_skeleton_real($self, $values);
115 my ($self, $oid, $mid) = @_;
118 eval { $self->SUPER::remote_remove($oid, $mid) };
124 # values: [ TS, NUM, BYTES, LINES, MID, XPATH, doc_data ]
# Build a document from $values and link it into the index.
# $values is an array ref and is modified in place: its last three elements
# (doc_data, xpath and mids, popped in that order) are removed, and the
# remaining elements are passed to add_values.
125 sub index_skeleton_real ($$) {
126 my ($self, $values) = @_;
# strip the trailing elements before the rest is handed to add_values
127 my $doc_data = pop @$values;
128 my $xpath = pop @$values;
129 my $mids = pop @$values;
# PublicInbox::Search::TS is used as an index into the remaining array
130 my $ts = $values->[PublicInbox::Search::TS];
131 my $smsg = PublicInbox::SearchMsg->new(undef);
132 my $doc = $smsg->{doc};
133 PublicInbox::SearchIdx::add_values($doc, $values);
134 $doc->set_data($doc_data);
136 $smsg->load_from_data($doc_data);
137 my $num = $values->[PublicInbox::Search::NUM];
# collect the contents of every <...> token in the references string
138 my @refs = ($smsg->references =~ /<([^>]+)>/g);
139 $self->link_and_save($doc, $mids, \@refs, $num, $xpath);
142 # write to the subprocess
144 my ($self, $nparts) = @_;
145 my $w = $self->{w} or return;
148 print $w "barrier_init $nparts\n" or $err = "failed to write: $!\n";
155 my $bw = $self->{barrier_wait} or return;
156 my $l = $bw->getline;
157 $l eq "barrier_done\n" or die "bad response from barrier_wait: $l\n";