X-Git-Url: http://www.git.stargrave.org/?a=blobdiff_plain;f=t%2Fv2mirror.t;h=ebad2566605a79dbbc25d2689e67deba4564da66;hb=af0b0fb7a454470a32c452119d0392e0dedb3fe1;hp=0c66aef48d1d9473874e10e265cd662e049af3a3;hpb=678fb3c2ba03a4a284620c039717c0d94dd6106a;p=public-inbox.git diff --git a/t/v2mirror.t b/t/v2mirror.t index 0c66aef4..ebad2566 100644 --- a/t/v2mirror.t +++ b/t/v2mirror.t @@ -1,31 +1,31 @@ -# Copyright (C) 2018 all contributors +# Copyright (C) 2018-2021 all contributors # License: AGPL-3.0+ use strict; use warnings; use Test::More; +use PublicInbox::TestCommon; +use File::Path qw(remove_tree); +use Cwd qw(abs_path); +require_git(2.6); +local $ENV{HOME} = abs_path('t'); # Integration tests for HTTP cloning + mirroring -foreach my $mod (qw(Plack::Util Plack::Builder Danga::Socket - HTTP::Date HTTP::Status Search::Xapian DBD::SQLite)) { - eval "require $mod"; - plan skip_all => "$mod missing for v2mirror.t" if $@; -} -use File::Temp qw/tempdir/; +require_mods(qw(Plack::Util Plack::Builder + HTTP::Date HTTP::Status Search::Xapian DBD::SQLite)); use IO::Socket; use POSIX qw(dup2); -use PublicInbox::V2Writable; -use PublicInbox::MIME; +use_ok 'PublicInbox::V2Writable'; +use PublicInbox::InboxWritable; +use PublicInbox::Eml; use PublicInbox::Config; -use Fcntl qw(FD_CLOEXEC F_SETFD F_GETFD); # FIXME: too much setup -my $tmpdir = tempdir('pi-v2mirror-XXXXXX', TMPDIR => 1, CLEANUP => 1); -my $script = 'blib/script/public-inbox'; +my ($tmpdir, $for_destroy) = tmpdir(); my $pi_config = "$tmpdir/config"; { open my $fh, '>', $pi_config or die "open($pi_config): $!"; print $fh <<"" or die "print $pi_config: $!"; [publicinbox "v2"] - mainrepo = $tmpdir/in + inboxdir = $tmpdir/in address = test\@example.com close $fh or die "close($pi_config): $!"; @@ -39,75 +39,84 @@ $ibx->{version} = 2; my $v2w = PublicInbox::V2Writable->new($ibx, 1); ok $v2w, 'v2w loaded'; $v2w->{parallel} = 0; -my $mime = PublicInbox::MIME->new(<<''); +my $mime = PublicInbox::Eml->new(<<''); From: Me To: You Subject: a Date: Thu, 01 Jan 1970 00:00:00 +0000 +my $old_rotate_bytes = $v2w->{rotate_bytes}; +$v2w->{rotate_bytes} = 500; # force rotating for my $i (1..9) { $mime->header_set('Message-ID', "<$i\@example.com>"); $mime->header_set('Subject', "subject = $i"); ok($v2w->add($mime), "add msg $i OK"); } -$v2w->barrier; - -my %opts = ( - LocalAddr => '127.0.0.1', - ReuseAddr => 1, - Proto => 'tcp', - Listen => 1024, -); -my ($sock, $pid); -END { kill 'TERM', $pid if defined $pid }; - -$! = 0; -$sock = IO::Socket::INET->new(%opts); -ok($sock, 'sock created'); -my $fl = fcntl($sock, F_GETFD, 0); -$pid = fork; -if ($pid == 0) { - # pretend to be systemd - fcntl($sock, F_SETFD, $fl &= ~FD_CLOEXEC); - dup2(fileno($sock), 3) or die "dup2 failed: $!\n"; - $ENV{LISTEN_PID} = $$; - $ENV{LISTEN_FDS} = 1; - exec "$script-httpd", "--stdout=$tmpdir/out", "--stderr=$tmpdir/err"; - die "FAIL: $!\n"; + +my $epoch_max = $v2w->{epoch_max}; +ok($epoch_max > 0, "multiple epochs"); +$v2w->done; +{ + my $smsg = $ibx->over->get_art(1); + like($smsg->{lines}, qr/\A[0-9]+\z/, 'lines is a digit'); + like($smsg->{bytes}, qr/\A[0-9]+\z/, 'bytes is a digit'); } -ok(defined $pid, 'forked httpd process successfully'); +$ibx->cleanup; + +my $sock = tcp_server(); +ok($sock, 'sock created'); +my $cmd = [ '-httpd', '-W0', "--stdout=$tmpdir/out", "--stderr=$tmpdir/err" ]; +my $td = start_script($cmd, undef, { 3 => $sock }); my ($host, $port) = ($sock->sockhost, $sock->sockport); $sock = undef; -my @cmd = (qw(git clone --mirror -q), "http://$host:$port/v2/0", - "$tmpdir/m/git/0.git"); +my @cmd; +foreach my $i (0..$epoch_max) { + my $sfx = $i == 0 ? '.git' : ''; + @cmd = (qw(git clone --mirror -q), + "http://$host:$port/v2/$i$sfx", + "$tmpdir/m/git/$i.git"); -is(system(@cmd), 0, 'cloned OK'); -ok(-d "$tmpdir/m/git/0.git", 'mirror OK');; + is(xsys(@cmd), 0, "cloned $i.git"); + ok(-d "$tmpdir/m/git/$i.git", "mirror $i OK"); +} -@cmd = ("$script-init", '-V2', 'm', "$tmpdir/m", 'http://example.com/m', +@cmd = ("-init", '-j1', '-V2', 'm', "$tmpdir/m", 'http://example.com/m', 'alt@example.com'); -is(system(@cmd), 0, 'initialized public-inbox -V2'); -is(system("$script-index", "$tmpdir/m"), 0, 'indexed'); +ok(run_script(\@cmd), 'initialized public-inbox -V2'); +my @shards = glob("$tmpdir/m/xap*/?"); +is(scalar(@shards), 1, 'got a single shard on init'); + +ok(run_script([qw(-index -j0), "$tmpdir/m"]), 'indexed'); -my $mibx = { mainrepo => "$tmpdir/m", address => 'alt@example.com' }; +my $mibx = { inboxdir => "$tmpdir/m", address => 'alt@example.com' }; $mibx = PublicInbox::Inbox->new($mibx); is_deeply([$mibx->mm->minmax], [$ibx->mm->minmax], 'index synched minmax'); +$v2w->{rotate_bytes} = $old_rotate_bytes; for my $i (10..15) { $mime->header_set('Message-ID', "<$i\@example.com>"); $mime->header_set('Subject', "subject = $i"); ok($v2w->add($mime), "add msg $i OK"); } -$v2w->barrier; -is(system('git', "--git-dir=$tmpdir/m/git/0.git", 'fetch', '-q'), 0, - 'fetch successful'); +$v2w->done; +$ibx->cleanup; + +my $fetch_each_epoch = sub { + foreach my $i (0..$epoch_max) { + my $dir = "$tmpdir/m/git/$i.git"; + is(xsys('git', "--git-dir=$dir", 'fetch', '-q'), 0, + 'fetch successful'); + } +}; -my $mset = $mibx->search->reopen->query('m:15@example.com', {mset => 1}); +$fetch_each_epoch->(); + +my $mset = $mibx->search->reopen->mset('m:15@example.com'); is(scalar($mset->items), 0, 'new message not found in mirror, yet'); -is(system("$script-index", "$tmpdir/m"), 0, 'index updated'); +ok(run_script([qw(-index -j0), "$tmpdir/m"]), 'index updated'); is_deeply([$mibx->mm->minmax], [$ibx->mm->minmax], 'index synched minmax'); -$mset = $mibx->search->reopen->query('m:15@example.com', {mset => 1}); +$mset = $mibx->search->reopen->mset('m:15@example.com'); is(scalar($mset->items), 1, 'found message in mirror'); # purge: @@ -123,38 +132,32 @@ $mime->header_set('Subject', 'subject = 10'); is_deeply(\@subj, ["# subject = 10"], "only rewrote one"); } -$v2w->barrier; +$v2w->done; -my $msgs = $mibx->search->{over_ro}->get_thread('10@example.com'); +my $msgs = $mibx->over->get_thread('10@example.com'); my $to_purge = $msgs->[0]->{blob}; like($to_purge, qr/\A[a-f0-9]{40,}\z/, 'read blob to be purged'); -$mset = $ibx->search->reopen->query('m:10@example.com', {mset => 1}); +$mset = $ibx->search->reopen->mset('m:10@example.com'); is(scalar($mset->items), 0, 'purged message gone from origin'); -is(system('git', "--git-dir=$tmpdir/m/git/0.git", 'fetch', '-q'), 0, - 'fetch successful'); +$fetch_each_epoch->(); { - open my $err, '+>', "$tmpdir/index-err" or die "open: $!"; - my $ipid = fork; - if ($ipid == 0) { - dup2(fileno($err), 2) or die "dup2 failed: $!"; - exec("$script-index", '--prune', "$tmpdir/m"); - die "exec fail: $!"; - } - ok($ipid, 'running index..'); - is(waitpid($ipid, 0), $ipid, 'index --prune done'); - is($?, 0, 'no error from index'); - ok(seek($err, 0, 0), 'rewound stderr'); - $err = eval { local $/; <$err> }; + $ibx->cleanup; + PublicInbox::InboxWritable::cleanup($mibx); + $v2w->done; + my $cmd = [ qw(-index --prune -j0), "$tmpdir/m" ]; + my ($out, $err) = ('', ''); + my $opt = { 1 => \$out, 2 => \$err }; + ok(run_script($cmd, undef, $opt), '-index --prune'); like($err, qr/discontiguous range/, 'warned about discontiguous range'); unlike($err, qr/fatal/, 'no scary fatal error shown'); } -$mset = $mibx->search->reopen->query('m:10@example.com', {mset => 1}); +$mset = $mibx->search->reopen->mset('m:10@example.com'); is(scalar($mset->items), 0, 'purged message not found in mirror'); is_deeply([$mibx->mm->minmax], [$ibx->mm->minmax], 'minmax still synced'); for my $i ((1..9),(11..15)) { - $mset = $mibx->search->query("m:$i\@example.com", {mset => 1}); + $mset = $mibx->search->mset("m:$i\@example.com"); is(scalar($mset->items), 1, "$i\@example.com remains visible"); } is($mibx->git->check($to_purge), undef, 'unindex+prune successful in mirror'); @@ -166,10 +169,73 @@ is($mibx->git->check($to_purge), undef, 'unindex+prune successful in mirror'); is_deeply(\@warn, [], 'no warnings from index_sync after purge'); } -$v2w->done; -ok(kill('TERM', $pid), 'killed httpd'); -$pid = undef; -waitpid(-1, 0); +# deletes happen in a different fetch window +{ + $mset = $mibx->search->reopen->mset('m:1@example.com'); + is(scalar($mset->items), 1, '1@example.com visible in mirror'); + $mime->header_set('Message-ID', '<1@example.com>'); + $mime->header_set('Subject', 'subject = 1'); + ok($v2w->remove($mime), 'removed <1@example.com> from source'); + $v2w->done; + $ibx->cleanup; + $fetch_each_epoch->(); + PublicInbox::InboxWritable::cleanup($mibx); + + my $cmd = [ qw(-index -j0), "$tmpdir/m" ]; + my ($out, $err) = ('', ''); + my $opt = { 1 => \$out, 2 => \$err }; + ok(run_script($cmd, undef, $opt), 'index ran'); + is($err, '', 'no errors reported by index'); + $mset = $mibx->search->reopen->mset('m:1@example.com'); + is(scalar($mset->items), 0, '1@example.com no longer visible in mirror'); +} + +if ('sequential-shard') { + $mset = $mibx->search->mset('m:15@example.com'); + is(scalar($mset->items), 1, 'large message not indexed'); + remove_tree(glob("$tmpdir/m/xap*"), glob("$tmpdir/m/msgmap.*")); + my $cmd = [ qw(-index -j9 --sequential-shard), "$tmpdir/m" ]; + ok(run_script($cmd), '--sequential-shard works'); + my @shards = glob("$tmpdir/m/xap*/?"); + is(scalar(@shards), 8, 'got expected shard count'); + PublicInbox::InboxWritable::cleanup($mibx); + $mset = $mibx->search->mset('m:15@example.com'); + is(scalar($mset->items), 1, 'search works after --sequential-shard'); +} + +if ('max size') { + $mime->header_set('Message-ID', '<2big@a>'); + my $max = '2k'; + $mime->body_str_set("z\n" x 1024); + ok($v2w->add($mime), "add big message"); + $v2w->done; + $ibx->cleanup; + $fetch_each_epoch->(); + PublicInbox::InboxWritable::cleanup($mibx); + my $cmd = [qw(-index -j0), "$tmpdir/m", "--max-size=$max" ]; + my $opt = { 2 => \(my $err) }; + ok(run_script($cmd, undef, $opt), 'indexed with --max-size'); + like($err, qr/skipping [a-f0-9]{40,}/, 'warned about skipping message'); + $mset = $mibx->search->reopen->mset('m:2big@a'); + is(scalar($mset->items), 0, 'large message not indexed'); + + { + open my $fh, '>>', $pi_config or die; + print $fh <search->reopen->mset('m:2big@a'); + is(scalar($mset->items), 0, 'large message not re-indexed'); +} + +ok($td->kill, 'killed httpd'); +$td->join; done_testing();