# Copyright (C) 2018-2020 all contributors
# License: AGPL-3.0+
use strict;
use warnings;
use Test::More;
use PublicInbox::MIME;
use PublicInbox::ContentId qw(content_digest);
use PublicInbox::TestCommon;
use Cwd qw(abs_path);
require_git(2.6);
require_mods(qw(DBD::SQLite Search::Xapian));
# Point HOME at the absolute path of 't' for the duration of the test.
local $ENV{HOME} = abs_path('t');
use_ok('PublicInbox::V2Writable');

# With this umask, new files come out 0660 and directories 0770;
# the permission checks further down rely on that.
umask(007);
my ($inboxdir, $for_destroy) = tmpdir();

# A v2 inbox rooted in the temporary directory.
my $ibx = PublicInbox::Inbox->new({
	inboxdir => $inboxdir,
	name => 'test-v2writable',
	version => 2,
	-primary_address => 'test@example.com',
});

# The message that is added, mutated and re-added throughout this file.
my @mime_hdr = (
	From => 'a@example.com',
	To => 'test@example.com',
	Subject => 'this is a subject',
	'Message-ID' => '',
	Date => 'Fri, 02 Oct 1993 00:00:00 +0000',
);
my $mime = PublicInbox::MIME->create(
	header => \@mime_hdr,
	body => "hello world\n",
);

# nproc => 1 is expected to force a single shard.
my $im = PublicInbox::V2Writable->new($ibx, { nproc => 1 });
is($im->{shards}, 1, 'one shard when forced');
ok($im->add($mime), 'ordinary message added');
# Check the permission bits of msgmap.sqlite3 and of everything matched
# one and two levels below xap*: 0660 for regular files, 0770 otherwise.
my @perm_paths = (
	"$inboxdir/msgmap.sqlite3",
	glob("$inboxdir/xap*/*"),
	glob("$inboxdir/xap*/*/*"),
);
for my $path (@perm_paths) {
	my $raw_mode = (stat($path))[2];
	my $base = (split(m!/!, $path))[-1];
	# "_" reuses the result of the stat() call just above
	my $want = -f _ ? 0660 : 0770;
	is($raw_mode & 07777, $want,
		"default sharedRepository respected for $base");
}
# $git0 is declared at file scope because later blocks read git history
# through it.
my $git0;

# The string condition is always true; it only labels the block.
if ('ensure git configs are correct') {
	my $all_cfg = "$inboxdir/all.git/config";
	my $rc = system('git', 'config', "--file=$all_cfg",
			'core.sharedRepository', '0644');
	is($rc, 0, "set sharedRepository in all.git");

	# Settings written to all.git must be visible from epoch 0.
	$git0 = PublicInbox::Git->new("$inboxdir/git/0.git");
	my $shared = $git0->qx('config', 'core.sharedRepository');
	chomp($shared);
	is($shared, '0644', 'child repo inherited core.sharedRepository');

	my $bitmaps = $git0->qx('config', '--bool', 'repack.writeBitmaps');
	chomp($bitmaps);
	is($bitmaps, 'true', 'child repo inherited repack.writeBitmaps');
}
{
	# Duplicate detection and Message-ID generation.  Each step mutates
	# $mime and relies on what earlier steps stored, so order matters.
	# NOTE(review): every Message-Id value set in this block is an empty
	# string; confirm these are the intended values and were not
	# stripped from the file.
	my @warn;
	# capture warnings from ->add so each step can assert on them
	local $SIG{__WARN__} = sub { push @warn, @_ };
	is($im->add($mime), undef, 'obvious duplicate rejected');
	is(scalar(@warn), 0, 'no warning about resent message');

	# two Message-Id headers, same content as before
	@warn = ();
	$mime->header_set('Message-Id', '', '');
	is($im->add($mime), undef, 'secondary MID ignored if first matches');

	# a copy with the Date header cleared (header_set without a value)
	my $sec = PublicInbox::MIME->new($mime->as_string);
	$sec->header_set('Date');
	$sec->header_set('Message-Id', '', '');
	ok($im->add($sec), 'secondary MID used if data is different');
	like(join(' ', @warn), qr/mismatched/, 'warned about mismatch');
	like(join(' ', @warn), qr/alternative/, 'warned about alternative');
	# got first, expected second, so failure diagnostics are labelled
	# correctly
	is_deeply([ $sec->header_obj->header_raw('Message-Id') ],
		[ '', '' ],
		'no new Message-Id added');

	my $sane_mid = qr/\A<[\w\-\.]+\@\w+>\z/;

	# same Message-Id, different body: a second Message-Id gets appended
	@warn = ();
	$mime->header_set('Message-Id', '');
	$mime->body_set('different');
	ok($im->add($mime), 'reused mid ok');
	like(join(' ', @warn), qr/reused/, 'warned about reused MID');
	my @mids = $mime->header_obj->header_raw('Message-Id');
	is($mids[0], '', 'original mid not changed');
	like($mids[1], $sane_mid, 'new MID added');
	is(scalar(@mids), 2, 'only one new MID added');

	# Add a message that already carries the digest-derived Message-Id
	# for $mime's content, then add $mime itself.
	@warn = ();
	$mime->header_set('Message-Id', '');
	$mime->body_set('this one needs a random mid');
	my $hdr = $mime->header_obj;
	my $gen = PublicInbox::Import::digest2mid(content_digest($mime), $hdr);
	unlike($gen, qr![\+/=]!, 'no URL-unfriendly chars in Message-Id');
	my $fake = PublicInbox::MIME->new($mime->as_string);
	$fake->header_set('Message-Id', "<$gen>");
	ok($im->add($fake), 'fake added easily');
	is_deeply(\@warn, [], 'no warnings from a faker');
	ok($im->add($mime), 'random MID made');
	like(join(' ', @warn), qr/using random/, 'warned about using random');
	@mids = $mime->header_obj->header_raw('Message-Id');
	is($mids[0], '', 'original mid not changed');
	like($mids[1], $sane_mid, 'new MID added');
	is(scalar(@mids), 2, 'only one new MID added');

	# no Message-Id header at all: exactly one is generated
	@warn = ();
	$mime->header_set('Message-Id');
	ok($im->add($mime), 'random MID made for MID free message');
	@mids = $mime->header_obj->header_raw('Message-Id');
	like($mids[0], $sane_mid, 'mid was generated');
	is(scalar(@mids), 1, 'new generated');
}
{
	# One message carrying two Message-IDs plus an X-Alt-Message-Id must
	# be reachable through each of them.  The header values have to
	# match the "m:" queries and the get_thread() lookups below.
	$mime->header_set('Message-Id', '<abcde@1>', '<abcde@2>');
	$mime->header_set('X-Alt-Message-Id', '<alt-id-for-nntp>');
	# NOTE(review): the References value is empty here and cannot be
	# derived from the rest of this block -- confirm the intended value.
	$mime->header_set('References', '');
	ok($im->add($mime), 'message with multiple Message-ID');
	$im->done;

	my ($total, undef) = $ibx->over->recent;
	is($ibx->mm->num_highwater, $total, 'got expected highwater value');

	my $srch = $ibx->search;
	my $mset1 = $srch->reopen->query('m:abcde@1', { mset => 1 });
	is($mset1->size, 1, 'message found by first MID');
	my $mset2 = $srch->reopen->query('m:abcde@2', { mset => 1 });
	is($mset2->size, 1, 'message found by second MID');
	# Only compare docids when both result sets are non-empty; calling
	# get_docid on a missing first item would abort the whole script
	# instead of recording a failure.
	if ($mset1->size && $mset2->size) {
		is((($mset1->items)[0])->get_docid,
			(($mset2->items)[0])->get_docid,
			'same document');
	}

	my $alt = $srch->reopen->query('m:alt-id-for-nntp', { mset => 1 });
	is($alt->size, 1, 'message found by alt MID (NNTP)');
	if ($alt->size && $mset1->size) {
		is((($alt->items)[0])->get_docid,
			(($mset1->items)[0])->get_docid,
			'same document');
	}

	# drop the header again (header_set without a value)
	$mime->header_set('X-Alt-Message-Id');

	# Each of the three IDs must resolve to the same set of article
	# numbers in the overview DB.
	my %uniq;
	for my $mid (qw(abcde@1 abcde@2 alt-id-for-nntp)) {
		my $msgs = $ibx->over->get_thread($mid);
		my $key = join(' ', sort(map { $_->{num} } @$msgs));
		$uniq{$key}++;
	}
	is(scalar(keys(%uniq)), 1, 'all alt Message-ID queries give same smsg');
	is_deeply([values(%uniq)], [3], '3 queries, 3 results');
}
{
	# Query the inbox through an NNTP server and cross-check the results
	# of XOVER, XHDR, NEWNEWS, LISTGROUP and XROVER against each other.
	use Net::NNTP;
	my $err = "$inboxdir/stderr.log";
	my $out = "$inboxdir/stdout.log";
	my $group = 'inbox.comp.test.v2writable';
	my $pi_config = "$inboxdir/pi_config";
	# NOTE(review): the print statement below looks truncated.  The
	# config text written to $pi_config and the declarations of $sock,
	# $cmd and $env (all used right after it) are missing from this
	# copy and must be restored from the upstream file; they are left
	# untouched here rather than guessed at.
	open my $fh, '>', $pi_config or die "open: $!\n";
	print $fh < $pi_config };
	my $td = start_script($cmd, $env, { 3 => $sock });
	my $host_port = $sock->sockhost . ':' . $sock->sockport;
	my $n = Net::NNTP->new($host_port);
	$n->group($group);

	# Every article must have a unique Message-ID, and XHDR must agree
	# with XOVER whether addressed by article number or by Message-ID.
	my $x = $n->xover('1-');
	my %uniq;
	foreach my $num (sort { $a <=> $b } keys %$x) {
		my $mid = $x->{$num}->[3];
		is($uniq{$mid}++, 0, "MID for $num is unique in XOVER");
		is_deeply($n->xhdr('Message-ID', $num),
			{ $num => $mid }, "XHDR lookup OK on num $num");
		is_deeply($n->xhdr('Message-ID', $mid),
			{ $mid => $mid }, "XHDR lookup OK on MID $num");
	}

	my %nn;
	foreach my $mid (@{$n->newnews(0, $group)}) {
		is($nn{$mid}++, 0, "MID is unique in NEWNEWS");
	}
	is_deeply([sort keys %nn], [sort keys %uniq],
		'NEWNEWS and XOVER return the same Message-IDs');

	my %lg;
	foreach my $num (@{$n->listgroup($group)}) {
		is($lg{$num}++, 0, "num is unique in LISTGROUP");
	}
	is_deeply([sort keys %lg], [sort keys %$x],
		'XOVER and LISTGROUPS return the same article numbers');

	# Ranged header lookups must cover the same article numbers.
	my $xref = $n->xhdr('Xref', '1-');
	is_deeply([sort keys %lg], [sort keys %$xref], 'Xref range OK');
	# compare against the Message-ID result itself, not $xref again
	my $mids = $n->xhdr('Message-ID', '1-');
	is_deeply([sort keys %lg], [sort keys %$mids], 'Message-ID range OK');
	my $rover = $n->xrover('1-');
	is_deeply([sort keys %lg], [sort keys %$rover], 'XROVER range OK');
};
{
	# Remove $mime and verify that the removal shows up in git, Msgmap,
	# Xapian and the overview DB, and that repeating it changes nothing.
	my @log_args = qw(log --no-decorate --no-abbrev --no-notes --no-color);
	my @oneline_before = $git0->qx(@log_args, '--pretty=oneline');
	my $raw_before = $git0->qx(@log_args, qw(--pretty=raw --raw -r));

	# nproc => 2 is requested, but the existing shard count wins
	$im = PublicInbox::V2Writable->new($ibx, { nproc => 2 });
	is($im->{shards}, 1, 'detected single shard from previous');
	my $removed = $im->remove($mime, 'test removal');
	$im->done;

	# exactly one new commit, carrying the message given to ->remove
	my @oneline_after = $git0->qx(@log_args, '--pretty=oneline');
	my $newest = shift(@oneline_after);
	like($newest, qr/\A[a-f0-9]+ test removal\n\z/s,
		'commit message propagated to git');
	is_deeply(\@oneline_after, \@oneline_before,
		'only one commit written to git');

	my $mm = $ibx->mm;
	is($mm->num_for($removed->mid), undef, 'no longer in Msgmap by mid');
	my $artnum = $removed->{num};
	like($artnum, qr/\A\d+\z/, 'numeric number in return message');
	is($ibx->mm->mid_for($artnum), undef, 'no longer in Msgmap by num');

	my $search = $ibx->search->reopen;
	my $hits = $search->query('m:' . $removed->mid, { mset => 1 });
	is($hits->size, 0, 'no longer found in Xapian');
	my @log_tip = (@log_args, qw(-1 --pretty=raw --raw -r --no-renames));
	is($search->{over_ro}->get_art($artnum), undef,
		'removal propagated to Over DB');

	# The blob added under "d" by the removal commit must already
	# appear in the history captured before the removal.
	my $raw_after = $git0->qx(@log_tip);
	my ($blob) = ($raw_after =~ m!( [a-f0-9]+ )A\td$!m);
	if (defined $blob) {
		ok(index($raw_before, $blob) > 0, 'no new blob introduced');
	} else {
		fail('failed to extract blob from log output');
	}

	is($im->remove($mime, 'test removal'), undef,
		'remove is idempotent');
	$im->done;
	my $raw_again = $git0->qx(@log_tip);
	is($raw_again, $raw_after,
		'no git history made with idempotent remove');
	eval { $im->done };
	ok(!$@, '->done is idempotent');
}
{
	# Add a message, purge it, then check that purging again is a no-op.
	ok($im->add($mime), 'add message to be purged');
	# warnings are silenced for the rest of this block
	local $SIG{__WARN__} = sub {};
	my $cmts = $im->purge($mime);
	ok($cmts, 'purged message');
	like($cmts->[0], qr/\A[a-f0-9]{40}\z/, 'purge returned current commit');
	$im->done;

	# second attempt: nothing left to purge
	my $again = $im->purge($mime);
	is($again, undef, 'no-op returns undef');
}
{
	# Message-ID and References values of 250 characters are expected
	# to be stored truncated to 244 characters in the overview DB.
	my $x = 'x'x250;
	my $y = 'y'x250;
	# warnings are silenced for the rest of this block
	local $SIG{__WARN__} = sub {};
	$mime->header_set('Subject', 'long mid');
	$mime->header_set('Message-ID', "<$x>");
	ok($im->add($mime), 'add excessively long Message-ID');
	$mime->header_set('Message-ID', "<$y>");
	$mime->header_set('References', "<$x>");
	ok($im->add($mime), 'add excessively long References');
	$im->barrier;

	my $msgs = $ibx->search->{over_ro}->get_thread('x'x244);
	# got first, expected second, so failure diagnostics are labelled
	# correctly
	is(scalar(@$msgs), 2, 'got both messages');
	is($msgs->[0]->{mid}, 'x'x244, 'stored truncated mid');
	is($msgs->[1]->{references}, '<'.('x'x244).'>', 'stored truncated ref');
	is($msgs->[1]->{mid}, 'y'x244, 'stored truncated mid(2)');
	$im->done;
}
# Inbox description pointing below a directory that does not exist yet.
# It is reused by the block that follows.
my $tmp = {
	inboxdir => "$inboxdir/non-existent/subdir",
	name => 'nope',
	version => 2,
	-primary_address => 'test@example.com',
};

# Without the creat flag, constructing the writer or adding a message
# must throw.
eval { PublicInbox::V2Writable->new($tmp)->add($mime) };
ok($@, 'V2Writable fails on non-existent dir');
{
	# With the creat flag the inbox is initialized; adding an epoch must
	# then keep the existing alternates entries and the file mode.
	my $v2w = PublicInbox::V2Writable->new($tmp, 1);
	ok($v2w, 'creat flag works');
	$v2w->{parallel} = 0;
	$v2w->init_inbox(0);

	my $alt = "$tmp->{inboxdir}/all.git/objects/info/alternates";
	# reads the whole alternates file in one go
	my $slurp_alt = sub {
		open my $in, '<', $alt or die $!;
		my $buf = do { local $/; <$in> };
		return $buf;
	};

	# append an extra entry and set the mode to 0664 before the epoch
	# is added
	open my $fh, '>>', $alt or die $!;
	print {$fh} "$inboxdir/all.git/objects\n" or die $!;
	chmod(0664, $fh) or die "fchmod: $!";
	close $fh or die $!;

	my $before = $slurp_alt->();
	ok($v2w->git_init(3), 'init a new epoch');
	my $after = $slurp_alt->();

	# "> 0" on purpose: the old text must come after the new first line
	ok(index($after, $before) > 0,
		'old contents preserved after adding epoch');
	like($after, qr!\A[^\n]+?/3\.git/objects\n!s,
		'first line is newest epoch');
	my $mode = (stat($alt))[2] & 07777;
	is($mode, 0664, sprintf('0%03o', $mode).' is 0664');
}
done_testing();