Today the only thing that prevents public-inbox from reusing the
message numbers of deleted messages is the SQLite autoincrement magic,
and that only works part of the time. The new incremental indexing
test has revealed areas where public-inbox today does try to reuse
the numbers of deleted messages.
Reusing previously assigned message numbers is a problem because
if a client has already seen messages that are subsequently deleted, the
client will not see the new messages that reuse their old numbers.
In practice this is difficult to trigger because it requires the most
recently added message to be removed and have the removal show up in a
separate pull request. Still, it can happen and it should be handled.
Instead of inferring the highest number ever used by finding the maximum
number in the message map, track the largest number ever assigned directly.
Update Msgmap to track this value and update the indexers to use this
value.
Signed-off-by: "Eric W. Biederman" <ebiederm@xmission.com>
create_tables($dbh);
$dbh->begin_work;
$self->created_at(time) unless $self->created_at;
create_tables($dbh);
$dbh->begin_work;
$self->created_at(time) unless $self->created_at;
+
+ my (undef, $max) = $self->minmax();
+ $max ||= 0;
+ $self->num_highwater($max);
$self->meta_accessor('created_at', $second);
}
$self->meta_accessor('created_at', $second);
}
+sub num_highwater { # read, and optionally raise, the stored 'num_highwater' value
+ my ($self, $num) = @_; # $num is optional; call without it to only read the value
+ my $high = $self->{num_highwater} ||= # use the cached copy; a false (undef/0) cache falls through
+ $self->meta_accessor('num_highwater'); # presumably loads the persisted value -- confirm against meta_accessor
+ if (defined($num) && (!defined($high) || ($num > $high))) { # only store when nothing is known yet or $num is larger
+ $self->{num_highwater} = $num; # refresh the in-memory cache
+ $self->meta_accessor('num_highwater', $num); # presumably persists the new value -- confirm against meta_accessor
+ }
+ $self->{num_highwater}; # return value: the cached high-water mark (may be undef if never set)
+}
+
sub mid_insert {
my ($self, $mid) = @_;
my $dbh = $self->{dbh};
sub mid_insert {
my ($self, $mid) = @_;
my $dbh = $self->{dbh};
INSERT OR IGNORE INTO msgmap (mid) VALUES (?)
return if $sth->execute($mid) == 0;
INSERT OR IGNORE INTO msgmap (mid) VALUES (?)
return if $sth->execute($mid) == 0;
- $dbh->last_insert_id(undef, undef, 'msgmap', 'num');
+ my $num = $dbh->last_insert_id(undef, undef, 'msgmap', 'num');
+ $self->num_highwater($num) unless !defined($num);
+ $num;
$self->{dbh}->prepare(
'INSERT OR IGNORE INTO msgmap (num,mid) VALUES (?,?)');
};
$self->{dbh}->prepare(
'INSERT OR IGNORE INTO msgmap (num,mid) VALUES (?,?)');
};
- $sth->execute($num, $mid);
+ my $result = $sth->execute($num, $mid);
+ $self->num_highwater($num) if (defined($result) && $result == 1);
+ $result;
--no-notes --no-color --no-renames
--diff-filter=AM), $range);
++$fcount while <$fh>;
--no-notes --no-color --no-renames
--diff-filter=AM), $range);
++$fcount while <$fh>;
- my (undef, $max) = $self->{mm}->minmax;
+ my $high = $self->{mm}->num_highwater;
if (index($range, '..') < 0) {
if (index($range, '..') < 0) {
- if ($max && $max == $fcount) {
+ if ($high && $high == $fcount) {
# fix up old bugs in full indexes which caused messages to
# not appear in Msgmap
# fix up old bugs in full indexes which caused messages to
# not appear in Msgmap
- $self->{regen_up} = $max;
+ $self->{regen_up} = $high;
} else {
# normal regen is for for fresh data
$self->{regen_down} = $fcount;
}
} else {
# Give oldest messages the smallest numbers
} else {
# normal regen is for for fresh data
$self->{regen_down} = $fcount;
}
} else {
# Give oldest messages the smallest numbers
- $self->{regen_down} = $max + $fcount;
+ $self->{regen_down} = $high + $fcount;
}
$git->popen(qw/log --no-notes --no-color --no-renames
}
$git->popen(qw/log --no-notes --no-color --no-renames
my $mm_tmp = $self->{mm}->tmp_clone;
my $ranges = $opts->{reindex} ? [] : $self->last_commits($epoch_max);
my $mm_tmp = $self->{mm}->tmp_clone;
my $ranges = $opts->{reindex} ? [] : $self->last_commits($epoch_max);
- my ($min, $max) = $mm_tmp->minmax;
+ my $high = $self->{mm}->num_highwater();
my $regen = $self->index_prepare($opts, $epoch_max, $ranges);
my $regen = $self->index_prepare($opts, $epoch_max, $ranges);
- $$regen += $max if $max;
+ $$regen += $high if $high;
my $D = {}; # "$mid\0$cid" => $oid
my @cmd = qw(log --raw -r --pretty=tformat:%H
--no-notes --no-color --no-abbrev --no-renames);
my $D = {}; # "$mid\0$cid" => $oid
my @cmd = qw(log --raw -r --pretty=tformat:%H
--no-notes --no-color --no-abbrev --no-renames);