# data notes:
# * NNTP article numbers are UIDs and message sequence numbers (MSNs)
# * Message sequence numbers (MSNs) can be stable since we're read-only.
-# Most IMAP clients use UIDs (I hope), and we can return a dummy
-# message if a client requests a non-existent MSN.
+# Most IMAP clients use UIDs (I hope). We may return a dummy message
+# in the future if a client requests a non-existent MSN, but that seems
+# unnecessary with mutt.
package PublicInbox::IMAP;
use strict;
use PublicInbox::GitAsyncCat;
use Text::ParseWords qw(parse_line);
use Errno qw(EAGAIN);
+use Time::Local qw(timegm);
+use POSIX qw(strftime);
my $Address;
for my $mod (qw(Email::Address::XS Mail::Address)) {
my $valid_range = '[0-9]+|[0-9]+:[0-9]+|[0-9]+:\*';
$valid_range = qr/\A(?:$valid_range)(?:,(?:$valid_range))*\z/;
+my @MoY = qw(Jan Feb Mar Apr May Jun Jul Aug Sep Oct Nov Dec);
+my %MoY;
+@MoY{@MoY} = (0..11);
+
sub greet ($) {
my ($self) = @_;
my $capa = capa($self);
join('', @hold);
}
-sub dummy_message ($$) {
- my ($self, $seqno) = @_;
- my $ret = <<EOF;
-From: nobody\@localhost\r
-To: nobody\@localhost\r
-Date: Thu, 01 Jan 1970 00:00:00 +0000\r
-Message-ID: <dummy-$seqno\@$self->{ibx}->{newsgroup}>\r
-Subject: dummy message #$seqno\r
-\r
-You're seeing this message because your IMAP client didn't use UIDs.\r
-The message which used to use this sequence number was likely spam\r
-and removed by the administrator.\r
-EOF
- \$ret;
-}
-
sub requeue_once ($) {
my ($self) = @_;
# COMPRESS users all share the same DEFLATE context.
if (!defined($oid)) {
# it's possible to have TOCTOU if an admin runs
# public-inbox-(edit|purge), just move onto the next message
- return requeue_once($self) unless defined $want->{-seqno};
- $bref = dummy_message($self, $smsg->{num});
+ return requeue_once($self);
} else {
$smsg->{blob} eq $oid or die "BUG: $smsg->{blob} != $oid";
}
requeue_once($self);
}
+# Restrict the UID range referenced by $beg and $end (scalar refs,
+# updated in place) to the UID_BLOCK-sized window which starts at
+# $self->{uid_min}.  Does nothing when {uid_min} is unset (or zero).
+sub uid_clamp ($$$) {
+	my ($self, $beg, $end) = @_;
+	my $lo = $self->{uid_min};
+	return unless $lo;
+	my $hi = $lo + UID_BLOCK - 1;
+	$$beg = $lo if $$beg < $lo;
+	$$end = $hi if $$end > $hi;
+}
+
sub range_step ($$) {
my ($self, $range_csv) = @_;
my ($beg, $end, $range);
} elsif ($range =~ /\A([0-9]+):\*\z/) {
$beg = $1 + 0;
$end = $self->{ibx}->mm->max // 0;
+ my $uid_end = ($self->{uid_min} // 1) - 1 + UID_BLOCK;
+ $end = $uid_end if $end > $uid_end;
$beg = $end if $beg > $end;
} elsif ($range =~ /\A[0-9]+\z/) {
$beg = $end = $range + 0;
} else {
return 'BAD fetch range';
}
- if (defined($range) && (my $uid_min = $self->{uid_min})) {
- my $uid_end = $uid_min + UID_BLOCK - 1;
- $beg = $uid_min if $beg < $uid_min;
- $end = $uid_end if $end > $uid_end;
- }
+ uid_clamp($self, \$beg, \$end) if defined($range);
[ $beg, $end, $$range_csv ];
}
$args; # error
}
-sub seq_fetch_m { # long_response
- my ($self, $tag, $msgs, $range_info, $want) = @_;
- while (!@$msgs) { # rare
- if (my $end = refill_range($self, $msgs, $range_info)) {
- $self->write(\"$tag $end\r\n");
- return;
- }
- }
- my $seq = $want->{-seqno}++;
- my $cur_num = $msgs->[0]->{num};
- if ($cur_num == $seq) { # as expected
- git_async_cat($self->{ibx}->git, $msgs->[0]->{blob},
- \&uid_fetch_cb, \@_);
- } elsif ($cur_num > $seq) {
- # send dummy messages until $seq catches up to $cur_num
- my $smsg = bless { num => $seq, ts => 0 }, 'PublicInbox::Smsg';
- unshift @$msgs, $smsg;
- my $bref = dummy_message($self, $seq);
- uid_fetch_cb($bref, undef, undef, undef, \@_);
- $smsg; # blessed response since uid_fetch_cb requeues
- } else { # should not happen
- die "BUG: cur_num=$cur_num < seq=$seq";
- }
-}
-
-sub cmd_fetch ($$$;@) {
- my ($self, $tag, $range_csv, @want) = @_;
- my $args = fetch_common($self, $tag, $range_csv, \@want);
- ref($args) eq 'ARRAY' ? do {
- my $want = $args->[-1];
- $want->{-seqno} = $args->[2]->[0]; # $beg == $range_info->[0];
- long_response($self, \&seq_fetch_m, @$args)
- } : $args; # error
+# Parse an IMAP search date (e.g. "02-Oct-1993") into seconds since the
+# Unix epoch at 00:00:00 UTC of that day.
+# Returns undef (empty list in list context) if $date_text is malformed
+# or names a day which does not exist (e.g. "31-Feb-2020", "00-Jan-2020").
+sub parse_date ($) { # 02-Oct-1993
+	my ($date_text) = @_;
+	my ($dd, $mon, $yyyy) = split(/-/, $date_text, 3);
+	defined($yyyy) or return;
+	# ABNF string literals are case-insensitive: accept "oct" and "OCT"
+	my $mm = $MoY{ucfirst(lc($mon))} // return;
+	$dd =~ /\A[0123]?[0-9]\z/ or return;
+	$yyyy =~ /\A[0-9]{4,}\z/ or return; # Y10K-compatible!
+	# timegm croaks on impossible days which still pass the regexp
+	# above; trap that so the caller can answer BAD instead of dying
+	local $@;
+	my $t = eval { timegm(0, 0, 0, $dd, $mm, $yyyy) };
+	defined($t) ? $t : ();
}
-sub uid_search_all { # long_response
- my ($self, $tag, $num) = @_;
- my $uids = $self->{ibx}->mm->ids_after($num);
- if (scalar(@$uids)) {
+# long_response callback for UID SEARCH: emits the UIDs returned by
+# over->uid_range($$beg, $end, $sql), each preceded by a space.
+# $beg is a scalar ref which is advanced to one past the last UID
+# emitted; once no UIDs are returned, the CRLF and the tagged
+# "OK Search done" line are written instead.
+sub uid_search_uid_range { # long_response
+ my ($self, $tag, $beg, $end, $sql) = @_;
+ my $uids = $self->{ibx}->over->uid_range($$beg, $end, $sql);
+ if (@$uids) {
+ $$beg = $uids->[-1] + 1;
$self->msg_more(join(' ', '', @$uids));
} else {
$self->write(\"\r\n$tag OK Search done\r\n");
}
}
-sub uid_search_uid_range { # long_response
- my ($self, $tag, $beg, $end) = @_;
- my $uids = $self->{ibx}->mm->msg_range($beg, $end, 'num');
- if (@$uids) {
- $self->msg_more(join('', map { " $_->[0]" } @$uids));
+# Append the date criterion $k (one of SENTON, SENTBEFORE, SENTSINCE,
+# ON, BEFORE, SINCE) for the epoch seconds $d to the Xapian query
+# string in $q->{xap} and, while $q->{sql} (a scalar ref) is still
+# defined, to the SQL condition string it references.
+# SENT* keys use the dt:/d: prefixes and the "ds" column, the others
+# use the ts: prefix and the "ts" column.  Dies on any other $k.
+sub date_search {
+ my ($q, $k, $d) = @_;
+ my $sql = $q->{sql};
+
+ # Date: header
+ if ($k eq 'SENTON') {
+ my $end = $d + 86399; # no leap day...
+ my $da = strftime('%Y%m%d%H%M%S', gmtime($d));
+ my $db = strftime('%Y%m%d%H%M%S', gmtime($end));
+ $q->{xap} .= " dt:$da..$db";
+ $$sql .= " AND ds >= $d AND ds <= $end" if defined($sql);
+ } elsif ($k eq 'SENTBEFORE') {
+ $q->{xap} .= ' d:..'.strftime('%Y%m%d', gmtime($d));
+ $$sql .= " AND ds <= $d" if defined($sql);
+ } elsif ($k eq 'SENTSINCE') {
+ $q->{xap} .= ' d:'.strftime('%Y%m%d', gmtime($d)).'..';
+ $$sql .= " AND ds >= $d" if defined($sql);
+
+ # INTERNALDATE (Received)
+ } elsif ($k eq 'ON') {
+ my $end = $d + 86399; # no leap day...
+ $q->{xap} .= " ts:$d..$end";
+ $$sql .= " AND ts >= $d AND ts <= $end" if defined($sql);
+ } elsif ($k eq 'BEFORE') {
+ $q->{xap} .= " ts:..$d";
+ $$sql .= " AND ts <= $d" if defined($sql);
+ } elsif ($k eq 'SINCE') {
+ $q->{xap} .= " ts:$d..";
+ $$sql .= " AND ts >= $d" if defined($sql);
} else {
- $self->write(\"\r\n$tag OK Search done\r\n");
- undef;
+ die "BUG: $k not recognized";
}
}
+# IMAP to Xapian search key mapping
+# n.b. each value already carries its trailing ':' (TEXT maps to the
+# empty string, i.e. no prefix at all)
+my %I2X = (
+ SUBJECT => 's:',
+ BODY => 'b:',
+ FROM => 'f:',
+ TEXT => '', # n.b. does not include all headers
+ TO => 't:',
+ CC => 'c:',
+ # BCC => 'bcc:', # TODO
+ # KEYWORD # TODO ? dfpre,dfpost,...
+);
+
+# Parse the arguments of an IMAP SEARCH command; @$rest is consumed.
+# On success, returns a hashref which may contain:
+#   xap - Xapian query string, only kept when a criterion needs Xapian
+#   sql - scalar ref to extra SQL conditions (" AND ..."), only kept
+#         when every criterion was a date and at least one was given
+#   uid - a single UID (or sequence number) range as a string
+# On failure, returns a plain string ("BAD ..." or "NO ...") without
+# the tag and without the trailing CRLF.
+sub parse_query {
+	my ($self, $rest) = @_;
+	# "// ''" avoids an uninitialized warning if no criteria were given
+	if (uc($rest->[0] // '') eq 'CHARSET') {
+		shift @$rest;
+		defined(my $c = shift @$rest) or return 'BAD missing charset';
+		$c =~ /\A(?:UTF-8|US-ASCII)\z/ or return 'NO [BADCHARSET]';
+	}
+
+	my $sql = ''; # date conditions, {sql} deleted if Xapian is needed
+	my $q = { xap => '', sql => \$sql };
+	while (@$rest) {
+		my $k = uc(shift @$rest);
+		# default criteria
+		next if $k =~ /\A(?:ALL|RECENT|UNSEEN|NEW)\z/;
+		next if $k eq 'AND'; # the default, until we support OR
+		if ($k =~ $valid_range) { # sequence numbers == UIDs
+			push @{$q->{uid}}, $k;
+		} elsif ($k eq 'UID') {
+			$k = shift(@$rest) // '';
+			$k =~ $valid_range or return 'BAD UID range';
+			push @{$q->{uid}}, $k;
+		} elsif ($k =~ /\A(?:SENT)?(?:SINCE|ON|BEFORE)\z/) {
+			my $d = parse_date(shift(@$rest) // '');
+			defined $d or return "BAD $k date format";
+			date_search($q, $k, $d);
+		} elsif ($k =~ /\A(?:SMALLER|LARGER)\z/) {
+			delete $q->{sql}; # can't use over.sqlite3
+			my $bytes = shift(@$rest) // '';
+			$bytes =~ /\A[0-9]+\z/ or return "BAD $k not a number";
+			$q->{xap} .= ' bytes:' . ($k eq 'SMALLER' ?
+					'..'.(--$bytes) :
+					(++$bytes).'..');
+		} elsif (defined(my $xk = $I2X{$k})) {
+			delete $q->{sql}; # can't use over.sqlite3
+			my $arg = shift @$rest;
+			defined($arg) or return "BAD $k no arg";
+
+			# Xapian can't handle [*"] in probabilistic terms
+			$arg =~ tr/*"//d;
+			# $xk already ends with ':' (or is empty for TEXT),
+			# so do not add another colon here
+			$q->{xap} .= qq[ $xk"$arg"];
+		} else {
+			# TODO: parentheses, OR, NOT ...
+			return "BAD $k not supported (yet?)";
+		}
+	}
+
+	# favor using over.sqlite3 if possible, since Xapian is optional
+	if (exists $q->{sql}) {
+		delete($q->{xap});
+		delete($q->{sql}) if $sql eq '';
+	} elsif (!$self->{ibx}->search) {
+		return 'BAD Xapian not configured for mailbox';
+	}
+
+	if (my $uid = $q->{uid}) {
+		((@$uid > 1) || $uid->[0] =~ /,/) and
+			return 'BAD multiple ranges not supported, yet';
+		($q->{sql} // $q->{xap}) and
+			return 'BAD ranges and queries do not mix, yet';
+		$q->{uid} = join(',', @$uid); # TODO: multiple ranges
+	}
+	$q;
+}
+
sub cmd_uid_search ($$$;) {
- my ($self, $tag, $arg, @rest) = @_;
+ my ($self, $tag) = splice(@_, 0, 2);
my $ibx = $self->{ibx} or return "$tag BAD No mailbox selected\r\n";
- $arg = uc($arg);
- if ($arg eq 'ALL' && !@rest) {
+ my $q = parse_query($self, \@_);
+ return "$tag $q\r\n" if !ref($q);
+ my $sql = delete $q->{sql};
+
+ if (!scalar(keys %$q)) {
$self->msg_more('* SEARCH');
- my $num = 0;
- long_response($self, \&uid_search_all, $tag, \$num);
- } elsif ($arg eq 'UID' && scalar(@rest) == 1) {
- if ($rest[0] =~ /\A([0-9]+):([0-9]+|\*)\z/s) {
+ my $beg = $self->{uid_min} // 1;
+ my $end = $ibx->mm->max;
+ uid_clamp($self, \$beg, \$end);
+ long_response($self, \&uid_search_uid_range,
+ $tag, \$beg, $end, $sql);
+ } elsif (my $uid = $q->{uid}) {
+ if ($uid =~ /\A([0-9]+):([0-9]+|\*)\z/s) {
my ($beg, $end) = ($1, $2);
$end = $ibx->mm->max if $end eq '*';
+ uid_clamp($self, \$beg, \$end);
$self->msg_more('* SEARCH');
long_response($self, \&uid_search_uid_range,
- $tag, \$beg, $end);
- } elsif ($rest[0] =~ /\A[0-9]+\z/s) {
- my $uid = $rest[0];
+ $tag, \$beg, $end, $sql);
+ } elsif ($uid =~ /\A[0-9]+\z/s) {
$uid = $ibx->over->get_art($uid) ? " $uid" : '';
"* SEARCH$uid\r\n$tag OK Search done\r\n";
} else {
# we're read-only, so SELECT and EXAMINE do the same thing
no warnings 'once';
*cmd_select = \&cmd_examine;
+*cmd_fetch = \&cmd_uid_fetch;
1;