X-Git-Url: http://www.git.stargrave.org/?a=blobdiff_plain;f=lib%2FPublicInbox%2FLeiInspect.pm;h=ab2c98d99228b2af7851199ffb6eca501d2ab5e0;hb=0c385e6500f26babc47a0768b730ea38e290a5f5;hp=46b9197f0c4b5c86a4fcba5081781bd6f99ecc82;hpb=172d2d126cb9c0fa78b41a01f285f9294cc78f15;p=public-inbox.git diff --git a/lib/PublicInbox/LeiInspect.pm b/lib/PublicInbox/LeiInspect.pm index 46b9197f..ab2c98d9 100644 --- a/lib/PublicInbox/LeiInspect.pm +++ b/lib/PublicInbox/LeiInspect.pm @@ -8,27 +8,62 @@ package PublicInbox::LeiInspect; use strict; use v5.10.1; +use parent qw(PublicInbox::IPC); use PublicInbox::Config; +use PublicInbox::MID qw(mids); +use PublicInbox::NetReader qw(imap_uri nntp_uri); sub inspect_blob ($$) { my ($lei, $oidhex) = @_; my $ent = {}; if (my $lse = $lei->{lse}) { - my @docids = $lse ? $lse->over->blob_exists($oidhex) : (); + my $oidbin = pack('H*', $oidhex); + my @docids = $lse ? $lse->over->oidbin_exists($oidbin) : (); $ent->{'lei/store'} = \@docids if @docids; - my $lms = $lse->lms; - if (my $loc = $lms ? $lms->locations_for($oidhex) : undef) { + my $lms = $lei->lms; + if (my $loc = $lms ? $lms->locations_for($oidbin) : undef) { $ent->{'mail-sync'} = $loc; } } $ent; } +sub inspect_imap_uid ($$) { + my ($lei, $uid_uri) = @_; + my $ent = {}; + my $lms = $lei->lms or return $ent; + my $oidhex = $lms->imap_oid($lei, $uid_uri); + if (ref(my $err = $oidhex)) { # arg2folder error + $lei->qerr(@{$err->{qerr}}) if $err->{qerr}; + } + $ent->{$$uid_uri} = $oidhex; + $ent; +} + +sub inspect_nntp_range { + my ($lei, $uri) = @_; + my ($ng, $beg, $end) = $uri->group; + $uri = $uri->clone; + $uri->group($ng); + my $ent = {}; + my $ret = { "$uri" => $ent }; + my $lms = $lei->lms or return $ret; + my $err = $lms->arg2folder($lei, my $folders = [ $$uri ]); + if ($err) { + $lei->qerr(@{$err->{qerr}}) if $err->{qerr}; + } + $end //= $beg; + for my $art ($beg..$end) { + my $oidbin = $lms->imap_oidbin($folders->[0], $art); + $ent->{$art} = $oidbin ? unpack('H*', $oidbin) : undef; + } + $ret; +} + sub inspect_sync_folder ($$) { my ($lei, $folder) = @_; my $ent = {}; - my $lse = $lei->{lse} or return $ent; - my $lms = $lse->lms or return $ent; + my $lms = $lei->lms or return $ent; my $folders = [ $folder ]; my $err = $lms->arg2folder($lei, $folders); if ($err) { @@ -44,14 +79,134 @@ sub inspect_sync_folder ($$) { $ent } +sub inspect_docid ($$;$) { + my ($lei, $docid, $ent) = @_; + require PublicInbox::Search; + $ent //= {}; + my $xdb; + if ($xdb = delete $ent->{xdb}) { # from inspect_num + } elsif (defined(my $dir = $lei->{opt}->{dir})) { + no warnings 'once'; + $xdb = $PublicInbox::Search::X{Database}->new($dir); + } else { + $xdb = $lei->{lse}->xdb; + } + $xdb or return $lei->fail('no Xapian DB'); + my $doc = $xdb->get_document($docid); # raises + my $data = $doc->get_data; + $ent->{docid} = $docid; + $ent->{data_length} = length($data); + $ent->{description} = $doc->get_description; + $ent->{$_} = $doc->$_ for (qw(termlist_count values_count)); + my $cur = $doc->termlist_begin; + my $end = $doc->termlist_end; + for (; $cur != $end; $cur++) { + my $tn = $cur->get_termname; + $tn =~ s/\A([A-Z]+)// or warn "$tn no prefix! (???)"; + my $term = ($1 // ''); + push @{$ent->{terms}->{$term}}, $tn; + } + @$_ = sort(@$_) for values %{$ent->{terms} // {}}; + $cur = $doc->values_begin; + $end = $doc->values_end; + for (; $cur != $end; $cur++) { + my $n = $cur->get_valueno; + my $v = $cur->get_value; + my $iv = PublicInbox::Search::sortable_unserialise($v); + $v = $iv + 0 if defined $iv; + # not using ->[$n] since we may have large gaps in $n + $ent->{'values'}->{$n} = $v; + } + $ent; +} + +sub dir2ibx ($$) { + my ($lei, $dir) = @_; + if (-f "$dir/ei.lock") { + require PublicInbox::ExtSearch; + PublicInbox::ExtSearch->new($dir); + } elsif (-f "$dir/inbox.lock" || -d "$dir/public-inbox") { + require PublicInbox::Inbox; # v2, v1 + bless { inboxdir => $dir }, 'PublicInbox::Inbox'; + } else { + $lei->fail("no (indexed) inbox or extindex at $dir"); + } +} + +sub inspect_num ($$) { + my ($lei, $num) = @_; + my ($docid, $ibx); + my $ent = { num => $num }; + if (defined(my $dir = $lei->{opt}->{dir})) { + $ibx = dir2ibx($lei, $dir) or return; + if ($ent->{xdb} = $ibx->xdb) { + my $num2docid = $lei->{lse}->can('num2docid'); + $docid = $num2docid->($ibx, $num); + } + } else { + $ibx = $lei->{lse}; + $lei->{lse}->xdb; # set {nshard} for num2docid + $docid = $lei->{lse}->num2docid($num); + } + if ($ibx && $ibx->over) { + my $smsg = $ibx->over->get_art($num); + $ent->{smsg} = { %$smsg } if $smsg; + } + defined($docid) ? inspect_docid($lei, $docid, $ent) : $ent; +} + +sub inspect_mid ($$) { + my ($lei, $mid) = @_; + my ($ibx, $over); + my $ent = { mid => $mid }; + if (defined(my $dir = $lei->{opt}->{dir})) { + my $num2docid = $lei->{lse}->can('num mid => [ $mid ] 2docid'); + $ibx = dir2ibx($lei, $dir) or return; + # $ent->{xdb} = $ibx->xdb // + # return $lei->fail("no Xapian DB for $dir"); + } else { + $ibx = $lei->{lse}; + $lei->{lse}->xdb; # set {nshard} for num2docid + } + if ($ibx && $ibx->over) { + my ($id, $prev); + while (my $smsg = $ibx->over->next_by_mid($mid, \$id, \$prev)) { + push @{$ent->{smsg}}, { %$smsg } + } + } + $ent; +} + sub inspect1 ($$$) { my ($lei, $item, $more) = @_; my $ent; if ($item =~ /\Ablob:(.+)/) { $ent = inspect_blob($lei, $1); - } elsif ($item =~ m!\Aimaps?://!i || - $item =~ m!\A(?:maildir|mh):!i || -d $item) { + } elsif ($item =~ m!\A(?:maildir|mh):!i || -d $item) { $ent = inspect_sync_folder($lei, $item); + } elsif ($item =~ m!\Adocid:([0-9]+)\z!) { + $ent = inspect_docid($lei, $1 + 0); + } elsif ($item =~ m!\Anum:([0-9]+)\z!) { + $ent = inspect_num($lei, $1 + 0); + } elsif ($item =~ m!\A(?:mid|m):(.+)\z!) { + $ent = inspect_mid($lei, $1); + } elsif (my $iuri = imap_uri($item)) { + if (defined($iuri->uid)) { + $ent = inspect_imap_uid($lei, $iuri); + } else { + $ent = inspect_sync_folder($lei, $item); + } + } elsif (my $nuri = nntp_uri($item)) { + if (defined(my $mid = $nuri->message)) { + $ent = inspect_mid($lei, $mid); + } else { + my ($group, $beg, $end) = $nuri->group; + if (defined($beg)) { + $ent = inspect_nntp_range($lei, $nuri); + } else { + $ent = inspect_sync_folder($lei, $item); + } + } } else { # TODO: more things return $lei->fail("$item not understood"); } @@ -60,23 +215,71 @@ sub inspect1 ($$$) { 1; } -sub lei_inspect { - my ($lei, @argv) = @_; +sub inspect_argv { # via wq_do + my ($self) = @_; + my ($lei, $argv) = delete @$self{qw(lei argv)}; + my $multi = scalar(@$argv) > 1; $lei->{1}->autoflush(0); - my $multi = scalar(@argv) > 1; $lei->out('[') if $multi; + while (defined(my $x = shift @$argv)) { + inspect1($lei, $x, scalar(@$argv)) or return; + } + $lei->out(']') if $multi; +} + +sub inspect_start ($$) { + my ($lei, $argv) = @_; + my $self = bless { lei => $lei, argv => $argv }, __PACKAGE__; + my ($op_c, $ops) = $lei->workers_start($self, 1); + $lei->{wq1} = $self; + $lei->wait_wq_events($op_c, $ops); + $self->wq_do('inspect_argv'); + $self->wq_close(1); +} + +sub ins_add { # InputPipe->consume callback + my ($lei) = @_; # $_[1] = $rbuf + if (defined $_[1]) { + $_[1] eq '' and return eval { + my $str = delete $lei->{istr}; + $str =~ s/\A[\r\n]*From [^\r\n]*\r?\n//s; + my $eml = PublicInbox::Eml->new(\$str); + inspect_start($lei, [ + 'blob:'.$lei->git_oid($eml)->hexdigest, + map { "mid:$_" } @{mids($eml)} ]); + }; + $lei->{istr} .= $_[1]; + } else { + $lei->fail("error reading stdin: $!"); + } +} + +sub lei_inspect { + my ($lei, @argv) = @_; $lei->{json} = ref(PublicInbox::Config::json())->new->utf8->canonical; $lei->{lse} = ($lei->{opt}->{external} // 1) ? do { my $sto = $lei->_lei_store; $sto ? $sto->search : undef; } : undef; - if ($lei->{opt}->{pretty} || -t $lei->{1}) { - $lei->{json}->pretty(1)->indent(2); - } - while (defined(my $x = shift @argv)) { - inspect1($lei, $x, scalar(@argv)) or return; + my $isatty = -t $lei->{1}; + $lei->{json}->pretty(1)->indent(2) if $lei->{opt}->{pretty} || $isatty; + $lei->start_pager if $isatty; + if ($lei->{opt}->{stdin}) { + return $lei->fail(<<'') if @argv; +no args allowed on command-line with --stdin + + require PublicInbox::InputPipe; + PublicInbox::InputPipe::consume($lei->{0}, \&ins_add, $lei); + } else { + inspect_start($lei, \@argv); } - $lei->out(']') if $multi; +} + +sub _complete_inspect { + my ($lei, @argv) = @_; + my $lms = $lei->lms or return; + my $match_cb = $lei->complete_url_prepare(\@argv); + map { $match_cb->($_) } $lms->folders; } 1;