use warnings;
use URI::Escape qw/uri_escape_utf8/;
use Date::Parse qw/str2time/;
-use Encode qw/find_encoding/;
use Encode::MIME::Header;
-use Email::MIME::ContentType qw/parse_content_type/;
+use Plack::Util;
use PublicInbox::Hval qw/ascii_html/;
use PublicInbox::Linkify;
use PublicInbox::MID qw/mid_clean id_compress mid2path mid_mime/;
+use PublicInbox::MsgIter;
+use PublicInbox::Address;
require POSIX;
use constant INDENT => ' ';
+use constant TCHILD => '` ';
# th_pfx($level): marker placed in front of a threaded entry -- the empty
# string when $level is 0, otherwise the TCHILD constant.
+sub th_pfx ($) { $_[0] == 0 ? '' : TCHILD };
-my $enc_utf8 = find_encoding('UTF-8');
-
-# public functions:
+# public functions: (unstable)
+# TODO: stream this, since threading is expensive but also oh-so-important
# Render a single message as a complete HTML page.
# Args:
#   $ctx    - request context, handed through to the header/footer helpers
#   $mime   - message object; must provide ->header_obj
#   $footer - optional trailing text; when defined it is emitted after a "\n"
# The removed ("-") body returned the whole page as one concatenated string.
# The added ("+") body returns a Plack::Util::inline_object exposing close()
# and getline(); getline() hands out the page in two chunks, then undef.
sub msg_html {
my ($ctx, $mime, $footer) = @_;
$footer = defined($footer) ? "\n$footer" : '';
my $hdr = $mime->header_obj;
- headers_to_html_header($hdr, $ctx) .
- multipart_text_as_html($mime) .
- '</pre><hr /><pre>' .
- html_footer($hdr, 1, $ctx) .
- $footer .
- '</pre></body></html>';
+ my $n = 0; # number of getline() calls served so far
+ Plack::Util::inline_object(
+ close => sub {}, # noop
+ getline => sub {
+ my $nr = $n++;
+ if ($nr == 0) { # first chunk: page header plus the message text
+ headers_to_html_header($hdr, $ctx) .
+ multipart_text_as_html($mime, '') .
+ '</pre><hr />'
+ } elsif ($nr == 1) { # second chunk: footer, reply help, page end
+ '<pre>' .
+ html_footer($hdr, 1, $ctx) .
+ '</pre>' . msg_reply($ctx, $hdr) .
+ '<hr /><pre>'. $footer .
+ '</pre></body></html>'
+ } else { # third and later calls: nothing left to hand out
+ undef
+ }
+ }
+ )
}
-# /$LISTNAME/$MESSAGE_ID/R/
+# /$INBOX/$MESSAGE_ID/#R
# Build the "how to reply" help text for a message.
# Args: $ctx (request context), $hdr (header object of the message).
# The added ("+") version returns an HTML fragment that opens with
# <hr /><pre id=R> and closes with </pre>, listing three reply methods:
# importing the raw mbox, git send-email with the arguments obtained from
# mailto_arg_link(), and a mailto: link.
# The removed ("-") version took an extra $footer and rendered a standalone
# page that repeated Subject/From/Date/Message-ID. The feed_entry sub that
# followed it is deleted as well.
sub msg_reply {
- my ($ctx, $hdr, $footer) = @_;
- my $s = $hdr->header('Subject');
- $s = '(no subject)' if (!defined $s) || ($s eq '');
- my $f = $hdr->header('From');
- $f = '' unless defined $f;
- my $mid = $hdr->header_raw('Message-ID');
- $mid = PublicInbox::Hval->new_msgid($mid);
- my $t = ascii_html($s);
+ my ($ctx, $hdr) = @_; # NOTE(review): $ctx is not referenced in the lines visible here
my $se_url =
'https://kernel.org/pub/software/scm/git/docs/git-send-email.html';
my ($arg, $link) = mailto_arg_link($hdr); # $arg: arrayref of git send-email arguments, $link: mailto: URL
push @$arg, '/path/to/YOUR_REPLY'; # placeholder for the file holding the reply
- "<html><head><title>replying to \"$t\"</title></head><body><pre>" .
- "replying to message:\n\n" .
- "Subject: <b>$t</b>\n" .
- "From: ". ascii_html($f) .
- "\nDate: " . ascii_html($hdr->header('Date')) .
- "\nMessage-ID: <" . $mid->as_html . ">\n\n" .
- "There are multiple ways to reply:\n\n" .
+ "<hr /><pre\nid=R>".
+ "You may reply publically to <a\nhref=#t>this message</a> via\n".
+ "plain-text email using any one of the following methods:\n\n" .
"* Save the following mbox file, import it into your mail client,\n" .
- " and reply-to-all from there: <a\nhref=../raw>mbox</a>\n\n" .
+ " and reply-to-all from there: <a\nhref=raw>mbox</a>\n\n" .
"* Reply to all the recipients using the <b>--to</b>, <b>--cc</b>,\n" .
" and <b>--in-reply-to</b> switches of git-send-email(1):\n\n" .
"\tgit send-email \\\n\t\t" .
- join(" \\ \n\t\t", @$arg ). "\n\n" .
+ join(" \\\n\t\t", @$arg ). "\n\n" .
qq( <a\nhref="$se_url">$se_url</a>\n\n) .
"* If your mail client supports setting the <b>In-Reply-To</b>" .
" header\n via mailto: links, try the " .
qq(<a\nhref="$link">mailto: link</a>\n) .
- "\nFor context, the original <a\nhref=../>message</a> or " .
- qq(<a\nhref="../t/#u">thread</a>) .
- '</pre><hr /><pre>' . $footer . '</pre></body></html>';
-}
-
-sub feed_entry {
- my ($class, $mime) = @_;
-
- # no <head> here for <style>...
- PublicInbox::Hval::PRE . multipart_text_as_html($mime) . '</pre>';
+ '</pre>';
}
sub in_reply_to {
my $midx = $state->{anchor_idx}++;
my $ctx = $state->{ctx};
my $srch = $ctx->{srch};
- my $part_nr = 0;
my $hdr = $mime->header_obj;
- my $enc = enc_for($hdr->header("Content-Type"));
my $subj = $hdr->header('Subject');
my $mid_raw = mid_clean(mid_mime($mime));
$seen->{$id} = "#$id"; # save the anchor for children, later
my $mid = PublicInbox::Hval->new_msgid($mid_raw);
- my $from = $hdr->header('From');
- my @from = Email::Address->parse($from);
- $from = $from[0]->name;
+ my $from = PublicInbox::Address::from_name($hdr->header('From'));
my $root_anchor = $state->{root_anchor} || '';
my $path = $root_anchor ? '../../' : '';
my $mhref = "${path}$href/";
# scan through all parts, looking for displayable text
- $mime->walk_parts(sub {
- index_walk($fh, $_[0], $enc, \$part_nr);
- });
- $mime->body_set('');
- $rv = "\n" . html_footer($hdr, 0, $ctx, $mhref);
+ msg_iter($mime, sub { index_walk($fh, $mhref, $_[0]) });
+ $rv = "\n" . html_footer($hdr, 0, $ctx, "$path$href/#R");
if (defined $irt) {
unless (defined $parent_anchor) {
} elsif ($srch) {
my $threaded = 'threaded';
my $flat = 'flat';
+ my $end = '';
if ($ctx->{flat}) {
$flat = "<b>$flat</b>";
+ $end = "\n"; # for lynx
} else {
$threaded = "<b>$threaded</b>";
}
$rv .= " [<a\nhref=\"${path}$href/t/#u\">$threaded</a>";
- $rv .= "|<a\nhref=\"${path}$href/T/#u\">$flat</a>]";
+ $rv .= "|<a\nhref=\"${path}$href/T/#u\">$flat</a>]$end";
}
$fh->write($rv .= '</pre>');
}
sub emit_thread_html {
my ($res, $ctx, $foot, $srch) = @_;
my $mid = $ctx->{mid};
- my $msgs = load_results($srch->get_thread($mid));
+ my $flat = $ctx->{flat};
+ my $msgs = load_results($srch->get_thread($mid, { asc => $flat }));
my $nr = scalar @$msgs;
return missing_thread($res, $ctx) if $nr == 0;
- my $flat = $ctx->{flat};
my $seen = {};
my $state = {
res => $res,
('</ul></li>' x ($max - 1)) . '</ul>');
}
}
- Email::Address->purge_cache;
# there could be a race due to a message being deleted in git
# but still being in the Xapian index:
}
# Render one message part and write the result to $fh, unless it is empty.
# Args (added version):
#   $fh   - object providing ->write
#   $upfx - URL prefix handed through to add_text_body
#   $p    - part descriptor handed through to add_text_body
# The removed version carried an encoding object and a part counter instead.
sub index_walk {
- my ($fh, $part, $enc, $part_nr) = @_;
- my $s = add_text_body($enc, $part, $part_nr);
+ my ($fh, $upfx, $p) = @_;
+ my $s = add_text_body($upfx, $p);
return if $s eq ''; # nothing displayable came out of this part
$fh->write($s);
}
-sub enc_for {
- my ($ct, $default) = @_;
- $default ||= $enc_utf8;
- defined $ct or return $default;
- my $ct_parsed = parse_content_type($ct);
- if ($ct_parsed) {
- if (my $charset = $ct_parsed->{attributes}->{charset}) {
- my $enc = find_encoding($charset);
- return $enc if $enc;
- }
- }
- $default;
-}
-
# Concatenate the rendered form of every part of $mime into one string.
# Args (added version): $mime (message object), $upfx (URL prefix handed
# through to add_text_body).
# Returns the accumulated text; each non-empty part is followed by "\n".
# The removed version walked the parts with $mime->walk_parts, tracked a
# per-message encoding and part counter, and blanked the body afterwards.
sub multipart_text_as_html {
- my ($mime) = @_;
+ my ($mime, $upfx) = @_;
my $rv = "";
- my $part_nr = 0;
- my $enc = enc_for($mime->header("Content-Type"));
# scan through all parts, looking for displayable text
- $mime->walk_parts(sub {
- my ($part) = @_;
- $part = add_text_body($enc, $part, \$part_nr);
- $rv .= $part;
- $rv .= "\n" if $part ne '';
+ msg_iter($mime, sub {
+ my ($p) = @_; # descriptor supplied by msg_iter
+ $p = add_text_body($upfx, $p); # $p now holds the rendered text
+ $rv .= $p;
+ $rv .= "\n" if $p ne '';
});
- $mime->body_set('');
$rv;
}
-sub add_filename_line {
- my ($enc, $fn) = @_;
- my $len = 72;
- my $pad = "-";
- $fn = $enc->decode($fn);
- $len -= length($fn);
- $pad x= ($len/2) if ($len > 0);
- "$pad " . ascii_html($fn) . " $pad\n";
-}
-
sub flush_quote {
- my ($s, $l, $quot, $part_nr) = @_;
+ my ($s, $l, $quot) = @_;
# show everything in the full version with anchor from
# short version (see above)
$$s .= qq(<span\nclass="q">) . $rv . '</span>'
}
-sub add_text_body {
- my ($enc_msg, $part, $part_nr) = @_;
- return '' if $part->subparts;
# Build the HTML link that announces an attachment.
# Args:
#   $upfx - URL prefix placed in front of the attachment href
#   $ct   - content type; defaults to text/plain, attributes are dropped
#   $p    - arrayref of [ part, depth, @idx ]
#   $fn   - attachment filename, may be undef
# Returns a string of the form
#   <a href="$upfx$idx-$sfn">[-- Attachment #$idx: $desc --]
#   [-- Type: $ct, Size: $size bytes --]</a>
# The description line is left out when no description or filename exists.
# $ct and $desc come from the message and are HTML-escaped before output;
# the filename only reaches the href when it passes the whitelist regexp.
+sub attach_link ($$$$) {
+ my ($upfx, $ct, $p, $fn) = @_;
+ my ($part, $depth, @idx) = @$p;
+ my $nl = $idx[-1] > 1 ? "\n" : ''; # leading newline for all but the first sibling
+ my $idx = join('.', @idx);
+ my $size = bytes::length($part->body);
+ $ct ||= 'text/plain';
+ $ct =~ s/;.*//; # no attributes
+ $ct = ascii_html($ct);
+ my $desc = $part->header('Content-Description');
+ $desc = $fn unless defined $desc;
+ $desc = '' unless defined $desc;
+ $desc = ascii_html($desc); # header/filename text is untrusted: escape it like $ct
+ my $sfn;
+ if (defined $fn && $fn =~ /\A[[:alnum:]][\w\.-]+[[:alnum:]]\z/) {
+ $sfn = $fn;
+ } elsif ($ct eq 'text/plain') {
+ $sfn = 'a.txt';
+ } else {
+ $sfn = 'a.bin';
+ }
+ my @ret = qq($nl<a\nhref="$upfx$idx-$sfn">[-- Attachment #$idx: );
+ my $ts = "Type: $ct, Size: $size bytes";
+ push(@ret, ($desc eq '') ? "$ts --]" : "$desc --]\n[-- $ts --]");
+ join('', @ret, '</a>');
+}
+sub add_text_body {
+ my ($upfx, $p) = @_; # from msg_iter: [ Email::MIME, depth, @idx ]
+ my ($part, $depth, @idx) = @$p;
my $ct = $part->content_type;
- # account for filter bugs...
+ my $fn = $part->filename;
+
if (defined $ct && $ct =~ m!\btext/x?html\b!i) {
- $part->body_set('');
- return '';
+ return attach_link($upfx, $ct, $p, $fn);
}
- my $enc = enc_for($ct, $enc_msg);
- my $s = $part->body;
- $part->body_set('');
- $s = $enc->decode($s);
+
+ my $s = eval { $part->body_str };
+
+ # badly-encoded message? tell the world about it!
+ return attach_link($upfx, $ct, $p, $fn) if $@;
+
my @lines = split(/^/m, $s);
$s = '';
-
- if ($$part_nr > 0) {
- my $fn = $part->filename;
- defined($fn) or $fn = "part #" . ($$part_nr + 1);
- $s .= add_filename_line($enc, $fn);
+ if (defined($fn) || $depth > 0) {
+ $s .= attach_link($upfx, $ct, $p, $fn);
+ $s .= "\n\n";
}
-
my @quot;
my $l = PublicInbox::Linkify->new;
while (defined(my $cur = shift @lines)) {
if ($cur !~ /^>/) {
# show the previously buffered quote inline
- flush_quote(\$s, $l, \@quot, $$part_nr) if @quot;
+ flush_quote(\$s, $l, \@quot) if @quot;
# regular line, OK
$cur = $l->linkify_1($cur);
}
}
- flush_quote(\$s, $l, \@quot, $$part_nr) if @quot;
- ++$$part_nr;
-
+ flush_quote(\$s, $l, \@quot) if @quot;
$s =~ s/[ \t]+$//sgm; # kill per-line trailing whitespace
$s =~ s/\A\n+//s; # kill leading blank lines
$s =~ s/\s+\z//s; # kill all trailing spaces (final "\n" added if ne '')
$v = PublicInbox::Hval->new($v);
if ($h eq 'From') {
- my @from = Email::Address->parse($v->raw);
- $title[1] = ascii_html($from[0]->name);
+ my $n = PublicInbox::Address::from_name($v->raw);
+ $title[1] = ascii_html($n);
} elsif ($h eq 'Subject') {
$title[0] = $v->as_html;
if ($srch) {
}
sub thread_skel {
- my ($dst, $ctx, $hdr, $upfx) = @_;
+ my ($dst, $ctx, $hdr, $tpfx) = @_;
my $srch = $ctx->{srch};
my $mid = mid_clean($hdr->header_raw('Message-ID'));
my $sres = $srch->get_thread($mid);
my $nr = $sres->{total};
- my $expand = "<a\nhref=\"${upfx}t/#u\">expand</a> " .
- "/ <a\nhref=\"${upfx}t.mbox.gz\">mbox.gz</a>";
+ my $expand = qq(<a\nhref="${tpfx}t/#u">expand</a> ) .
+ qq(/ <a\nhref="${tpfx}t.mbox.gz">mbox.gz</a> ) .
+ qq(/ <a\nhref="${tpfx}t.atom">Atom feed</a>);
my $parent = in_reply_to($hdr);
if ($nr <= 1) {
if (defined $parent) {
$$dst .= "($expand)\n ";
- $$dst .= ghost_parent("$upfx../", $parent) . "\n";
+ $$dst .= ghost_parent("$tpfx../", $parent) . "\n";
} else {
$$dst .= "[no followups, yet] ($expand)\n";
}
prev_level => 0,
};
for (thread_results(load_results($sres))->rootset) {
- skel_dump($dst, $state, $upfx, $_, 0);
+ skel_dump($dst, $state, $tpfx, $_, 0);
}
$ctx->{next_msg} = $state->{next_msg};
$ctx->{parent_msg} = $parent;
foreach my $h (qw(From To Cc)) {
my $v = $hdr->header($h);
defined($v) && ($v ne '') or next;
- my @addrs = Email::Address->parse($v);
- foreach my $recip (@addrs) {
- my $address = $recip->address;
+ my @addrs = PublicInbox::Address::emails($v);
+ foreach my $address (@addrs) {
my $dst = lc($address);
$cc{$dst} ||= $address;
$to ||= $dst;
}
}
- Email::Address->purge_cache;
my @arg;
my $subj = $hdr->header('Subject') || '';
}
# Build the navigation footer shown beneath a message.
# Args:
#   $hdr        - header object of the message
#   $standalone - true when rendering a single-message page; enables the
#                 "index" link and, with a search object, the thread skeleton
#   $ctx        - request context; its {srch} entry is used when present
#   $rhref      - href for the "reply" link, defaults to '#R'
# Returns the string "<parent> <next> <reply>" followed by the index/thread
# section (the value of the final statement).
# thread_skel() fills $ctx->{parent_msg} and $ctx->{next_msg}, which drive the
# parent/next links; missing links are replaced by equally wide blank padding.
sub html_footer {
- my ($hdr, $standalone, $ctx, $mhref) = @_;
+ my ($hdr, $standalone, $ctx, $rhref) = @_;
my $srch = $ctx->{srch} if $ctx; # NOTE(review): perlsyn documents "my ... if COND" as undefined behaviour; a ternary would be safer
my $upfx = '../';
my $tpfx = '';
my $idx = $standalone ? " <a\nhref=\"$upfx\">index</a>" : '';
my $irt = '';
-
- if ($srch && $standalone) {
- $idx .= qq{ / follow: <a\nhref="${tpfx}t.atom">Atom feed</a>\n};
- }
if ($idx && $srch) {
+ $idx .= "\n";
thread_skel(\$idx, $ctx, $hdr, $tpfx);
my $p = $ctx->{parent_msg};
my $next = $ctx->{next_msg};
if ($p) {
$p = PublicInbox::Hval->new_msgid($p);
$p = $p->as_href;
- $irt = "<a\nhref=\"$upfx$p/\">parent</a> ";
+ $irt = "<a\nhref=\"$upfx$p/\"\nrel=prev>parent</a> "; # "\n" separates href from rel, as in the next link
} else {
$irt = ' ' x length('parent ');
}
if ($next) {
- $irt .= "<a\nhref=\"$upfx$next/\">next</a> ";
+ my $n = PublicInbox::Hval->new_msgid($next)->as_href;
+ $irt .= "<a\nhref=\"$upfx$n/\"\nrel=next>next</a> ";
} else {
$irt .= ' ' x length('next ');
}
} else {
$irt = '';
}
-
- $irt . qq(<a\nhref="${tpfx}R/">reply</a>) . $idx;
+ $rhref ||= '#R';
+ $irt .= qq(<a\nhref="$rhref">reply</a>);
+ $irt .= $idx;
}
sub linkify_ref_nosrch {
}
# Thread a list of messages.
# Args: $msgs - arrayref of messages handed to PublicInbox::Thread->new.
# Returns the PublicInbox::Thread object after ->thread has run and the
# result has been ordered with sort_ts.
# The removed lines took $nosubject/$nosort switches and set Mail::Thread
# package variables; the added version always orders the result.
sub thread_results {
- my ($msgs, $nosubject, $nosort) = @_;
+ my ($msgs) = @_;
require PublicInbox::Thread; # loaded on first use rather than at compile time
my $th = PublicInbox::Thread->new(@$msgs);
-
- # WARNING! both these Mail::Thread knobs were found by inspecting
- # the Mail::Thread 2.55 source code, and we have some monkey patches
- # in PublicInbox::Thread to fix memory leaks. Since Mail::Thread
- # appears unmaintained, I suppose it's safe to depend on these
- # variables for now:
- no warnings 'once';
- $Mail::Thread::nosubject = $nosubject;
- # Keep ghosts with only a single direct child:
- $Mail::Thread::noprune = 1;
$th->thread;
- $th->order(*sort_ts) unless $nosort;
+ $th->order(*sort_ts);
$th
}
sub _skel_header {
my ($dst, $state, $upfx, $hdr, $level) = @_;
- my $dot = $level == 0 ? '' : '` ';
my $cur = $state->{cur};
my $mid = mid_clean($hdr->header_raw('Message-ID'));
my $f = ascii_html($hdr->header('X-PI-From'));
my $d = _msg_date($hdr);
- my $pfx = ' ' . $d . ' ' . indent_for($level);
+ my $pfx = "$d " . indent_for($level) . th_pfx($level);
my $attr = $f;
$state->{first_level} ||= $level;
if ($cur) {
if ($cur eq $mid) {
delete $state->{cur};
- $$dst .= "$pfx$dot<b><a\nid=r\nhref=\"#b\">".
+ $$dst .= "$pfx<b><a\nid=r\nhref=\"#t\">".
"$attr [this message]</a></b>\n";
return;
}
my $m = PublicInbox::Hval->new_msgid($mid);
$m = $upfx . '../' . $m->as_href . '/';
- if (defined $s) {
- $$dst .= "$pfx$dot<a\nhref=\"$m\">$s</a> $attr\n";
- } else {
- $$dst .= "$pfx$dot<a\nhref=\"$m\">$f</a>\n";
- }
+ $$dst .= "$pfx<a\nhref=\"$m\">";
+ $$dst .= defined($s) ? "$s</a> $f\n" : "$f</a>\n";
}
sub skel_dump {
if ($mid eq 'subject dummy') {
$$dst .= "\t[no common parent]\n";
} else {
- $$dst .= ' [not found] ';
- my $dot = $level == 0 ? '' : '` ';
- $$dst .= indent_for($level) . $dot;
+ $$dst .= ' [not found] ';
+ $$dst .= indent_for($level) . th_pfx($level);
$mid = PublicInbox::Hval->new_msgid($mid);
my $href = "$upfx../" . $mid->as_href . '/';
my $html = $mid->as_html;
$cur = undef;
}
$cur ||= [ $ts, '' ];
- my $dot = $level == 0 ? '' : '` ';
$cur->[0] = $ts if $ts > $cur->[0];
- $cur->[1] .= "$nl$pfx$dot<a\nhref=\"$mid/t/#u\"><b>";
- $cur->[1] .= $subj;
- $cur->[1] .= "</b></a>\n";
+ $cur->[1] .= $nl . $pfx . th_pfx($level) .
+ "<a\nhref=\"$mid/t/#u\"><b>" .
+ $subj . "</b></a>\n";
$ts = fmt_ts($ts);
my $attr = " $ts UTC";
sub emit_index_topics {
my ($state) = @_;
- my $off = $state->{ctx}->{cgi}->param('o');
- $off = 0 unless defined $off;
+ my ($off) = (($state->{ctx}->{cgi}->param('o') || '0') =~ /(\d+)/);
$state->{order} = [];
$state->{subjs} = {};
$state->{latest} = {};
my $max = 25;
- my %opts = ( offset => int $off, limit => $max * 4 );
+ my %opts = ( offset => $off, limit => $max * 4 );
while (scalar @{$state->{order}} < $max) {
my $sres = $state->{srch}->query('', \%opts);
my $nr = scalar @{$sres->{msgs}} or last;
- for (thread_results(load_results($sres), 1)->rootset) {
+ for (thread_results(load_results($sres))->rootset) {
add_topic($state, $_, 0);
}
$opts{offset} += $nr;