# Copyright (C) 2014-2015 all contributors
# License: AGPLv3 or later (https://www.gnu.org/licenses/agpl-3.0.txt)
#
# represents a header value in various forms. Used for HTML generation
# in our web interface(s)
package PublicInbox::Hval;
use strict;
use warnings;
use Encode qw(find_encoding);
use URI::Escape qw(uri_escape_utf8);
use PublicInbox::MID qw/mid_clean/;
use base qw/Exporter/;
our @EXPORT_OK = qw/ascii_html/;
# for user-generated content (UGC) which may have excessively long lines
# and screw up rendering on some browsers. This is the only CSS style
# feature we use.
# NOTE(review): the value below is an empty string even though the comment
# above describes a CSS rule; presumably the markup was lost somewhere --
# confirm the intended value against the code which emits STYLE.
use constant STYLE => '';
# US-ASCII encoder object, looked up once when this file is loaded;
# ascii_html() encodes its result through it.
my $enc_ascii = find_encoding('us-ascii');
# Constructor.
#   $raw  - header value; trailing whitespace is stripped before storing
#   $href - optional value stored for link generation (stored as given);
#           when undefined, the stripped $raw is stored instead
# Returns a hash-based object blessed into $class with the keys
# "raw" and "href".
sub new {
    my ($class, $raw, $href) = @_;

    # we never care about trailing whitespace
    $raw =~ s/\s*\z//;

    # fall back to the (already stripped) raw value for the link form
    $href = $raw unless defined $href;

    my $self = { raw => $raw, href => $href };
    return bless $self, $class;
}
# Alternate constructor for Message-IDs: the argument is passed through
# mid_clean() and the result is used as both the raw value and the href
# value of the new object.
sub new_msgid {
    my ($class, $msgid) = @_;
    my $cleaned = mid_clean($msgid);
    return $class->new($cleaned, $cleaned);
}
# Alternate constructor for values which must fit on a single line.
#   $raw - header value; undef is treated as the empty string
# Carriage returns are removed and every run of tabs, newlines and
# spaces is collapsed into one space before the value is handed to new().
sub new_oneline {
    my ($class, $raw) = @_;
    $raw = '' unless defined $raw;

    # kill CR first: a CR sitting between whitespace (e.g. " \r\n ")
    # would otherwise split one run in two and leave a doubled space
    $raw =~ tr/\r//d;
    $raw =~ tr/\t\n / /s; # squeeze spaces
    $class->new($raw);
}
# Replacement text for the characters which are special in (X)HTML
# markup. Each value must be a character reference; mapping a character
# to itself would let user-supplied text be interpreted as markup.
my %xhtml_map = (
    '"' => '&#34;',
    '&' => '&#38;',
    "'" => '&#39;',
    '<' => '&lt;',
    '>' => '&gt;',
);
# Returns a copy of the given string prepared for embedding in HTML:
# CRLF pairs become LF, the characters < > & ' " are replaced via
# %xhtml_map, and the result is encoded with the us-ascii encoder using
# Encode::HTMLCREF as the CHECK argument.
# The caller's string is not modified; all work happens on a copy.
sub ascii_html {
    my $html = $_[0];
    $html =~ s/\r\n/\n/sg; # fixup bad line endings
    $html =~ s/([<>&'"])/$xhtml_map{$1}/ge;
    return $enc_ascii->encode($html, Encode::HTMLCREF);
}
# Returns the object's raw value passed through ascii_html().
sub as_html {
    my ($self) = @_;
    return ascii_html($self->{raw});
}
# Returns the object's href value, first passed through
# uri_escape_utf8() and then through ascii_html().
sub as_href {
    my ($self) = @_;
    return ascii_html(uri_escape_utf8($self->{href}));
}
# Combined getter/setter for the raw value.
# With a defined argument the raw value is replaced and the new value is
# returned; without one (or with undef) the current value is returned
# unchanged.
sub raw {
    my ($self, $value) = @_;
    return $self->{raw} unless defined $value;
    return $self->{raw} = $value;
}
# Turns a protocol-relative URL into one with a scheme.
#   $env - hash reference; its 'psgi.url_scheme' entry supplies the scheme
#   $u   - URL string
# When $u begins with "//", the scheme and a colon are prepended;
# any other $u is returned unchanged.
sub prurl {
    my ($env, $u) = @_;
    return $u if index($u, '//') != 0;
    return "$env->{'psgi.url_scheme'}:$u";
}
1;