X-Git-Url: http://www.git.stargrave.org/?a=blobdiff_plain;f=lib%2FPublicInbox%2FHTTP.pm;h=e65988bedf06fe2c5236e333bd7fc075021168b4;hb=c410bf707fb77b15698e14119dbf6e14e43479ba;hp=d0708c5be4caf0a31740d5b23266ca32cf0bd3d7;hpb=af0b0fb7a454470a32c452119d0392e0dedb3fe1;p=public-inbox.git diff --git a/lib/PublicInbox/HTTP.pm b/lib/PublicInbox/HTTP.pm index d0708c5b..e65988be 100644 --- a/lib/PublicInbox/HTTP.pm +++ b/lib/PublicInbox/HTTP.pm @@ -21,13 +21,11 @@ package PublicInbox::HTTP; use strict; use parent qw(PublicInbox::DS); -use bytes (); # only for bytes::length use Fcntl qw(:seek); use Plack::HTTPParser qw(parse_http_request); # XS or pure Perl use Plack::Util; use HTTP::Status qw(status_message); use HTTP::Date qw(time2str); -use IO::Handle; # ->write use PublicInbox::DS qw(msg_more); use PublicInbox::Syscall qw(EPOLLIN EPOLLONESHOT); use PublicInbox::Tmpfile; @@ -39,16 +37,6 @@ use constant { }; use Errno qw(EAGAIN); -my $pipelineq = []; -sub process_pipelineq () { - my $q = $pipelineq; - $pipelineq = []; - foreach (@$q) { - next unless $_->{sock}; - rbuf_process($_); - } -} - # Use the same configuration parameter as git since this is primarily # a slow-client sponge for git-http-backend # TODO: support per-respository http.maxRequestBuffer somehow... @@ -88,45 +76,29 @@ sub event_step { # called by PublicInbox::DS # otherwise we can be buffering infinitely w/o backpressure return read_input($self) if ref($self->{env}); - my $rbuf = $self->{rbuf} // (\(my $x = '')); - $self->do_read($rbuf, 8192, bytes::length($$rbuf)) or return; - rbuf_process($self, $rbuf); -} - -sub rbuf_process { - my ($self, $rbuf) = @_; - $rbuf //= $self->{rbuf} // (\(my $x = '')); + my $rbuf = $self->{rbuf} // (\(my $x = '')); my %env = %{$self->{httpd}->{env}}; # full hash copy - my $r = parse_http_request($$rbuf, \%env); - - # We do not support Trailers in chunked requests, for now - # (they are rarely-used and git (as of 2.7.2) does not use them) - if ($r == -1 || $env{HTTP_TRAILER} || - # this length-check is necessary for PURE_PERL=1: - ($r == -2 && bytes::length($$rbuf) > 0x4000)) { - return quit($self, 400); - } - if ($r < 0) { # incomplete - $self->rbuf_idle($rbuf); - return $self->requeue; + my $r; + while (($r = parse_http_request($$rbuf, \%env)) < 0) { + # We do not support Trailers in chunked requests, for + # now (they are rarely-used and git (as of 2.7.2) does + # not use them). + # this length-check is necessary for PURE_PERL=1: + if ($r == -1 || $env{HTTP_TRAILER} || + ($r == -2 && length($$rbuf) > 0x4000)) { + return quit($self, 400); + } + $self->do_read($rbuf, 8192, length($$rbuf)) or return; } + return quit($self, 400) if grep(/\s/, keys %env); # stop smugglers $$rbuf = substr($$rbuf, $r); - my $len = input_prepare($self, \%env); - defined $len or return write_err($self, undef); # EMFILE/ENFILE + my $len = input_prepare($self, \%env) // + return write_err($self, undef); # EMFILE/ENFILE $len ? read_input($self, $rbuf) : app_dispatch($self, undef, $rbuf); } -# IO::Handle::write returns boolean, this returns bytes written: -sub xwrite ($$$) { - my ($fh, $rbuf, $max) = @_; - my $w = bytes::length($$rbuf); - $w = $max if $w > $max; - $fh->write($$rbuf, $w) or return; - $w; -} - sub read_input ($;$) { my ($self, $rbuf) = @_; $rbuf //= $self->{rbuf} // (\(my $x = '')); @@ -139,7 +111,7 @@ sub read_input ($;$) { while ($len > 0) { if ($$rbuf ne '') { - my $w = xwrite($input, $rbuf, $len); + my $w = syswrite($input, $$rbuf, $len); return write_err($self, $len) unless $w; $len -= $w; die "BUG: $len < 0 (w=$w)" if $len < 0; @@ -182,7 +154,7 @@ sub app_dispatch { } }; if ($@) { - err($self, "response_write error: $@"); + warn "response_write error: $@"; $self->close; } } @@ -236,7 +208,7 @@ sub response_header_write { sub chunked_write ($$) { my $self = $_[0]; return if $_[1] eq ''; - msg_more($self, sprintf("%x\r\n", bytes::length($_[1]))); + msg_more($self, sprintf("%x\r\n", length($_[1]))); msg_more($self, $_[1]); # use $self->write(\"\n\n") if you care about real-time @@ -249,22 +221,11 @@ sub identity_write ($$) { $self->write(\($_[1])) if $_[1] ne ''; } -sub next_request ($) { - my ($self) = @_; - if ($self->{rbuf}) { - # avoid recursion for pipelined requests - PublicInbox::DS::requeue(\&process_pipelineq) if !@$pipelineq; - push @$pipelineq, $self; - } else { # wait for next request - $self->requeue; - } -} - sub response_done { my ($self, $alive) = @_; delete $self->{env}; # we're no longer busy $self->write(\"0\r\n\r\n") if $alive == 2; - $self->write($alive ? \&next_request : \&close); + $self->write($alive ? $self->can('requeue') : \&close); } sub getline_pull { @@ -274,7 +235,7 @@ sub getline_pull { # limit our own running time for fairness with other # clients and to avoid buffering too much: my $buf = eval { - local $/ = \8192; + local $/ = \65536; $forward->getline; } if $forward; @@ -296,14 +257,14 @@ sub getline_pull { return; # likely } } elsif ($@) { - err($self, "response ->getline error: $@"); + warn "response ->getline error: $@"; $self->close; } # avoid recursion if (delete $self->{forward}) { eval { $forward->close }; if ($@) { - err($self, "response ->close error: $@"); + warn "response ->close error: $@"; $self->close; # idempotent } } @@ -334,12 +295,6 @@ sub response_write { } } -sub input_tmpfile ($) { - my $input = tmpfile('http.input', $_[0]->{sock}) or return; - $input->autoflush(1); - $input; -} - sub input_prepare { my ($self, $env) = @_; my ($input, $len); @@ -355,39 +310,33 @@ sub input_prepare { return quit($self, 400) if $hte !~ /\Achunked\z/i; $len = CHUNK_START; - $input = input_tmpfile($self); + $input = tmpfile('http.input', $self->{sock}); } else { $len = $env->{CONTENT_LENGTH}; if (defined $len) { # rfc7230 3.3.3.4 return quit($self, 400) if $len !~ /\A[0-9]+\z/; - return quit($self, 413) if $len > $MAX_REQUEST_BUFFER; - $input = $len ? input_tmpfile($self) : $null_io; + $input = $len ? tmpfile('http.input', $self->{sock}) + : $null_io; } else { $input = $null_io; } } # TODO: expire idle clients on ENFILE / EMFILE - return unless $input; - - $env->{'psgi.input'} = $input; + $env->{'psgi.input'} = $input // return; $self->{env} = $env; $self->{input_left} = $len || 0; } sub env_chunked { ($_[0]->{HTTP_TRANSFER_ENCODING} // '') =~ /\Achunked\z/i } -sub err ($$) { - eval { $_[0]->{httpd}->{env}->{'psgi.errors'}->print($_[1]."\n") }; -} - sub write_err { my ($self, $len) = @_; my $msg = $! || '(zero write)'; $msg .= " ($len bytes remaining)" if defined $len; - err($self, "error buffering to input: $msg"); + warn "error buffering to input: $msg"; quit($self, 500); } @@ -396,7 +345,7 @@ sub recv_err { if ($! == EAGAIN) { # epoll/kevent watch already set by do_read $self->{input_left} = $len; } else { - err($self, "error reading input: $! ($len bytes remaining)"); + warn "error reading input: $! ($len bytes remaining)"; } } @@ -411,12 +360,12 @@ sub read_input_chunked { # unlikely... $$rbuf =~ s/\A\r\n//s and return app_dispatch($self, $input, $rbuf); - return quit($self, 400) if bytes::length($$rbuf) > 2; + return quit($self, 400) if length($$rbuf) > 2; } if ($len == CHUNK_END) { if ($$rbuf =~ s/\A\r\n//s) { $len = CHUNK_START; - } elsif (bytes::length($$rbuf) > 2) { + } elsif (length($$rbuf) > 2) { return quit($self, 400); } } @@ -426,14 +375,14 @@ sub read_input_chunked { # unlikely... if (($len + -s $input) > $MAX_REQUEST_BUFFER) { return quit($self, 413); } - } elsif (bytes::length($$rbuf) > CHUNK_MAX_HDR) { + } elsif (length($$rbuf) > CHUNK_MAX_HDR) { return quit($self, 400); } # will break from loop since $len >= 0 } if ($len < 0) { # chunk header is trickled, read more - $self->do_read($rbuf, 8192, bytes::length($$rbuf)) or + $self->do_read($rbuf, 8192, length($$rbuf)) or return recv_err($self, $len); # (implicit) goto chunk_start if $r > 0; } @@ -442,7 +391,7 @@ sub read_input_chunked { # unlikely... # drain the current chunk until ($len <= 0) { if ($$rbuf ne '') { - my $w = xwrite($input, $rbuf, $len); + my $w = syswrite($input, $$rbuf, $len); return write_err($self, "$len chunk") if !$w; $len -= $w; if ($len == 0) { @@ -477,15 +426,14 @@ sub close { my $self = $_[0]; if (my $forward = delete $self->{forward}) { eval { $forward->close }; - err($self, "forward ->close error: $@") if $@; + warn "forward ->close error: $@" if $@; } $self->SUPER::close; # PublicInbox::DS::close } -# for graceful shutdown in PublicInbox::Daemon: -sub busy () { +sub busy { # for graceful shutdown in PublicInbox::Daemon: my ($self) = @_; - ($self->{rbuf} || exists($self->{env}) || $self->{wbuf}); + defined($self->{rbuf}) || exists($self->{env}) || defined($self->{wbuf}) } # runs $cb on the next iteration of the event loop at earliest