2 # Copyright (C) 2019-2021 all contributors <meta@public-inbox.org>
3 # License: AGPL-3.0+ <https://www.gnu.org/licenses/agpl-3.0.txt>
5 # Parallel test runner which preloads code and reuses worker processes
6 # to give a nice speedup over prove(1). It also generates per-test
7 # .log files (similar to automake tests).
9 # *.t files run by this should not rely on global state.
11 # Usage: $PERL -I lib -w t/run.perl -j4
12 # Or via prove(1): prove -lvw t/run.perl :: -j4
15 use IO::Handle; # ->autoflush
16 use PublicInbox::TestCommon;
17 use PublicInbox::Spawn;
18 use Getopt::Long qw(:config gnu_getopt no_ignore_case auto_abbrev);
21 use POSIX qw(_POSIX_PIPE_BUF WNOHANG);
# Suffix that replaces a test file's extension to name its per-test log;
# an empty string turns logging off (see the `$log_suffix ne ''` checks).
25 our $log_suffix = '.log';
# %pids is keyed by worker PID (value: job index); @err collects failure
# messages which are eventually reported with an "E: " prefix.
26 my ($shuffle, %pids, @err);
# Options: -j/--jobs=N, --repeat=N, --log=SUFFIX and -s/--shuffle.
# NOTE(review): the usage text below does not mention -s/--shuffle.
27 GetOptions('j|jobs=i' => \$jobs,
28 'repeat=i' => \$repeat,
29 'log=s' => \$log_suffix,
30 's|shuffle' => \$shuffle,
31 ) or die "Usage: $0 [-j JOBS] [--log=SUFFIX] [--repeat RUNS]";
# TEST_RUN_MODE is treated as 2 when unset; an explicit 0 is rejected.
32 if (($ENV{TEST_RUN_MODE} // 2) == 0) {
33 die "$0 is not compatible with TEST_RUN_MODE=0\n";
# Run the tests named on the command line, or every t/*.t otherwise.
35 my @tests = scalar(@ARGV) ? @ARGV : glob('t/*.t');
# Handle on the starting directory, used later to chdir() back to it.
36 open my $cwd_fh, '<', '.' or die "open .: $!";
# Duplicates of the original STDOUT/STDERR for status reporting; the real
# STDOUT/STDERR are reopened onto per-test logs when logging is enabled.
37 open my $OLDOUT, '>&STDOUT' or die "dup STDOUT: $!";
38 open my $OLDERR, '>&STDERR' or die "dup STDERR: $!";
39 $OLDOUT->autoflush(1);
40 $OLDERR->autoflush(1);
42 key2sub($_) for @tests; # precache
# Shared lei daemon for the whole run.  Only attempted when the caller has
# not already exported TEST_LEI_DAEMON_PERSIST_DIR, and when either
# PublicInbox::Spawn provides recv_cmd4 or Socket::MsgHdr can be loaded.
44 my ($for_destroy, $lei_env, $lei_daemon_pid, $owner_pid);
45 if (!$ENV{TEST_LEI_DAEMON_PERSIST_DIR} &&
46 (PublicInbox::Spawn->can('recv_cmd4') ||
47 eval { require Socket::MsgHdr })) {
# A temporary directory serves as XDG_RUNTIME_DIR for lei and is exported
# through TEST_LEI_DAEMON_PERSIST_DIR.
# NOTE(review): $for_destroy presumably keeps the tmpdir alive - confirm.
49 ($lei_env->{XDG_RUNTIME_DIR}, $for_destroy) = tmpdir;
50 $ENV{TEST_LEI_DAEMON_PERSIST_DIR} = $lei_env->{XDG_RUNTIME_DIR};
# Ask lei for the daemon PID (output of fd 1 lands in $lei_daemon_pid),
# insist that it is purely numeric, then probe the process with signal 0.
51 run_script([qw(lei daemon-pid)], $lei_env, { 1 => \$lei_daemon_pid });
52 chomp $lei_daemon_pid;
53 $lei_daemon_pid =~ /\A[0-9]+\z/ or die "no daemon pid: $lei_daemon_pid";
54 kill(0, $lei_daemon_pid) or die "kill $lei_daemon_pid: $!";
# Optional debugging aids, both run in the background through the shell:
# GNU_TAIL follows the daemon's errors.log onto stderr (--pid ties tail's
# lifetime to the daemon), STRACE_CMD attaches a tracer to the daemon.
# NOTE(review): both environment values are interpolated into a shell
# command line unquoted; they must come from a trusted developer.
55 if (my $t = $ENV{GNU_TAIL}) {
56 system("$t --pid=$lei_daemon_pid -F " .
57 "$lei_env->{XDG_RUNTIME_DIR}/lei/errors.log >&2 &");
59 if (my $strace_cmd = $ENV{STRACE_CMD}) {
60 system("$strace_cmd -p $lei_daemon_pid &");
# Only taken when a readable .prove file exists and YAML::XS can be loaded.
67 } elsif (open(my $prove_state, '<', '.prove') && eval { require YAML::XS }) {
68 # reuse "prove --state=save" data to start the slowest tests first
# Slurp the whole state file and parse it as YAML.
69 my $state = YAML::XS::Load(do { local $/; <$prove_state> });
70 my $t = $state->{tests};
# Descending comparison on the recorded elapsed time; tests with no
# recorded time compare as 0.
# NOTE(review): presumably the comparator of a sort over @tests - confirm.
72 ($t->{$b}->{elapsed} // 0) <=> ($t->{$a}->{elapsed} // 0)
# Builder behind Test::More; its pass/fail state decides the reported
# status and its output handles are pointed at the per-test log.
76 our $tb = Test::More->builder;
# $worker is compared against $$ in the END block so that only the worker
# process itself reports; $worker_test names the test currently running
# (undef when none is in progress).
83 our ($worker, $worker_test);
# Status report for the test that just finished (test_status(), which is
# also invoked from the END block below).
# A zero exit status is still a failure if the builder is not passing.
86 $? = 255 if $? == 0 && !$tb->is_passing;
87 my $status = $? ? 'not ok' : 'ok';
# Return to the starting directory before using the relative log path.
88 chdir($cwd_fh) or DIE "fchdir: $!";
89 if ($log_suffix ne '') {
# NOTE(review): only a ".t" extension is rewritten here, whereas the log is
# created with s/\.[^\.]+\z/.../ (any extension); for a test not ending in
# ".t" the two paths differ - confirm whether that is intended.
90 my $log = $worker_test;
91 $log =~ s/\.t\z/$log_suffix/;
93 if (open my $fh, '<', $log) {
# Keep every log line which is neither an "ok " line nor a comment or
# diagnostic, then drop a trailing plan line ("N..M") if it is last.
94 my @not_ok = grep(!/^(?:ok |[ \t]*#)/ms, <$fh>);
95 my $last = $not_ok[-1] // '';
96 pop @not_ok if $last =~ /^[0-9]+\.\.[0-9]+$/;
# Echo what is left to the original stderr, then rewind for a second pass.
98 print $OLDERR map { $pfx.$_ } @not_ok;
99 seek($fh, 0, SEEK_SET) or die "seek: $!";
101 # show unique skip texts and the number of times
102 # each text was skipped
# NOTE(review): the /mgs match needs the whole log in one string, so this
# presumably relies on $/ being undefined at this point - confirm.
104 my @sk = (<$fh> =~ m/^ok [0-9]+ (# skip [^\n]+)/mgs);
# This @err is a new lexical (the unique skip texts in first-seen order);
# it shadows, and does not modify, the file-level @err.
107 my @err = grep { !$nr{$_}++ } @sk;
108 print $OLDERR "$pfx$_ ($nr{$_})\n" for @err;
109 $skip = ' # total skipped: '.scalar(@sk);
112 print $OLDERR "could not open: $log: $!\n";
# One TAP-style result line per test file on the original stdout.
114 print $OLDOUT "$status $worker_test$skip\n";
118 # Test::Builder or Test2::Hub may call exit() from plan(skip_all => ...)
# so report from END too, but only in the worker and only mid-test.
119 END { test_status() if (defined($worker_test) && $worker == $$) }
# Per-test setup for $test: when logging is enabled, send the builder's
# output and this process's STDOUT/STDERR to the per-test log file.
124 if ($log_suffix ne '') {
# Swap whatever extension the test has for $log_suffix; a name without
# any extension cannot be logged and is fatal.
# NOTE(review): the status reporter derives the same path with
# s/\.t\z/.../ only - confirm the two stay in agreement.
126 $log =~ s/\.[^\.]+\z/$log_suffix/ or DIE "can't log for $test";
127 open $log_fh, '>', $log or DIE "open $log: $!";
128 $log_fh->autoflush(1);
# Normal, failure and TODO output of the builder all go to the log.
129 $tb->output($log_fh);
130 $tb->failure_output($log_fh);
131 $tb->todo_output($log_fh);
# Output written directly to fd 1 / fd 2 is captured in the same log.
132 open STDOUT, '>&', $log_fh or DIE "1>$log: $!";
133 open STDERR, '>&', $log_fh or DIE "2>$log: $!";
# Mark the test as in progress so the END block can report it if the
# test exits early; cleared again once the test is done.
135 $worker_test = $test;
138 $worker_test = undef;
# Remember failing tests (with their $? value) for the final "E: " report.
139 push @err, "$test ($?)" if $?;
# Size in bytes of one queue entry, as read back with sysread() below.
# NOTE(review): entries are written with pack('I', ...), whose width is the
# platform's native unsigned int (at least 32 bits); 4 is assumed here.
142 sub UINT_SIZE () { 4 }
144 # worker processes will SIGUSR1 the producer process when they
145 # see EOF on the pipe. On FreeBSD 11.2 and Perl 5.30.0,
146 # sys/ioctl.ph gives the wrong value for FIONREAD().
148 my $eof; # we stop respawning if true
# Fork one worker.  Arguments: $j is the job index, $rd/$wr are the two
# ends of the queue pipe, $todo is an array ref of test names which the
# queued integers index into.
150 my $start_worker = sub {
151 my ($j, $rd, $wr, $todo) = @_;
152 my $pid = fork // DIE "fork: $!";
# Each read takes exactly one fixed-size index off the shared pipe.
157 my $r = sysread($rd, my $buf, UINT_SIZE);
163 DIE "short read $r" if $r != UINT_SIZE;
164 my $t = unpack('I', $buf);
165 run_test($todo->[$t]);
168 kill 'USR1', $producer if !$eof; # sets $eof in $producer
# A worker that recorded any failure exits through DIE with the list.
169 DIE join('', map { "E: $_\n" } @err) if @err;
176 # negative $repeat means loop forever:
177 for (my $i = $repeat; $i != 0; $i--) {
# Each pass gets its own ordering of the tests when --shuffle is given.
178 my @todo = $shuffle ? List::Util::shuffle(@tests) : @tests;
180 # single-producer, multi-consumer queue relying on POSIX pipe semantics
181 # POSIX.1-2008 stipulates a regular file should work, but Linux <3.14
182 # had broken read(2) semantics according to the read(2) manpage
183 pipe(my ($rd, $wr)) or DIE "pipe: $!";
185 # fill the queue before forking so children can start earlier
# Queue entries are indices into @todo, packed as native unsigned ints;
# $n is how many UINT_SIZE entries fit in _POSIX_PIPE_BUF bytes.
186 my $n = (_POSIX_PIPE_BUF / UINT_SIZE);
188 print $wr join('', map { pack('I', $_) } (0..$#todo)) or DIE;
190 } else { # write what we can...
# NOTE(review): 0..$n is $n + 1 entries, i.e. UINT_SIZE bytes more than
# _POSIX_PIPE_BUF - confirm the extra entry is intended.
192 print $wr join('', map { pack('I', $_) } (0..$n)) or DIE;
193 $n += 1; # and send more ($n..$#todo), later
# Workers signal USR1 on queue EOF; per the $eof declaration, a true $eof
# stops further respawning.
196 local $SIG{USR1} = sub { $eof = 1 };
# Reaper: a true $sig selects a non-blocking waitpid, a false one (as in
# the `$sigchld->(0)` call below) blocks until a child exits.
199 my $flags = $sig ? WNOHANG : 0;
201 my $pid = waitpid(-1, $flags) or return;
# Map the reaped PID back to its job index, forgetting the PID.
203 my $j = delete $pids{$pid};
205 push @err, "reaped unknown $pid ($?)";
208 push @err, "job[$j] ($?)" if $?;
209 # skip_all can exit(0), respawn if needed:
211 print $OLDERR "# respawning job[$j]\n";
212 $start_worker->($j, $rd, $wr, \@todo);
217 # start the workers to consume the queue
218 for (my $j = 0; $j < $jobs; $j++) {
219 $start_worker->($j, $rd, $wr, \@todo);
222 local $SIG{CHLD} = $sigchld;
223 # too many tests to fit in the pipe before starting workers,
224 # send the rest now that the workers are running
225 print $wr join('', map { pack('I', $_) } ($n..$#todo)) or DIE;
# Block until every tracked worker is reaped, then fail the whole run if
# anything was recorded in @err.
229 $sigchld->(0) while scalar(keys(%pids));
230 DIE join('', map { "E: $_\n" } @err) if @err;
# TAP plan covering every run of every test; omitted when $repeat is
# negative.
233 print $OLDOUT "1..".($repeat * scalar(@tests))."\n" if $repeat >= 0;
# Only the process whose PID matches $owner_pid stops the lei daemon that
# was set up for this run; its output goes to the original stdout/stderr.
234 if ($lei_env && $$ == $owner_pid) {
235 my $opt = { 1 => $OLDOUT, 2 => $OLDERR };
236 run_script([qw(lei daemon-kill)], $lei_env, $opt);