git-commit-vandalism/t/chainlint.pl

#!/usr/bin/env perl
#
# Copyright (c) 2021-2022 Eric Sunshine <sunshine@sunshineco.com>
#
# This tool scans shell scripts for test definitions and checks those tests for
# problems, such as broken &&-chains, which might hide bugs in the tests
# themselves or in behaviors being exercised by the tests.
#
# Input arguments are pathnames of shell scripts containing test definitions,
# or globs referencing a collection of scripts. For each problem discovered,
# the pathname of the script containing the test is printed along with the test
# name and the test body with a `?!FOO?!` annotation at the location of each
# detected problem, where "FOO" is a tag such as "AMP" which indicates a broken
# &&-chain. Returns zero if no problems are discovered, otherwise non-zero.

use warnings;
use strict;
use File::Glob;
use Getopt::Long;

my $show_stats;
my $emit_all;

# Lexer tokenizes POSIX shell scripts. It is roughly modeled after section 2.3
# "Token Recognition" of POSIX chapter 2 "Shell Command Language". Although
# similar to lexical analyzers for other languages, this one differs in a few
# substantial ways due to quirks of the shell command language.
#
# For instance, in many languages, newline is just whitespace like space or
# TAB, but in shell a newline is a command separator, thus a distinct lexical
# token. A newline is significant and returned as a distinct token even at the
# end of a shell comment.
#
# In other languages, `1+2` would typically be scanned as three tokens
# (`1`, `+`, and `2`), but in shell it is a single token. However, the similar
# `1 + 2`, which embeds whitepace, is scanned as three token in shell, as well.
# In shell, several characters with special meaning lose that meaning when not
# surrounded by whitespace. For instance, the negation operator `!` is special
# when standing alone surrounded by whitespace; whereas in `foo!uucp` it is
# just a plain character in the longer token "foo!uucp". In many other
# languages, `"string"/foo:'string'` might be scanned as five tokens ("string",
# `/`, `foo`, `:`, and 'string'), but in shell, it is just a single token.
#
# The lexical analyzer for the shell command language is also somewhat unusual
# in that it recursively invokes the parser to handle the body of `$(...)`
# expressions which can contain arbitrary shell code. Such expressions may be
# encountered both inside and outside of double-quoted strings.
#
# The lexical analyzer is responsible for consuming shell here-doc bodies which
# extend from the line following a `<<TAG` operator until a line consisting
# solely of `TAG`. Here-doc consumption begins when a newline is encountered.
# It is legal for multiple here-doc `<<TAG` operators to be present on a single
# line, in which case their bodies must be present one following the next, and
# are consumed in the (left-to-right) order the `<<TAG` operators appear on the
# line. A special complication is that the bodies of all here-docs must be
# consumed when the newline is encountered even if the parse context depth has
# changed. For instance, in `cat <<A && x=$(cat <<B &&\n`, bodies of here-docs
# "A" and "B" must be consumed even though "A" was introduced outside the
# recursive parse context in which "B" was introduced and in which the newline
# is encountered.
package Lexer;

sub new {
	my ($class, $parser, $s) = @_;
	bless {
		parser => $parser,
		buff => $s,
		heretags => []
	} => $class;
}

sub scan_heredoc_tag {
	my $self = shift @_;
	${$self->{buff}} =~ /\G(-?)/gc;
	my $indented = $1;
	my $tag = $self->scan_token();
	$tag =~ s/['"\\]//g;
	push(@{$self->{heretags}}, $indented ? "\t$tag" : "$tag");
	return "<<$indented$tag";
}

sub scan_op {
	my ($self, $c) = @_;
	my $b = $self->{buff};
	return $c unless $$b =~ /\G(.)/sgc;
	my $cc = $c . $1;
	return scan_heredoc_tag($self) if $cc eq '<<';
	return $cc if $cc =~ /^(?:&&|\|\||>>|;;|<&|>&|<>|>\|)$/;
	pos($$b)--;
	return $c;
}

sub scan_sqstring {
	my $self = shift @_;
	${$self->{buff}} =~ /\G([^']*'|.*\z)/sgc;
	return "'" . $1;
}

sub scan_dqstring {
	my $self = shift @_;
	my $b = $self->{buff};
	my $s = '"';
	while (1) {
		# slurp up non-special characters
		$s .= $1 if $$b =~ /\G([^"\$\\]+)/gc;
		# handle special characters
		last unless $$b =~ /\G(.)/sgc;
		my $c = $1;
		$s .= '"', last if $c eq '"';
		$s .= '$' . $self->scan_dollar(), next if $c eq '$';
		if ($c eq '\\') {
			$s .= '\\', last unless $$b =~ /\G(.)/sgc;
			$c = $1;
			next if $c eq "\n"; # line splice
			# backslash escapes only $, `, ", \ in dq-string
			$s .= '\\' unless $c =~ /^[\$`"\\]$/;
			$s .= $c;
			next;
		}
		die("internal error scanning dq-string '$c'\n");
	}
	return $s;
}

sub scan_balanced {
	my ($self, $c1, $c2) = @_;
	my $b = $self->{buff};
	my $depth = 1;
	my $s = $c1;
	while ($$b =~ /\G([^\Q$c1$c2\E]*(?:[\Q$c1$c2\E]|\z))/gc) {
		$s .= $1;
		$depth++, next if $s =~ /\Q$c1\E$/;
		$depth--;
		last if $depth == 0;
	}
	return $s;
}

sub scan_subst {
	my $self = shift @_;
	my @tokens = $self->{parser}->parse(qr/^\)$/);
	$self->{parser}->next_token(); # closing ")"
	return @tokens;
}

sub scan_dollar {
	my $self = shift @_;
	my $b = $self->{buff};
	return $self->scan_balanced('(', ')') if $$b =~ /\G\((?=\()/gc; # $((...))
	return '(' . join(' ', $self->scan_subst()) . ')' if $$b =~ /\G\(/gc; # $(...)
	return $self->scan_balanced('{', '}') if $$b =~ /\G\{/gc; # ${...}
	return $1 if $$b =~ /\G(\w+)/gc; # $var
	return $1 if $$b =~ /\G([@*#?$!0-9-])/gc; # $*, $1, $$, etc.
	return '';
}

sub swallow_heredocs {
	my $self = shift @_;
	my $b = $self->{buff};
	my $tags = $self->{heretags};
	while (my $tag = shift @$tags) {
		my $indent = $tag =~ s/^\t// ? '\\s*' : '';
		$$b =~ /(?:\G|\n)$indent\Q$tag\E(?:\n|\z)/gc;
	}
}

sub scan_token {
	my $self = shift @_;
	my $b = $self->{buff};
	my $token = '';
RESTART:
	$$b =~ /\G[ \t]+/gc; # skip whitespace (but not newline)
	return "\n" if $$b =~ /\G#[^\n]*(?:\n|\z)/gc; # comment
	while (1) {
		# slurp up non-special characters
		$token .= $1 if $$b =~ /\G([^\\;&|<>(){}'"\$\s]+)/gc;
		# handle special characters
		last unless $$b =~ /\G(.)/sgc;
		my $c = $1;
		last if $c =~ /^[ \t]$/; # whitespace ends token
		pos($$b)--, last if length($token) && $c =~ /^[;&|<>(){}\n]$/;
		$token .= $self->scan_sqstring(), next if $c eq "'";
		$token .= $self->scan_dqstring(), next if $c eq '"';
		$token .= $c . $self->scan_dollar(), next if $c eq '$';
		$self->swallow_heredocs(), $token = $c, last if $c eq "\n";
		$token = $self->scan_op($c), last if $c =~ /^[;&|<>]$/;
		$token = $c, last if $c =~ /^[(){}]$/;
		if ($c eq '\\') {
			$token .= '\\', last unless $$b =~ /\G(.)/sgc;
			$c = $1;
			next if $c eq "\n" && length($token); # line splice
			goto RESTART if $c eq "\n"; # line splice
			$token .= '\\' . $c;
			next;
		}
		die("internal error scanning character '$c'\n");
	}
	return length($token) ? $token : undef;
}

package ScriptParser;

sub new {
	my $class = shift @_;
	my $self = bless {} => $class;
	$self->{output} = [];
	$self->{ntests} = 0;
	return $self;
}

sub parse_cmd {
	return undef;
}

# main contains high-level functionality for processing command-line switches,
# feeding input test scripts to ScriptParser, and reporting results.
package main;

my $getnow = sub { return time(); };
my $interval = sub { return time() - shift; };
if (eval {require Time::HiRes; Time::HiRes->import(); 1;}) {
	$getnow = sub { return [Time::HiRes::gettimeofday()]; };
	$interval = sub { return Time::HiRes::tv_interval(shift); };
}

sub show_stats {
	my ($start_time, $stats) = @_;
	my $walltime = $interval->($start_time);
	my ($usertime) = times();
	my ($total_workers, $total_scripts, $total_tests, $total_errs) = (0, 0, 0, 0);
	for (@$stats) {
		my ($worker, $nscripts, $ntests, $nerrs) = @$_;
		print(STDERR "worker $worker: $nscripts scripts, $ntests tests, $nerrs errors\n");
		$total_workers++;
		$total_scripts += $nscripts;
		$total_tests += $ntests;
		$total_errs += $nerrs;
	}
	printf(STDERR "total: %d workers, %d scripts, %d tests, %d errors, %.2fs/%.2fs (wall/user)\n", $total_workers, $total_scripts, $total_tests, $total_errs, $walltime, $usertime);
}

sub check_script {
	my ($id, $next_script, $emit) = @_;
	my ($nscripts, $ntests, $nerrs) = (0, 0, 0);
	while (my $path = $next_script->()) {
		$nscripts++;
		my $fh;
		unless (open($fh, "<", $path)) {
			$emit->("?!ERR?! $path: $!\n");
			next;
		}
		my $s = do { local $/; <$fh> };
		close($fh);
		my $parser = ScriptParser->new(\$s);
		1 while $parser->parse_cmd();
		if (@{$parser->{output}}) {
			my $s = join('', @{$parser->{output}});
			$emit->("# chainlint: $path\n" . $s);
			$nerrs += () = $s =~ /\?![^?]+\?!/g;
		}
		$ntests += $parser->{ntests};
	}
	return [$id, $nscripts, $ntests, $nerrs];
}

sub exit_code {
	my $stats = shift @_;
	for (@$stats) {
		my ($worker, $nscripts, $ntests, $nerrs) = @$_;
		return 1 if $nerrs;
	}
	return 0;
}

Getopt::Long::Configure(qw{bundling});
GetOptions(
	"emit-all!" => \$emit_all,
	"stats|show-stats!" => \$show_stats) or die("option error\n");

my $start_time = $getnow->();
my @stats;

my @scripts;
push(@scripts, File::Glob::bsd_glob($_)) for (@ARGV);
unless (@scripts) {
	show_stats($start_time, \@stats) if $show_stats;
	exit;
}

push(@stats, check_script(1, sub { shift(@scripts); }, sub { print(@_); }));
show_stats($start_time, \@stats) if $show_stats;
exit(exit_code(\@stats));
t: add skeleton chainlint.pl Although chainlint.sed usefully identifies broken &&-chains in tests, it has several shortcomings which include: * only detects &&-chain breakage in subshells (one-level deep) * does not check for broken top-level &&-chains; that task is left to the "magic exit code 117" checker built into test-lib.sh, however, that detection does not extend to `{...}` blocks, `$(...)` expressions, or compound statements such as `if...fi`, `while...done`, `case...esac` * uses heuristics, which makes it (potentially) fallible and difficult to tweak to handle additional real-world cases * written in `sed` and employs advanced `sed` operators which are probably not well-known to many programmers, thus the pool of people who can maintain it is likely small * manually simulates recursion into subshells which makes it much more difficult to reason about than, say, a traditional top-down parser * checks each test as the test is run, which can get expensive for tests which are run repeatedly by functions or loops since their bodies will be checked over and over (tens or hundreds of times) unnecessarily To address these shortcomings, begin implementing a more functional and precise test linter which understands shell syntax and semantics rather than employing heuristics, thus is able to recognize structural problems with tests beyond broken &&-chains. The new linter is written in Perl, thus should be more accessible to a wider audience, and is structured as a traditional top-down parser which makes it much easier to reason about, and allows it to inspect compound statements within test bodies to any depth. Furthermore, it can check all test definitions in the entire project in a single invocation rather than having to be invoked once per test, and each test definition is checked only once no matter how many times the test is actually run. At this stage, the new linter is just a skeleton containing boilerplate which handles command-line options, collects and reports statistics, and feeds its arguments -- paths of test scripts -- to a (presently) do-nothing script parser for validation. Subsequent changes will flesh out the functionality. Signed-off-by: Eric Sunshine <sunshine@sunshineco.com> Signed-off-by: Junio C Hamano <gitster@pobox.com> 2022-09-01 02:29:39 +02:00			`#!/usr/bin/env perl`
			`#`
			`# Copyright (c) 2021-2022 Eric Sunshine <sunshine@sunshineco.com>`
			`#`
			`# This tool scans shell scripts for test definitions and checks those tests for`
			`# problems, such as broken &&-chains, which might hide bugs in the tests`
			`# themselves or in behaviors being exercised by the tests.`
			`#`
			`# Input arguments are pathnames of shell scripts containing test definitions,`
			`# or globs referencing a collection of scripts. For each problem discovered,`
			`# the pathname of the script containing the test is printed along with the test`
			# name and the test body with a `?!FOO?!` annotation at the location of each
			`# detected problem, where "FOO" is a tag such as "AMP" which indicates a broken`
			`# &&-chain. Returns zero if no problems are discovered, otherwise non-zero.`

			`use warnings;`
			`use strict;`
			`use File::Glob;`
			`use Getopt::Long;`

			`my $show_stats;`
			`my $emit_all;`

chainlint.pl: add POSIX shell lexical analyzer Begin fleshing out chainlint.pl by adding a lexical analyzer for the POSIX shell command language. The sole entry point Lexer::scan_token() returns the next token from the input. It will be called by the upcoming shell language parser. Signed-off-by: Eric Sunshine <sunshine@sunshineco.com> Signed-off-by: Junio C Hamano <gitster@pobox.com> 2022-09-01 02:29:40 +02:00			`# Lexer tokenizes POSIX shell scripts. It is roughly modeled after section 2.3`
			`# "Token Recognition" of POSIX chapter 2 "Shell Command Language". Although`
			`# similar to lexical analyzers for other languages, this one differs in a few`
			`# substantial ways due to quirks of the shell command language.`
			`#`
			`# For instance, in many languages, newline is just whitespace like space or`
			`# TAB, but in shell a newline is a command separator, thus a distinct lexical`
			`# token. A newline is significant and returned as a distinct token even at the`
			`# end of a shell comment.`
			`#`
			# In other languages, `1+2` would typically be scanned as three tokens
			# (`1`, `+`, and `2`), but in shell it is a single token. However, the similar
			# `1 + 2`, which embeds whitepace, is scanned as three token in shell, as well.
			`# In shell, several characters with special meaning lose that meaning when not`
			# surrounded by whitespace. For instance, the negation operator `!` is special
			# when standing alone surrounded by whitespace; whereas in `foo!uucp` it is
			`# just a plain character in the longer token "foo!uucp". In many other`
			# languages, `"string"/foo:'string'` might be scanned as five tokens ("string",
			# `/`, `foo`, `:`, and 'string'), but in shell, it is just a single token.
			`#`
			`# The lexical analyzer for the shell command language is also somewhat unusual`
			# in that it recursively invokes the parser to handle the body of `$(...)`
			`# expressions which can contain arbitrary shell code. Such expressions may be`
			`# encountered both inside and outside of double-quoted strings.`
			`#`
			`# The lexical analyzer is responsible for consuming shell here-doc bodies which`
			# extend from the line following a `<<TAG` operator until a line consisting
			# solely of `TAG`. Here-doc consumption begins when a newline is encountered.
			# It is legal for multiple here-doc `<<TAG` operators to be present on a single
			`# line, in which case their bodies must be present one following the next, and`
			# are consumed in the (left-to-right) order the `<<TAG` operators appear on the
			`# line. A special complication is that the bodies of all here-docs must be`
			`# consumed when the newline is encountered even if the parse context depth has`
			# changed. For instance, in `cat <<A && x=$(cat <<B &&\n`, bodies of here-docs
			`# "A" and "B" must be consumed even though "A" was introduced outside the`
			`# recursive parse context in which "B" was introduced and in which the newline`
			`# is encountered.`
			`package Lexer;`

			`sub new {`
			`my ($class, $parser, $s) = @_;`
			`bless {`
			`parser => $parser,`
			`buff => $s,`
			`heretags => []`
			`} => $class;`
			`}`

			`sub scan_heredoc_tag {`
			`my $self = shift @_;`
			`${$self->{buff}} =~ /\G(-?)/gc;`
			`my $indented = $1;`
			`my $tag = $self->scan_token();`
			`$tag =~ s/['"\\]//g;`
			`push(@{$self->{heretags}}, $indented ? "\t$tag" : "$tag");`
			`return "<<$indented$tag";`
			`}`

			`sub scan_op {`
			`my ($self, $c) = @_;`
			`my $b = $self->{buff};`
			`return $c unless $$b =~ /\G(.)/sgc;`
			`my $cc = $c . $1;`
			`return scan_heredoc_tag($self) if $cc eq '<<';`
			`return $cc if $cc =~ /^(?:&&\|\\|\\|\|>>\|;;\|<&\|>&\|<>\|>\\|)$/;`
			`pos($$b)--;`
			`return $c;`
			`}`

			`sub scan_sqstring {`
			`my $self = shift @_;`
			`${$self->{buff}} =~ /\G([^']'\|.\z)/sgc;`
			`return "'" . $1;`
			`}`

			`sub scan_dqstring {`
			`my $self = shift @_;`
			`my $b = $self->{buff};`
			`my $s = '"';`
			`while (1) {`
			`# slurp up non-special characters`
			`$s .= $1 if $$b =~ /\G([^"\$\\]+)/gc;`
			`# handle special characters`
			`last unless $$b =~ /\G(.)/sgc;`
			`my $c = $1;`
			`$s .= '"', last if $c eq '"';`
			`$s .= '$' . $self->scan_dollar(), next if $c eq '$';`
			`if ($c eq '\\') {`
			`$s .= '\\', last unless $$b =~ /\G(.)/sgc;`
			`$c = $1;`
			`next if $c eq "\n"; # line splice`
			# backslash escapes only $, `, ", \ in dq-string
			$s .= '\\' unless $c =~ /^[\$`"\\]$/;
			`$s .= $c;`
			`next;`
			`}`
			`die("internal error scanning dq-string '$c'\n");`
			`}`
			`return $s;`
			`}`

			`sub scan_balanced {`
			`my ($self, $c1, $c2) = @_;`
			`my $b = $self->{buff};`
			`my $depth = 1;`
			`my $s = $c1;`
			`while ($$b =~ /\G([^\Q$c1$c2\E]*(?:[\Q$c1$c2\E]\|\z))/gc) {`
			`$s .= $1;`
			`$depth++, next if $s =~ /\Q$c1\E$/;`
			`$depth--;`
			`last if $depth == 0;`
			`}`
			`return $s;`
			`}`

			`sub scan_subst {`
			`my $self = shift @_;`
			`my @tokens = $self->{parser}->parse(qr/^\)$/);`
			`$self->{parser}->next_token(); # closing ")"`
			`return @tokens;`
			`}`

			`sub scan_dollar {`
			`my $self = shift @_;`
			`my $b = $self->{buff};`
			`return $self->scan_balanced('(', ')') if $$b =~ /\G\((?=\()/gc; # $((...))`
			`return '(' . join(' ', $self->scan_subst()) . ')' if $$b =~ /\G\(/gc; # $(...)`
			`return $self->scan_balanced('{', '}') if $$b =~ /\G\{/gc; # ${...}`
			`return $1 if $$b =~ /\G(\w+)/gc; # $var`
			`return $1 if $$b =~ /\G([@#?$!0-9-])/gc; # $, $1, $$, etc.`
			`return '';`
			`}`

			`sub swallow_heredocs {`
			`my $self = shift @_;`
			`my $b = $self->{buff};`
			`my $tags = $self->{heretags};`
			`while (my $tag = shift @$tags) {`
			`my $indent = $tag =~ s/^\t// ? '\\s*' : '';`
			`$$b =~ /(?:\G\|\n)$indent\Q$tag\E(?:\n\|\z)/gc;`
			`}`
			`}`

			`sub scan_token {`
			`my $self = shift @_;`
			`my $b = $self->{buff};`
			`my $token = '';`
			`RESTART:`
			`$$b =~ /\G[ \t]+/gc; # skip whitespace (but not newline)`
			`return "\n" if $$b =~ /\G#[^\n]*(?:\n\|\z)/gc; # comment`
			`while (1) {`
			`# slurp up non-special characters`
			`$token .= $1 if $$b =~ /\G([^\\;&\|<>(){}'"\$\s]+)/gc;`
			`# handle special characters`
			`last unless $$b =~ /\G(.)/sgc;`
			`my $c = $1;`
			`last if $c =~ /^[ \t]$/; # whitespace ends token`
			`pos($$b)--, last if length($token) && $c =~ /^[;&\|<>(){}\n]$/;`
			`$token .= $self->scan_sqstring(), next if $c eq "'";`
			`$token .= $self->scan_dqstring(), next if $c eq '"';`
			`$token .= $c . $self->scan_dollar(), next if $c eq '$';`
			`$self->swallow_heredocs(), $token = $c, last if $c eq "\n";`
			`$token = $self->scan_op($c), last if $c =~ /^[;&\|<>]$/;`
			`$token = $c, last if $c =~ /^[(){}]$/;`
			`if ($c eq '\\') {`
			`$token .= '\\', last unless $$b =~ /\G(.)/sgc;`
			`$c = $1;`
			`next if $c eq "\n" && length($token); # line splice`
			`goto RESTART if $c eq "\n"; # line splice`
			`$token .= '\\' . $c;`
			`next;`
			`}`
			`die("internal error scanning character '$c'\n");`
			`}`
			`return length($token) ? $token : undef;`
			`}`

t: add skeleton chainlint.pl Although chainlint.sed usefully identifies broken &&-chains in tests, it has several shortcomings which include: * only detects &&-chain breakage in subshells (one-level deep) * does not check for broken top-level &&-chains; that task is left to the "magic exit code 117" checker built into test-lib.sh, however, that detection does not extend to `{...}` blocks, `$(...)` expressions, or compound statements such as `if...fi`, `while...done`, `case...esac` * uses heuristics, which makes it (potentially) fallible and difficult to tweak to handle additional real-world cases * written in `sed` and employs advanced `sed` operators which are probably not well-known to many programmers, thus the pool of people who can maintain it is likely small * manually simulates recursion into subshells which makes it much more difficult to reason about than, say, a traditional top-down parser * checks each test as the test is run, which can get expensive for tests which are run repeatedly by functions or loops since their bodies will be checked over and over (tens or hundreds of times) unnecessarily To address these shortcomings, begin implementing a more functional and precise test linter which understands shell syntax and semantics rather than employing heuristics, thus is able to recognize structural problems with tests beyond broken &&-chains. The new linter is written in Perl, thus should be more accessible to a wider audience, and is structured as a traditional top-down parser which makes it much easier to reason about, and allows it to inspect compound statements within test bodies to any depth. Furthermore, it can check all test definitions in the entire project in a single invocation rather than having to be invoked once per test, and each test definition is checked only once no matter how many times the test is actually run. At this stage, the new linter is just a skeleton containing boilerplate which handles command-line options, collects and reports statistics, and feeds its arguments -- paths of test scripts -- to a (presently) do-nothing script parser for validation. Subsequent changes will flesh out the functionality. Signed-off-by: Eric Sunshine <sunshine@sunshineco.com> Signed-off-by: Junio C Hamano <gitster@pobox.com> 2022-09-01 02:29:39 +02:00			`package ScriptParser;`

			`sub new {`
			`my $class = shift @_;`
			`my $self = bless {} => $class;`
			`$self->{output} = [];`
			`$self->{ntests} = 0;`
			`return $self;`
			`}`

			`sub parse_cmd {`
			`return undef;`
			`}`

			`# main contains high-level functionality for processing command-line switches,`
			`# feeding input test scripts to ScriptParser, and reporting results.`
			`package main;`

			`my $getnow = sub { return time(); };`
			`my $interval = sub { return time() - shift; };`
			`if (eval {require Time::HiRes; Time::HiRes->import(); 1;}) {`
			`$getnow = sub { return [Time::HiRes::gettimeofday()]; };`
			`$interval = sub { return Time::HiRes::tv_interval(shift); };`
			`}`

			`sub show_stats {`
			`my ($start_time, $stats) = @_;`
			`my $walltime = $interval->($start_time);`
			`my ($usertime) = times();`
			`my ($total_workers, $total_scripts, $total_tests, $total_errs) = (0, 0, 0, 0);`
			`for (@$stats) {`
			`my ($worker, $nscripts, $ntests, $nerrs) = @$_;`
			`print(STDERR "worker $worker: $nscripts scripts, $ntests tests, $nerrs errors\n");`
			`$total_workers++;`
			`$total_scripts += $nscripts;`
			`$total_tests += $ntests;`
			`$total_errs += $nerrs;`
			`}`
			`printf(STDERR "total: %d workers, %d scripts, %d tests, %d errors, %.2fs/%.2fs (wall/user)\n", $total_workers, $total_scripts, $total_tests, $total_errs, $walltime, $usertime);`
			`}`

			`sub check_script {`
			`my ($id, $next_script, $emit) = @_;`
			`my ($nscripts, $ntests, $nerrs) = (0, 0, 0);`
			`while (my $path = $next_script->()) {`
			`$nscripts++;`
			`my $fh;`
			`unless (open($fh, "<", $path)) {`
			`$emit->("?!ERR?! $path: $!\n");`
			`next;`
			`}`
			`my $s = do { local $/; <$fh> };`
			`close($fh);`
			`my $parser = ScriptParser->new(\$s);`
			`1 while $parser->parse_cmd();`
			`if (@{$parser->{output}}) {`
			`my $s = join('', @{$parser->{output}});`
			`$emit->("# chainlint: $path\n" . $s);`
			`$nerrs += () = $s =~ /\?![^?]+\?!/g;`
			`}`
			`$ntests += $parser->{ntests};`
			`}`
			`return [$id, $nscripts, $ntests, $nerrs];`
			`}`

			`sub exit_code {`
			`my $stats = shift @_;`
			`for (@$stats) {`
			`my ($worker, $nscripts, $ntests, $nerrs) = @$_;`
			`return 1 if $nerrs;`
			`}`
			`return 0;`
			`}`

			`Getopt::Long::Configure(qw{bundling});`
			`GetOptions(`
			`"emit-all!" => \$emit_all,`
			`"stats\|show-stats!" => \$show_stats) or die("option error\n");`

			`my $start_time = $getnow->();`
			`my @stats;`

			`my @scripts;`
			`push(@scripts, File::Glob::bsd_glob($_)) for (@ARGV);`
			`unless (@scripts) {`
			`show_stats($start_time, \@stats) if $show_stats;`
			`exit;`
			`}`

			`push(@stats, check_script(1, sub { shift(@scripts); }, sub { print(@_); }));`
			`show_stats($start_time, \@stats) if $show_stats;`
			`exit(exit_code(\@stats));`