Files
littlefs/scripts/bench.py
Christopher Haster 275ca0e0ec scripts: bench.py: Fixed issue where cumul results were mixed together
Whoops, looks like cumulative results were overlooked when multiple
bench measurements per bench were added. We were just adding all
cumulative results together!

This led to some very confusing bench results.

The solution here is to keep track of per-measurement cumulative results
via a Python dict. Which adds some memory usage, but definitely not
enough to be noticeable in the context of the bench-runner.
2025-05-15 16:16:41 -05:00

1740 lines
63 KiB
Python
Executable File

#!/usr/bin/env python3
#
# Script to compile and runs benches.
#
# Example:
# ./scripts/bench.py runners/bench_runner -b
#
# Copyright (c) 2022, The littlefs authors.
# SPDX-License-Identifier: BSD-3-Clause
#
# prevent local imports
if __name__ == "__main__":
__import__('sys').path.pop(0)
import collections as co
import csv
import errno
import fnmatch
import itertools as it
import functools as ft
import os
import pty
import re
import shlex
import shutil
import signal
import subprocess as sp
import sys
import threading as th
import time
try:
import tomllib as toml
except ModuleNotFoundError:
import tomli as toml
RUNNER_PATH = ['./runners/bench_runner']
HEADER_PATH = 'runners/bench_runner.h'
GDB_PATH = ['gdb']
VALGRIND_PATH = ['valgrind']
PERF_SCRIPT = ['./scripts/perf.py']
# open with '-' for stdin/stdout
def openio(path, mode='r', buffering=-1):
import os
if path == '-':
if 'r' in mode:
return os.fdopen(os.dup(sys.stdin.fileno()), mode, buffering)
else:
return os.fdopen(os.dup(sys.stdout.fileno()), mode, buffering)
else:
return open(path, mode, buffering)
# a define range
class DRange:
def __init__(self, start, stop=None, step=None):
if stop is None:
start, stop = None, start
self.start = start if start is not None else 0
self.stop = stop
self.step = step if step is not None else 1
def __len__(self):
if self.step > 0:
return (self.stop-1 - self.start) // self.step + 1
else:
return (self.start-1 - self.stop) // -self.step + 1
def next(self, i):
return '(%s)*%d + %d' % (i, self.step, self.start)
class BenchCase:
# create a BenchCase object from a config
def __init__(self, config, args={}):
self.name = config.pop('name')
self.path = config.pop('path')
self.suite = config.pop('suite')
self.lineno = config.pop('lineno', None)
self.if_ = config.pop('if', [])
if not isinstance(self.if_, list):
self.if_ = [self.if_]
self.ifdef = config.pop('ifdef', [])
if not isinstance(self.ifdef, list):
self.ifdef = [self.ifdef]
self.code = config.pop('code')
self.code_lineno = config.pop('code_lineno', None)
self.in_ = config.pop('in',
config.pop('suite_in', None))
self.internal = bool(self.in_)
# figure out defines and build possible permutations
self.defines = set()
self.permutations = []
# defines can be a dict or a list or dicts
suite_defines = config.pop('suite_defines', {})
if not isinstance(suite_defines, list):
suite_defines = [suite_defines]
defines = config.pop('defines', {})
if not isinstance(defines, list):
defines = [defines]
def csplit(v):
# split commas but only outside of parens
parens = 0
i_ = 0
for i in range(len(v)):
if v[i] == ',' and parens == 0:
yield v[i_:i]
i_ = i+1
elif v[i] in '([{':
parens += 1
elif v[i] in '}])':
parens -= 1
if v[i_:].strip():
yield v[i_:]
def parse_define(v):
# a define entry can be a list
if isinstance(v, list):
return sum((parse_define(v_) for v_ in v), [])
# or a string
elif isinstance(v, str):
# which can be comma-separated values, with optional
# range statements. This matches the runtime define parser in
# the runner itself.
vs = []
for v_ in csplit(v):
m = re.match(r'^\s*range\s*\((.*)\)\s*$', v_)
if m:
vs.append(DRange(*[
int(a, 0) for a in csplit(m.group(1))]))
else:
vs.append(v_)
return vs
# or a literal value
elif isinstance(v, bool):
return ['true' if v else 'false']
else:
return [v]
# build possible permutations
for suite_defines_ in suite_defines:
self.defines |= suite_defines_.keys()
for defines_ in defines:
self.defines |= defines_.keys()
self.permutations.append({
k: parse_define(v)
for k, v in (suite_defines_ | defines_).items()})
for k in config.keys():
print('%swarning:%s in %s, found unused key %r' % (
'\x1b[1;33m' if args['color'] else '',
'\x1b[m' if args['color'] else '',
self.name,
k),
file=sys.stderr)
def __repr__(self):
return '<BenchCase %s>' % self.name
def __lt__(self, other):
# sort by suite, lineno, and name
return ((self.suite, self.lineno, self.name)
< (other.suite, other.lineno, other.name))
def isin(self, path):
return (self.in_ is not None
and os.path.normpath(self.in_)
== os.path.normpath(path))
class BenchSuite:
# create a BenchSuite object from a toml file
def __init__(self, path, args={}):
self.path = path
self.name = os.path.basename(path)
if self.name.endswith('.toml'):
self.name = self.name[:-len('.toml')]
# load toml file and parse bench cases
with open(self.path) as f:
# load benches
config = toml.load(f.buffer)
# find line numbers
f.seek(0)
case_linenos = []
code_linenos = []
for i, line in enumerate(f):
match = re.match(
'(?P<case>\[\s*cases\s*\.\s*(?P<name>\w+)\s*\])'
'|' '(?P<code>code\s*=)',
line)
if match and match.group('case'):
case_linenos.append((i+1, match.group('name')))
elif match and match.group('code'):
code_linenos.append(i+2)
# sort in case toml parsing did not retain order
case_linenos.sort()
cases = config.pop('cases', {})
for (lineno, name), (nlineno, _) in it.zip_longest(
case_linenos, case_linenos[1:],
fillvalue=(float('inf'), None)):
code_lineno = min(
(l for l in code_linenos
if l >= lineno and l < nlineno),
default=None)
cases[name]['lineno'] = lineno
cases[name]['code_lineno'] = code_lineno
self.if_ = config.pop('if', [])
if not isinstance(self.if_, list):
self.if_ = [self.if_]
self.ifdef = config.pop('ifdef', [])
if not isinstance(self.ifdef, list):
self.ifdef = [self.ifdef]
self.code = config.pop('code', None)
self.code_lineno = min(
(l for l in code_linenos
if not case_linenos or l < case_linenos[0][0]),
default=None)
self.in_ = config.pop('in', None)
self.after = config.pop('after', [])
if not isinstance(self.after, list):
self.after = [self.after]
# a couple of these we just forward to all cases
defines = config.pop('defines', {})
self.cases = []
for name, case in cases.items():
self.cases.append(BenchCase(
config={
'name': name,
'path': path + (':%d' % case['lineno']
if 'lineno' in case else ''),
'suite': self.name,
'suite_defines': defines,
'suite_in': self.in_,
**case},
args=args))
# sort for consistency
self.cases.sort()
# combine per-case defines
self.defines = set.union(set(), *(
set(case.defines) for case in self.cases))
# combine other per-case things
self.internal = any(case.internal for case in self.cases)
for k in config.keys():
print('%swarning:%s in %s, found unused key %r' % (
'\x1b[1;33m' if args['color'] else '',
'\x1b[m' if args['color'] else '',
self.name,
k),
file=sys.stderr)
def __repr__(self):
return '<BenchSuite %s>' % self.name
def __lt__(self, other):
# sort by name
#
# note we override this with a topological sort during compilation
return self.name < other.name
def isin(self, path):
return (self.in_ is not None
and os.path.normpath(self.in_)
== os.path.normpath(path))
def compile(bench_paths, **args):
# load the suites
suites = [BenchSuite(path, args) for path in bench_paths]
# sort suites by:
# 1. topologically by "after" dependencies
# 2. lexicographically for consistency
pending = co.OrderedDict((suite.name, suite)
for suite in sorted(suites))
suites = []
while pending:
pending_ = co.OrderedDict()
for suite in pending.values():
if not any(after in pending for after in suite.after):
suites.append(suite)
else:
pending_[suite.name] = suite
if len(pending_) == len(pending):
print('%serror:%s cycle detected in suite ordering: {%s}' % (
'\x1b[1;31m' if args['color'] else '',
'\x1b[m' if args['color'] else '',
', '.join(suite.name for suite in pending.values())),
file=sys.stderr)
sys.exit(-1)
pending = pending_
# check for name conflicts, these will cause ambiguity problems later
# when running benches
seen = {}
for suite in suites:
if suite.name in seen:
print('%swarning:%s conflicting suite %r, %s and %s' % (
'\x1b[1;33m' if args['color'] else '',
'\x1b[m' if args['color'] else '',
suite.name,
suite.path,
seen[suite.name].path),
file=sys.stderr)
seen[suite.name] = suite
for case in suite.cases:
# only allow conflicts if a case and its suite share a name
if case.name in seen and not (
isinstance(seen[case.name], BenchSuite)
and seen[case.name].cases == [case]):
print('%swarning:%s conflicting case %r, %s and %s' % (
'\x1b[1;33m' if args['color'] else '',
'\x1b[m' if args['color'] else '',
case.name,
case.path,
seen[case.name].path),
file=sys.stderr)
seen[case.name] = case
# we can only compile one bench suite at a time
if not args.get('source'):
if len(suites) > 1:
print('%serror:%s compiling more than one bench suite? (%r)' % (
'\x1b[1;31m' if args['color'] else '',
'\x1b[m' if args['color'] else '',
bench_paths),
file=sys.stderr)
sys.exit(-1)
suite = suites[0]
# write generated bench source
if 'output' in args:
with openio(args['output'], 'w') as f:
_write = f.write
def write(s):
f.lineno += s.count('\n')
_write(s)
def writeln(s=''):
f.lineno += s.count('\n') + 1
_write(s)
_write('\n')
f.lineno = 1
f.write = write
f.writeln = writeln
f.writeln("// Generated by %s:" % sys.argv[0])
f.writeln("//")
f.writeln("// %s" % ' '.join(sys.argv))
f.writeln("//")
f.writeln()
# include bench_runner.h in every generated file
f.writeln("#include \"%s\"" % args['include'])
f.writeln()
# write out generated functions, this can end up in different
# files depending on the "in" attribute
#
# note it's up to the specific generated file to declare
# the bench defines
def write_case_functions(f, suite, case):
# write any ifdef prologues
if case.ifdef:
for ifdef in case.ifdef:
f.writeln('#ifdef %s' % ifdef)
f.writeln()
# create case define functions
for i, permutation in enumerate(case.permutations):
for k, vs in sorted(permutation.items()):
f.writeln('intmax_t __bench__%s__%s__%d('
'__attribute__((unused)) void *data, '
'size_t i) {' % (
case.name, k, i))
j = 0
for v in vs:
# generate range
if isinstance(v, DRange):
f.writeln(4*' '+'if (i < %d) '
'return %s;' % (
j+len(v), v.next('i-%d' % j)))
j += len(v)
# translate index to define
else:
f.writeln(4*' '+'if (i == %d) '
'return %s;' % (
j, v))
j += 1
f.writeln(4*' '+'__builtin_unreachable();')
f.writeln('}')
f.writeln()
# create case if function
if suite.if_ or case.if_:
f.writeln('bool __bench__%s__if(void) {' % (
case.name))
for if_ in it.chain(suite.if_, case.if_):
f.writeln(4*' '+'if (!(%s)) return false;' % (
'true' if if_ is True
else 'false' if if_ is False
else if_))
f.writeln(4*' '+'return true;')
f.writeln('}')
f.writeln()
# create case run function
f.writeln('void __bench__%s__run('
'__attribute__((unused)) '
'struct lfs_config *CFG) {' % (
case.name))
f.writeln(4*' '+'// bench case %s' % case.name)
if case.code_lineno is not None:
f.writeln(4*' '+'#line %d "%s"' % (
case.code_lineno, suite.path))
f.write(case.code)
if case.code_lineno is not None:
f.writeln(4*' '+'#line %d "%s"' % (
f.lineno+1, args['output']))
f.writeln('}')
f.writeln()
# write any ifdef epilogues
if case.ifdef:
for ifdef in case.ifdef:
f.writeln('#endif')
f.writeln()
if not args.get('source'):
# write any ifdef prologues
if suite.ifdef:
for ifdef in suite.ifdef:
f.writeln('#ifdef %s' % ifdef)
f.writeln()
# write any suite defines
if suite.defines:
for define in sorted(suite.defines):
f.writeln('__attribute__((weak)) intmax_t %s;' % (
define))
f.writeln()
# write any suite code
if suite.code is not None and suite.in_ is None:
if suite.code_lineno is not None:
f.writeln('#line %d "%s"' % (
suite.code_lineno, suite.path))
f.write(suite.code)
if suite.code_lineno is not None:
f.writeln('#line %d "%s"' % (
f.lineno+1, args['output']))
f.writeln()
# create case functions
for case in suite.cases:
if case.in_ is None:
write_case_functions(f, suite, case)
else:
for i, permutation in enumerate(case.permutations):
for k, vs in sorted(permutation.items()):
f.writeln('extern intmax_t __bench__%s__%s__%d('
'void *data, size_t i);' % (
case.name, k, i))
if suite.if_ or case.if_:
f.writeln('extern bool __bench__%s__if('
'void);' % (
case.name))
f.writeln('extern void __bench__%s__run('
'struct lfs_config *CFG);' % (
case.name))
f.writeln()
# write any ifdef epilogues
if suite.ifdef:
for ifdef in suite.ifdef:
f.writeln('#endif')
f.writeln()
# create suite struct
f.writeln('const struct bench_suite __bench__%s__suite = {' % (
suite.name))
f.writeln(4*' '+'.name = "%s",' % suite.name)
f.writeln(4*' '+'.path = "%s",' % suite.path)
f.writeln(4*' '+'.flags = %s,' % (
' | '.join(filter(None, [
'BENCH_INTERNAL' if suite.internal else None]))
or 0))
for ifdef in suite.ifdef:
f.writeln(4*' '+'#ifdef %s' % ifdef)
# create suite defines
if suite.defines:
f.writeln(4*' '+'.defines = (const bench_define_t[]){')
for k in sorted(suite.defines):
f.writeln(8*' '+'{"%s", &%s, NULL, NULL, 0},' % (
k, k))
f.writeln(4*' '+'},')
f.writeln(4*' '+'.define_count = %d,' % len(suite.defines))
for ifdef in suite.ifdef:
f.writeln(4*' '+'#endif')
if suite.cases:
f.writeln(4*' '+'.cases = (const struct bench_case[]){')
for case in suite.cases:
# create case structs
f.writeln(8*' '+'{')
f.writeln(12*' '+'.name = "%s",' % case.name)
f.writeln(12*' '+'.path = "%s",' % case.path)
f.writeln(12*' '+'.flags = %s,' % (
' | '.join(filter(None, [
'BENCH_INTERNAL' if case.internal
else None]))
or 0))
for ifdef in it.chain(suite.ifdef, case.ifdef):
f.writeln(12*' '+'#ifdef %s' % ifdef)
# create case defines
if case.defines:
f.writeln(12*' '+'.defines'
' = (const bench_define_t*)'
'(const bench_define_t[][%d]){' % (
len(suite.defines)))
for i, permutation in enumerate(case.permutations):
f.writeln(16*' '+'{')
for k, vs in sorted(permutation.items()):
f.writeln(20*' '+'[%d] = {'
'"%s", &%s, '
'__bench__%s__%s__%d, '
'NULL, %d},' % (
sorted(suite.defines).index(k),
k, k, case.name, k, i,
sum(len(v)
if isinstance(
v, DRange)
else 1
for v in vs)))
f.writeln(16*' '+'},')
f.writeln(12*' '+'},')
f.writeln(12*' '+'.permutations = %d,' % (
len(case.permutations)))
if suite.if_ or case.if_:
f.writeln(12*' '+'.if_ = __bench__%s__if,' % (
case.name))
f.writeln(12*' '+'.run = __bench__%s__run,' % (
case.name))
for ifdef in it.chain(suite.ifdef, case.ifdef):
f.writeln(12*' '+'#endif')
f.writeln(8*' '+'},')
f.writeln(4*' '+'},')
f.writeln(4*' '+'.case_count = %d,' % len(suite.cases))
f.writeln('};')
f.writeln()
else:
# copy source
f.writeln('#line 1 "%s"' % args['source'])
with open(args['source']) as sf:
shutil.copyfileobj(sf, f)
f.writeln()
# merge all defines we need, otherwise we will run into
# redefinition errors
defines = ({define
for suite in suites
if suite.isin(args['source'])
for define in suite.defines}
| {define
for suite in suites
for case in suite.cases
if case.isin(args['source'])
for define in case.defines})
if defines:
for define in sorted(defines):
f.writeln('__attribute__((weak)) intmax_t %s;' % (
define))
f.writeln()
# write any internal benches
for suite in suites:
# any ifdef prologues
if suite.ifdef:
for ifdef in suite.ifdef:
f.writeln('#ifdef %s' % ifdef)
f.writeln()
# any suite code
if suite.isin(args['source']):
if suite.code_lineno is not None:
f.writeln('#line %d "%s"' % (
suite.code_lineno, suite.path))
f.write(suite.code)
if suite.code_lineno is not None:
f.writeln('#line %d "%s"' % (
f.lineno+1, args['output']))
f.writeln()
# any case functions
for case in suite.cases:
if case.isin(args['source']):
write_case_functions(f, suite, case)
# any ifdef epilogues
if suite.ifdef:
for ifdef in suite.ifdef:
f.writeln('#endif')
f.writeln()
# declare our bench suites
#
# by declaring these as weak we can write these to every
# source file without issue, eventually one of these copies
# will be linked
for suite in suites:
f.writeln('extern const struct bench_suite '
'__bench__%s__suite;' % (
suite.name))
f.writeln()
f.writeln('__attribute__((weak))')
f.writeln('const struct bench_suite *const bench_suites[] = {')
for suite in suites:
f.writeln(4*' '+'&__bench__%s__suite,' % suite.name)
if len(suites) == 0:
f.writeln(4*' '+'0,')
f.writeln('};')
f.writeln('__attribute__((weak))')
f.writeln('const size_t bench_suite_count = %d;' % len(suites))
f.writeln()
def find_runner(runner, id=None, main=True, **args):
cmd = runner.copy()
# run under some external command?
if args.get('exec'):
cmd[:0] = args['exec']
# run under valgrind?
if args.get('valgrind'):
cmd[:0] = args['valgrind_path'] + [
'--leak-check=full',
'--track-origins=yes',
'--error-exitcode=4',
'-q']
# run under perf?
if args.get('perf'):
cmd[:0] = args['perf_script'] + list(filter(None, [
'--record',
'--perf-freq=%s' % args['perf_freq']
if args.get('perf_freq') else None,
'--perf-period=%s' % args['perf_period']
if args.get('perf_period') else None,
'--perf-events=%s' % args['perf_events']
if args.get('perf_events') else None,
'--perf-path=%s' % args['perf_path']
if args.get('perf_path') else None,
'-o%s' % args['perf']]))
# other context
if args.get('define_depth'):
cmd.append('--define-depth=%s' % args['define_depth'])
if args.get('all'):
cmd.append('-a')
# only one thread should write to disk/trace, otherwise the output
# ends up clobbered and useless
if main:
if args.get('disk'):
cmd.append('-d%s' % args['disk'])
if args.get('trace'):
cmd.append('-t%s' % args['trace'])
if args.get('trace_backtrace'):
cmd.append('--trace-backtrace')
if args.get('trace_period'):
cmd.append('--trace-period=%s' % args['trace_period'])
if args.get('trace_freq'):
cmd.append('--trace-freq=%s' % args['trace_freq'])
if args.get('read_sleep'):
cmd.append('--read-sleep=%s' % args['read_sleep'])
if args.get('prog_sleep'):
cmd.append('--prog-sleep=%s' % args['prog_sleep'])
if args.get('erase_sleep'):
cmd.append('--erase-sleep=%s' % args['erase_sleep'])
# defines?
if args.get('define') and id is None:
for define in args.get('define'):
cmd.append('-D%s' % define)
# bench id?
#
# note we disable defines above when id is explicit, defines override id
# in the bench runner, which is not what we want when querying an explicit
# bench id
if id is not None:
cmd.append(id)
return cmd
def find_perms(runner, bench_ids=[], **args):
runner_ = find_runner(runner, main=False, **args)
case_suites = {}
expected_case_perms = co.OrderedDict()
expected_perms = 0
total_perms = 0
# query cases from the runner
cmd = runner_ + ['--list-cases'] + bench_ids
if args.get('verbose'):
print(' '.join(shlex.quote(c) for c in cmd))
proc = sp.Popen(cmd,
stdout=sp.PIPE,
universal_newlines=True,
errors='replace',
close_fds=False)
pattern = re.compile(
'^(?P<case>[^\s]+)'
'\s+(?P<flags>[^\s]+)'
'\s+(?P<filtered>\d+)/(?P<perms>\d+)')
# skip the first line
for line in it.islice(proc.stdout, 1, None):
m = pattern.match(line)
if m:
filtered = int(m.group('filtered'))
perms = int(m.group('perms'))
expected_case_perms[m.group('case')] = (
expected_case_perms.get(m.group('case'), 0)
+ filtered)
expected_perms += filtered
total_perms += perms
proc.wait()
if proc.returncode != 0:
sys.exit(-1)
# get which suite each case belongs to via paths
cmd = runner_ + ['--list-case-paths'] + bench_ids
if args.get('verbose'):
print(' '.join(shlex.quote(c) for c in cmd))
proc = sp.Popen(cmd,
stdout=sp.PIPE,
universal_newlines=True,
errors='replace',
close_fds=False)
pattern = re.compile(
'^(?P<case>[^\s]+)'
'\s+(?P<path>[^:]+):(?P<lineno>\d+)')
# skip the first line
for line in it.islice(proc.stdout, 1, None):
m = pattern.match(line)
if m:
path = m.group('path')
# strip path/suffix here
suite = os.path.basename(path)
if suite.endswith('.toml'):
suite = suite[:-len('.toml')]
case_suites[m.group('case')] = suite
proc.wait()
if proc.returncode != 0:
sys.exit(-1)
# figure out expected suite perms
expected_suite_perms = co.OrderedDict()
for case, suite in case_suites.items():
expected_suite_perms[suite] = (
expected_suite_perms.get(suite, 0)
+ expected_case_perms.get(case, 0))
return (case_suites,
expected_suite_perms,
expected_case_perms,
expected_perms,
total_perms)
def find_path(runner, id, **args):
runner_ = find_runner(runner, id, main=False, **args)
path = None
# query from runner
cmd = runner_ + ['--list-case-paths', id]
if args.get('verbose'):
print(' '.join(shlex.quote(c) for c in cmd))
proc = sp.Popen(cmd,
stdout=sp.PIPE,
universal_newlines=True,
errors='replace',
close_fds=False)
pattern = re.compile(
'^(?P<case>[^\s]+)'
'\s+(?P<path>[^:]+):(?P<lineno>\d+)')
# skip the first line
for line in it.islice(proc.stdout, 1, None):
m = pattern.match(line)
if m and path is None:
path_ = m.group('path')
lineno = int(m.group('lineno'))
path = (path_, lineno)
proc.wait()
if proc.returncode != 0:
sys.exit(-1)
return path
def find_defines(runner, id, **args):
runner_ = find_runner(runner, id, main=False, **args)
# query permutation defines from runner
cmd = runner_ + ['--list-permutation-defines', id]
if args.get('verbose'):
print(' '.join(shlex.quote(c) for c in cmd))
proc = sp.Popen(cmd,
stdout=sp.PIPE,
universal_newlines=True,
errors='replace',
close_fds=False)
defines = co.OrderedDict()
pattern = re.compile('^(?P<define>\w+)=(?P<value>.+)')
for line in proc.stdout:
m = pattern.match(line)
if m:
define = m.group('define')
value = m.group('value')
defines[define] = value
proc.wait()
if proc.returncode != 0:
sys.exit(-1)
return defines
def find_ids(runner, bench_ids=[], **args):
# no ids => all ids, we don't need an extra lookup if no special
# behavior is requested
if not (args.get('by_cases')
or args.get('by_suites')
or bench_ids):
return []
# lookup suites/cases
(suite_cases,
expected_suite_perms,
expected_case_perms,
_,
_) = find_perms(runner, **args)
# no ids => all ids, before we evaluate globs
if not bench_ids and args.get('by_cases'):
return [case_ for case_ in expected_case_perms.keys()]
if not bench_ids and args.get('by_suites'):
return [suite for suite in expected_suite_perms.keys()]
# find suite/case by id
bench_ids_ = []
for id in bench_ids:
# strip permutation
name, *_ = id.split(':', 1)
bench_ids__ = []
# resolve globs
if '*' in name:
bench_ids__.extend(suite
for suite in expected_suite_perms.keys()
if fnmatch.fnmatchcase(suite, name))
if not bench_ids__:
bench_ids__.extend(case_
for case_ in expected_case_perms.keys()
if fnmatch.fnmatchcase(case_, name))
# literal suite
elif name in expected_suite_perms:
bench_ids__.append(id)
# literal case
elif name in expected_case_perms:
bench_ids__.append(id)
# no suite/case found? error
if not bench_ids__:
print('%serror:%s no benches match id %r?' % (
'\x1b[1;31m' if args['color'] else '',
'\x1b[m' if args['color'] else '',
id),
file=sys.stderr)
sys.exit(-1)
bench_ids_.extend(bench_ids__)
bench_ids = bench_ids_
# expand suites to cases?
if args.get('by_cases'):
bench_ids_ = []
for id in bench_ids:
if id in expected_suite_perms:
for case_, suite in suite_cases.items():
if suite == id:
bench_ids_.append(case_)
else:
bench_ids_.append(id)
bench_ids = bench_ids_
# no bench ids found? return a garbage id for consistency
return bench_ids if bench_ids else ['?']
def list_(runner, bench_ids=[], **args):
cmd = find_runner(runner, main=False, **args)
cmd.extend(find_ids(runner, bench_ids, **args))
if args.get('summary'): cmd.append('--summary')
if args.get('list_suites'): cmd.append('--list-suites')
if args.get('list_cases'): cmd.append('--list-cases')
if args.get('list_suite_paths'): cmd.append('--list-suite-paths')
if args.get('list_case_paths'): cmd.append('--list-case-paths')
if args.get('list_defines'): cmd.append('--list-defines')
if args.get('list_permutation_defines'):
cmd.append('--list-permutation-defines')
if args.get('list_implicit_defines'):
cmd.append('--list-implicit-defines')
if args.get('verbose'):
print(' '.join(shlex.quote(c) for c in cmd))
return sp.call(cmd)
# Thread-safe CSV writer
class BenchOutput:
def __init__(self, path, head=None, tail=None):
self.f = openio(path, 'w+', 1)
self.lock = th.Lock()
self.head = head or []
self.tail = tail or []
self.writer = csv.DictWriter(self.f, self.head + self.tail)
self.rows = []
def close(self):
self.f.close()
def __enter__(self):
return self
def __exit__(self, *_):
self.f.close()
def writerow(self, row):
with self.lock:
self.rows.append(row)
if all(k in self.head or k in self.tail for k in row.keys()):
# can simply append
self.writer.writerow(row)
else:
# need to rewrite the file
self.head.extend(row.keys() - (self.head + self.tail))
self.f.seek(0)
self.f.truncate()
self.writer = csv.DictWriter(self.f, self.head + self.tail)
self.writer.writeheader()
for row in self.rows:
self.writer.writerow(row)
# A bench failure
class BenchFailure(Exception):
def __init__(self, id, returncode, stdout, assert_=None):
self.id = id
self.returncode = returncode
self.stdout = stdout
self.assert_ = assert_
def run_stage(name, runner, bench_ids, stdout_, trace_, output_, **args):
# get expected suite/case/perm counts
(case_suites,
expected_suite_perms,
expected_case_perms,
expected_perms,
total_perms) = find_perms(runner, bench_ids, **args)
passed_suite_perms = co.defaultdict(lambda: 0)
passed_case_perms = co.defaultdict(lambda: 0)
passed_perms = 0
failed_perms = 0
readed = 0
proged = 0
erased = 0
failures = []
killed = False
pattern = re.compile('^(?:'
'(?P<op>running|finished|skipped)'
' (?P<id>(?P<case>[^:]+)[^\s]*)'
'|' '(?P<path>[^:]+):(?P<lineno>\d+):(?P<op_>assert):'
' *(?P<message>.*)'
'|' '(?P<op__>benched)'
' (?P<m>[^\s]+)'
' (?P<n>\d+)'
'(?: (?P<readed>[\d\.]+))?'
'(?: (?P<proged>[\d\.]+))?'
'(?: (?P<erased>[\d\.]+))?'
')$')
locals = th.local()
children = set()
def run_runner(runner_):
nonlocal passed_suite_perms
nonlocal passed_case_perms
nonlocal passed_perms
nonlocal readed
nonlocal proged
nonlocal erased
nonlocal locals
# run the benches!
cmd = runner_
if args.get('verbose'):
print(' '.join(shlex.quote(c) for c in cmd))
mpty, spty = pty.openpty()
proc = sp.Popen(cmd, stdout=spty, stderr=spty, close_fds=False)
os.close(spty)
children.add(proc)
mpty = os.fdopen(mpty, 'r', 1)
last_id = None
last_case = None
last_suite = None
last_defines = None # fetched on demand
last_stdout = co.deque(maxlen=args.get('context', 5) + 1)
last_assert = None
creaded = co.defaultdict(lambda: 0)
cproged = co.defaultdict(lambda: 0)
cerased = co.defaultdict(lambda: 0)
try:
while True:
# parse a line for state changes
try:
line = mpty.readline()
except OSError as e:
if e.errno != errno.EIO:
raise
break
if not line:
break
last_stdout.append(line)
if stdout_:
try:
stdout_.write(line)
stdout_.flush()
except BrokenPipeError:
pass
m = pattern.match(line)
if m:
op = m.group('op') or m.group('op_') or m.group('op__')
if op == 'running':
locals.seen_perms += 1
last_id = m.group('id')
last_case = m.group('case')
last_suite = case_suites[last_case]
last_defines = None
last_stdout.clear()
last_assert = None
creaded.clear()
cproged.clear()
cerased.clear()
elif op == 'finished':
# force a failure
if args.get('fail'):
proc.kill()
raise BenchFailure(last_id, 0, list(last_stdout))
# passed
case = m.group('case')
suite = case_suites[case]
passed_suite_perms[suite] += 1
passed_case_perms[case] += 1
passed_perms += 1
elif op == 'skipped':
locals.seen_perms += 1
elif op == 'assert':
last_assert = (
m.group('path'),
int(m.group('lineno')),
m.group('message'))
# go ahead and kill the process, aborting takes a while
if args.get('keep_going'):
proc.kill()
elif op == 'benched':
m_ = m.group('m')
n_ = int(m.group('n'))
# parse measurements
def dat(v):
if v is None:
return 0
elif '.' in v:
return float(v)
else:
return int(v)
readed_ = dat(m.group('readed'))
proged_ = dat(m.group('proged'))
erased_ = dat(m.group('erased'))
# keep track of cumulative measurements
creaded[m_] += readed_
cproged[m_] += proged_
cerased[m_] += erased_
if output_:
# fetch defines if needed, only do this at most
# once per perm
if last_defines is None:
last_defines = find_defines(
runner, last_id, **args)
# write measurements immediately, this allows
# analysis of partial results
output_.writerow({
'suite': last_suite,
'case': last_case,
**last_defines,
'm': m_,
'n': n_,
'bench_readed': readed_,
'bench_proged': proged_,
'bench_erased': erased_,
'bench_creaded': creaded[m_],
'bench_cproged': cproged[m_],
'bench_cerased': cerased[m_]})
# keep track of total for summary
readed += readed_
proged += proged_
erased += erased_
except KeyboardInterrupt:
proc.kill()
raise BenchFailure(last_id, 0, list(last_stdout))
finally:
children.remove(proc)
mpty.close()
proc.wait()
if proc.returncode != 0:
raise BenchFailure(
last_id,
proc.returncode,
list(last_stdout),
last_assert)
def run_job(main=True, start=None, step=None):
nonlocal failed_perms
nonlocal failures
nonlocal killed
nonlocal locals
start = start or 0
step = step or 1
while start < total_perms:
runner_ = find_runner(runner, main=main, **args)
if args.get('isolate') or args.get('valgrind'):
runner_.append('-s%s,%s,%s' % (start, start+step, step))
elif start != 0 or step != 1:
runner_.append('-s%s,,%s' % (start, step))
runner_.extend(bench_ids)
try:
# run the benches
locals.seen_perms = 0
run_runner(runner_)
assert locals.seen_perms > 0
start += locals.seen_perms*step
except BenchFailure as failure:
# race condition for multiple failures?
if not failures or args.get('keep_going'):
# keep track of how many failed
failed_perms += 1
# do not store more failures than we need to, otherwise
# we quickly explode RAM when a common bug fails a bunch
# of cases
if len(failures) < args.get('failures', 3):
failures.append(failure)
if args.get('keep_going') and not killed:
# resume after failed bench
assert locals.seen_perms > 0
start += locals.seen_perms*step
continue
else:
# stop other benches
killed = True
for child in children.copy():
child.kill()
break
# parallel jobs?
runners = []
if 'jobs' in args:
for job in range(args['jobs']):
runners.append(th.Thread(
target=run_job, args=(job == 0, job, args['jobs']),
daemon=True))
else:
runners.append(th.Thread(
target=run_job, args=(True, None, None),
daemon=True))
def print_update(done):
if (not args.get('quiet')
and not args.get('verbose')
and not args.get('stdout') == '-'
and (args['color'] or done)):
sys.stdout.write('%s%srunning %s%s:%s %s%s' % (
'\r\x1b[K' if args['color'] else '',
'\x1b[?7l' if not done else '',
('\x1b[34m' if not failed_perms else '\x1b[31m')
if args['color'] else '',
name,
'\x1b[m' if args['color'] else '',
', '.join(filter(None, [
'%d/%d suites' % (
sum(passed_suite_perms[k] == v
for k, v in expected_suite_perms.items()),
len(expected_suite_perms))
if (not args.get('by_suites')
and not args.get('by_cases')) else None,
'%d/%d cases' % (
sum(passed_case_perms[k] == v
for k, v in expected_case_perms.items()),
len(expected_case_perms))
if not args.get('by_cases') else None,
'%d/%d perms' % (passed_perms, expected_perms),
'%s%d/%d failures%s' % (
'\x1b[31m' if args['color'] else '',
failed_perms,
expected_perms,
'\x1b[m' if args['color'] else '')
if failed_perms else None])),
'\x1b[?7h' if not done else '\n'))
sys.stdout.flush()
for r in runners:
r.start()
try:
while any(r.is_alive() for r in runners):
time.sleep(0.01)
print_update(False)
except KeyboardInterrupt:
# this is handled by the runner threads, we just
# need to not abort here
killed = True
finally:
print_update(True)
for r in runners:
r.join()
return (expected_perms,
passed_perms,
failed_perms,
readed,
proged,
erased,
failures,
killed)
def run(runner, bench_ids=[], **args):
# query runner for benches
if not args.get('quiet'):
print('using runner: %s' % ' '.join(
shlex.quote(c) for c in find_runner(runner, **args)))
# query ids, perms, etc
bench_ids = find_ids(runner, bench_ids, **args)
(_,
expected_suite_perms,
expected_case_perms,
expected_perms,
total_perms) = find_perms(runner, bench_ids, **args)
if not args.get('quiet'):
print('found %d suites, %d cases, %d/%d permutations' % (
len(expected_suite_perms),
len(expected_case_perms),
expected_perms,
total_perms))
print()
# automatic job detection?
if args.get('jobs') == 0:
args['jobs'] = len(os.sched_getaffinity(0))
# truncate and open logs here so they aren't disconnected between benches
stdout = None
if args.get('stdout'):
stdout = openio(args['stdout'], 'w', 1)
trace = None
if args.get('trace'):
trace = openio(args['trace'], 'w', 1)
output = None
if args.get('output'):
output = BenchOutput(args['output'],
['suite', 'case'],
# defines go here
['m', 'n',
'bench_readed',
'bench_proged',
'bench_erased',
'bench_creaded',
'bench_cproged',
'bench_cerased'])
# measure runtime
start = time.time()
# spawn runners
expected = 0
passed = 0
failed = 0
readed = 0
proged = 0
erased = 0
failures = []
for by in (bench_ids if bench_ids else [None]):
# spawn jobs for stage
(expected_,
passed_,
failed_,
readed_,
proged_,
erased_,
failures_,
killed) = run_stage(
by or 'benches',
runner,
[by] if by is not None else [],
stdout,
trace,
output,
**args)
# collect passes/failures
expected += expected_
passed += passed_
failed += failed_
readed += readed_
proged += proged_
erased += erased_
# do not store more failures than we need to, otherwise we
# quickly explode RAM when a common bug fails a bunch of cases
failures.extend(failures_[:max(
args.get('failures', 3) - len(failures),
0)])
if (failed and not args.get('keep_going')) or killed:
break
stop = time.time()
if stdout:
try:
stdout.close()
except BrokenPipeError:
pass
if trace:
try:
trace.close()
except BrokenPipeError:
pass
if output:
output.close()
# show summary
if not args.get('quiet'):
print()
print('%sdone:%s %s' % (
('\x1b[34m' if not failed else '\x1b[31m')
if args['color'] else '',
'\x1b[m' if args['color'] else '',
', '.join(filter(None, [
'%d readed' % readed,
'%d proged' % proged,
'%d erased' % erased,
'in %.2fs' % (stop-start)]))))
print()
# print each failure
for failure in failures[:args.get('failures', 3)]:
assert failure.id is not None, '%s broken? %r' % (
' '.join(shlex.quote(c) for c in find_runner(runner, **args)),
failure)
# get some extra info from runner
path, lineno = find_path(runner, failure.id, **args)
defines = find_defines(runner, failure.id, **args)
# show summary of failure
print('%s%s:%d:%sfailure:%s %s%s failed' % (
'\x1b[01m' if args['color'] else '',
path, lineno,
'\x1b[1;31m' if args['color'] else '',
'\x1b[m' if args['color'] else '',
failure.id,
' (%s)' % ', '.join('%s=%s' % (k,v)
for k,v in defines.items())
if defines else ''))
if failure.stdout:
stdout = failure.stdout
if failure.assert_ is not None:
stdout = stdout[:-1]
for line in stdout[max(len(stdout)-args.get('context', 5), 0):]:
sys.stdout.write(line)
if failure.assert_ is not None:
path, lineno, message = failure.assert_
print('%s%s:%d:%sassert:%s %s' % (
'\x1b[01m' if args['color'] else '',
path, lineno,
'\x1b[1;31m' if args['color'] else '',
'\x1b[m' if args['color'] else '',
message))
with open(path) as f:
line = next(it.islice(f, lineno-1, None)).strip('\n')
print(line)
print()
# drop into gdb?
if failures and (args.get('gdb')
or args.get('gdb_perm')
or args.get('gdb_main')):
failure = failures[0]
cmd = find_runner(runner, failure.id, **args)
if args.get('gdb_main'):
# we don't really need the case breakpoint here, but it
# can be helpful
path, lineno = find_path(runner, failure.id, **args)
cmd[:0] = args['gdb_path'] + [
'-q',
'-ex', 'break main',
'-ex', 'break %s:%d' % (path, lineno),
'-ex', 'run',
'--args']
elif args.get('gdb_perm'):
path, lineno = find_path(runner, failure.id, **args)
cmd[:0] = args['gdb_path'] + [
'-q',
'-ex', 'break %s:%d' % (path, lineno),
'-ex', 'run',
'--args']
else:
cmd[:0] = args['gdb_path'] + [
'-q',
'-ex', 'run',
'--args']
# exec gdb interactively
if args.get('verbose'):
print(' '.join(shlex.quote(c) for c in cmd))
os.execvp(cmd[0], cmd)
return 1 if failed else 0
def main(**args):
# figure out what color should be
if args.get('color') == 'auto':
args['color'] = sys.stdout.isatty()
elif args.get('color') == 'always':
args['color'] = True
else:
args['color'] = False
if args.get('compile'):
return compile(**args)
elif (args.get('summary')
or args.get('list_suites')
or args.get('list_cases')
or args.get('list_suite_paths')
or args.get('list_case_paths')
or args.get('list_defines')
or args.get('list_permutation_defines')
or args.get('list_implicit_defines')):
return list_(**args)
else:
return run(**args)
if __name__ == "__main__":
import argparse
import sys
argparse.ArgumentParser._handle_conflict_ignore = lambda *_: None
argparse._ArgumentGroup._handle_conflict_ignore = lambda *_: None
parser = argparse.ArgumentParser(
description="Build and run benches.",
allow_abbrev=False,
conflict_handler='ignore')
parser.add_argument(
'-v', '--verbose',
action='store_true',
help="Output commands that run behind the scenes.")
parser.add_argument(
'-q', '--quiet',
action='store_true',
help="Show nothing except for bench failures.")
parser.add_argument(
'--color',
choices=['never', 'always', 'auto'],
default='auto',
help="When to use terminal colors. Defaults to 'auto'.")
# bench flags
bench_parser = parser.add_argument_group('bench options')
bench_parser.add_argument(
'bench_ids',
nargs='*',
help="Description of benches to run.")
bench_parser.add_argument(
'-R', '--runner',
type=lambda x: x.split(),
default=RUNNER_PATH,
help="Bench runner to use for benching. Defaults to "
"%r." % RUNNER_PATH)
bench_parser.add_argument(
'-Y', '--summary',
action='store_true',
help="Show quick summary.")
bench_parser.add_argument(
'-l', '--list-suites',
action='store_true',
help="List bench suites.")
bench_parser.add_argument(
'-L', '--list-cases',
action='store_true',
help="List bench cases.")
bench_parser.add_argument(
'--list-suite-paths',
action='store_true',
help="List the path for each bench suite.")
bench_parser.add_argument(
'--list-case-paths',
action='store_true',
help="List the path and line number for each bench case.")
bench_parser.add_argument(
'--list-defines',
action='store_true',
help="List all defines in this bench-runner.")
bench_parser.add_argument(
'--list-permutation-defines',
action='store_true',
help="List explicit defines in this bench-runner.")
bench_parser.add_argument(
'--list-implicit-defines',
action='store_true',
help="List implicit defines in this bench-runner.")
bench_parser.add_argument(
'-D', '--define',
action='append',
help="Override a bench define.")
bench_parser.add_argument(
'--define-depth',
help="How deep to evaluate recursive defines before erroring.")
bench_parser.add_argument(
'-a', '--all',
action='store_true',
help="Ignore bench filters.")
bench_parser.add_argument(
'-d', '--disk',
help="Direct block device operations to this file.")
bench_parser.add_argument(
'-t', '--trace',
help="Direct trace output to this file.")
bench_parser.add_argument(
'--trace-backtrace',
action='store_true',
help="Include a backtrace with every trace statement.")
bench_parser.add_argument(
'--trace-period',
help="Sample trace output at this period in cycles.")
bench_parser.add_argument(
'--trace-freq',
help="Sample trace output at this frequency in hz.")
bench_parser.add_argument(
'-O', '--stdout',
help="Direct stdout to this file. Note stderr is already merged "
"here.")
bench_parser.add_argument(
'-o', '--output',
help="CSV file to store results.")
bench_parser.add_argument(
'--read-sleep',
help="Artificial read delay in seconds.")
bench_parser.add_argument(
'--prog-sleep',
help="Artificial prog delay in seconds.")
bench_parser.add_argument(
'--erase-sleep',
help="Artificial erase delay in seconds.")
bench_parser.add_argument(
'-j', '--jobs',
nargs='?',
type=lambda x: int(x, 0),
const=0,
help="Number of parallel runners to run. 0 runs one runner per "
"core.")
bench_parser.add_argument(
'-k', '--keep-going',
action='store_true',
help="Don't stop on first failure.")
bench_parser.add_argument(
'-f', '--fail',
action='store_true',
help="Force a failure.")
bench_parser.add_argument(
'-i', '--isolate',
action='store_true',
help="Run each bench permutation in a separate process.")
bench_parser.add_argument(
'-b', '--by-suites',
action='store_true',
help="Step through benches by suite.")
bench_parser.add_argument(
'-B', '--by-cases',
action='store_true',
help="Step through benches by case.")
bench_parser.add_argument(
'-F', '--failures',
type=lambda x: int(x, 0),
default=3,
help="Show this many bench failures. Defaults to 3.")
bench_parser.add_argument(
'-C', '--context',
type=lambda x: int(x, 0),
default=5,
help="Show this many lines of stdout on bench failure. "
"Defaults to 5.")
bench_parser.add_argument(
'--gdb',
action='store_true',
help="Drop into gdb on bench failure.")
bench_parser.add_argument(
'--gdb-perm', '--gdb-permutation',
action='store_true',
help="Drop into gdb on bench failure but stop at the beginning "
"of the failing bench case.")
bench_parser.add_argument(
'--gdb-main',
action='store_true',
help="Drop into gdb on bench failure but stop at the beginning "
"of main.")
bench_parser.add_argument(
'--gdb-path',
type=lambda x: x.split(),
default=GDB_PATH,
help="Path to the gdb executable, may include flags. "
"Defaults to %r." % GDB_PATH)
bench_parser.add_argument(
'-e', '--exec',
type=lambda e: e.split(),
help="Run under another executable.")
bench_parser.add_argument(
'--valgrind',
action='store_true',
help="Run under Valgrind to find memory errors. Implicitly sets "
"--isolate.")
bench_parser.add_argument(
'--valgrind-path',
type=lambda x: x.split(),
default=VALGRIND_PATH,
help="Path to the Valgrind executable, may include flags. "
"Defaults to %r." % VALGRIND_PATH)
bench_parser.add_argument(
'-p', '--perf',
help="Run under Linux's perf to sample performance counters, "
"writing samples to this file.")
bench_parser.add_argument(
'--perf-freq',
help="perf sampling frequency. This is passed directly to the "
"perf script.")
bench_parser.add_argument(
'--perf-period',
help="perf sampling period. This is passed directly to the perf "
"script.")
bench_parser.add_argument(
'--perf-events',
help="perf events to record. This is passed directly to the perf "
"script.")
bench_parser.add_argument(
'--perf-script',
type=lambda x: x.split(),
default=PERF_SCRIPT,
help="Path to the perf script to use. Defaults to "
"%r." % PERF_SCRIPT)
bench_parser.add_argument(
'--perf-path',
type=lambda x: x.split(),
help="Path to the perf executable, may include flags. This is "
"passed directly to the perf script")
# compilation flags
comp_parser = parser.add_argument_group('compilation options')
comp_parser.add_argument(
'bench_paths',
nargs='*',
help="Set of *.toml files to compile.")
comp_parser.add_argument(
'-c', '--compile',
action='store_true',
help="Compile a bench suite or source file.")
comp_parser.add_argument(
'-s', '--source',
help="Source file to compile, possibly injecting internal benches.")
comp_parser.add_argument(
'--include',
default=HEADER_PATH,
help="Inject this header file into every compiled bench file. "
"Defaults to %r." % HEADER_PATH)
comp_parser.add_argument(
'-o', '--output',
help="Output file.")
# do the thing
args = parser.parse_intermixed_args()
args.bench_paths = args.bench_ids
sys.exit(main(**{k: v
for k, v in vars(args).items()
if v is not None}))