Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Benchmark script improvements #186

Merged
merged 8 commits into from
May 29, 2019
Merged
Show file tree
Hide file tree
Changes from 7 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
52 changes: 0 additions & 52 deletions scripts/bench.py

This file was deleted.

192 changes: 192 additions & 0 deletions scripts/benchmark.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,192 @@
#!/usr/bin/python3
import argparse
import json
import os
import statistics
import subprocess
import sys

from monotonic import monotonic

from detect_secrets.core.usage import PluginOptions


def main():
    """
    Entry point: time `detect-secrets scan` once per selected plugin, with
    every other plugin disabled, then print the collected timings.

    When every known plugin is selected, an additional 'all-plugins' run
    (no plugin disabled) is timed first.
    """
    args = get_arguments()

    # Progress messages go to stderr so stdout carries only the results.
    plugin_summary = ', '.join(args.plugin)
    print(
        'Running performance tests on: {}'.format(plugin_summary),
        file=sys.stderr,
    )
    print('for: {}'.format(args.filenames), file=sys.stderr)

    # Partition the known plugins: the selected ones are keyed by their
    # disable flag; the rest are disabled in every single run.
    selected = {}
    never_run = []
    for plugin in PluginOptions.all_plugins:
        if plugin.classname not in args.plugin:
            never_run.append(plugin.disable_flag_text)
            continue
        selected[plugin.disable_flag_text] = plugin.classname

    common_options = {
        'filenames': args.filenames,
        'timeout': args.harakiri,
        'num_iterations': args.num_iterations,
    }

    timings = {}
    if len(args.plugin) == len(PluginOptions.all_plugins):
        # The combined baseline is only measured when nothing was excluded.
        timings['all-plugins'] = time_execution(**common_options)

    # Measure one plugin at a time by disabling all the other selected ones.
    for flag, classname in selected.items():
        other_selected = [other for other in selected if other != flag]
        timings[classname] = time_execution(
            flags=other_selected + never_run,
            **common_options
        )

    print_output(timings, args)


def get_arguments():
# Parse the benchmark script's command-line options and return the
# resulting argparse namespace. Two values are defaulted after parsing:
# `filenames` (to the parent of this script's directory) and `plugin`
# (to every classname found in PluginOptions.all_plugins).
plugins = [
info.classname
for info in PluginOptions.all_plugins
]

parser = argparse.ArgumentParser(description='Run some benchmarks.')
parser.add_argument(
'filenames',
nargs=argparse.REMAINDER,
help='Filenames to check or detect-secrets compatible arguments.',
)
parser.add_argument(
'--pretty',
action='store_true',
help='Human readable output.',
)
parser.add_argument(
'--plugin',
default=None, # needs to be None, otherwise append won't work as expected
choices=plugins,
action='append',
help=(
'Specifies a plugin to test. May provide multiple values. '
'Defaults to all.'
),
)
parser.add_argument(
'--harakiri',
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

lol

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

FWIW, I copied uwsgi's syntax for this: https://uwsgi-docs.readthedocs.io/en/latest/Glossary.html

default=5,
type=float,
help=(
'Specifies an upper bound for the number of seconds to wait '
'per execution.'
),
)
parser.add_argument(
'-n',
'--num-iterations',
default=1,
# TODO: assert non-negative
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Whoops. Forgot to remove this lol.

Yeah, we're not breaking new ground here. We've done this before: https://github.com/Yelp/detect-secrets/blob/master/detect_secrets/core/usage.py#L396

type=int,
help=(
'Specifies the number of times to run the test. '
'Results will be averaged over this value.'
),
)

args = parser.parse_args()
# No positional arguments given: fall back to the resolved parent
# directory of the directory containing this script.
if not args.filenames:
args.filenames = [
os.path.realpath(
os.path.join(
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Super nit: variable names could maybe help readability here

os.path.dirname(__file__),
'../',
),
),
]

# No --plugin given (the append action left the default of None):
# select every known plugin.
if not args.plugin:
args.plugin = plugins

return args


def time_execution(filenames, timeout, num_iterations=1, flags=None):
    """
    Run `detect-secrets scan` repeatedly and return the mean wall-clock
    duration of the runs.

    A run that exceeds `timeout` is recorded as having taken exactly
    `timeout` seconds.

    :type filenames: list
    :param filenames: arguments appended after `detect-secrets scan`

    :type timeout: float
    :param timeout: upper bound, in seconds, for a single run

    :type num_iterations: int
    :param num_iterations: number of runs to average over; must be >= 1

    :type flags: list|None
    :param flags: flags to disable

    :rtype: float|None
    :returns: mean duration in seconds, or None if every run timed out

    :raises ValueError: if num_iterations is less than 1
    """
    if num_iterations < 1:
        # Fail early with a clear message instead of letting
        # statistics.mean() choke on an empty list of scores.
        raise ValueError(
            'num_iterations must be at least 1, got {}'.format(
                num_iterations,
            ),
        )

    command = ['detect-secrets', 'scan'] + filenames + (flags or [])

    scores = []
    timed_out_runs = 0
    for _ in range(num_iterations):
        start_time = monotonic()
        try:
            subprocess.check_output(command, timeout=timeout)
        except subprocess.TimeoutExpired:
            timed_out_runs += 1
            scores.append(timeout)
        else:
            scores.append(monotonic() - start_time)

    # Count timeouts explicitly rather than comparing a float mean against
    # the timeout value.
    if timed_out_runs == num_iterations:
        return None

    return statistics.mean(scores)


def print_output(timings, args):
    """
    Write the collected timings to stdout.

    Without `args.pretty`, the timings are printed as a single JSON
    object. With it, they are printed as a two-column table, with the
    'all-plugins' row (if present) first and the rest sorted by key.

    The `timings` dict is never modified.

    :type timings: dict
    :param timings: maps a row name to a duration in seconds, or None

    :type args: Namespace
    :param args: parsed arguments; only `pretty` is read
    """
    if not args.pretty:
        print(json.dumps(timings))
        return

    divider = '-' * 42

    # Print header
    print(divider)
    print('{:<20s}{:>20s}'.format('plugin', 'time'))
    print(divider)

    if 'all-plugins' in timings:
        print_line('all-plugins', timings['all-plugins'])

    for key in sorted(timings):
        # Already printed above; skip it here instead of deleting it from
        # the caller's dict.
        if key == 'all-plugins':
            continue
        print_line(key, timings[key])
    print(divider)


def print_line(name, time):
    """
    Print one row of the pretty-printed timing table.

    :type name: str
    :param name: row label, left-aligned in a 20-character column

    :type time: float|None
    :param time: duration in seconds; None marks a run that timed out
    """
    # Compare against None explicitly: a measured duration of 0 is falsy
    # but is still a real timing, not a timeout.
    if time is None:
        time = 'Timeout exceeded!'
    else:
        time = '{}s'.format(time)

    print('{:<20s}{:>20s}'.format(name, time))


if __name__ == '__main__':
    # Run the benchmark only when executed as a script, not when imported.
    main()
2 changes: 1 addition & 1 deletion tox.ini
Original file line number Diff line number Diff line change
Expand Up @@ -21,7 +21,7 @@ commands =
pre-commit install -f --install-hooks

[testenv:pre-commit]
-deps = pre-commit>=0.16.3
+deps = pre-commit >= 1.16.1
commands = pre-commit {posargs}

[pep8]
Expand Down