Merge 5f20ade into 830271f

Parquery · Dec 10, 2020 · 11de69a · 11de69a
2 parents 830271f + 5f20ade
commit 11de69a
Show file tree

Hide file tree

Showing 21 changed files with 3,472 additions and 55 deletions.
diff --git a/.gitignore b/.gitignore
@@ -10,3 +10,4 @@ dist/
 .coverage
 htmlcov
 README.html
+.hypothesis/
diff --git a/benchmarks/against_others/compare_with_hypothesis.py b/benchmarks/against_others/compare_with_hypothesis.py
@@ -0,0 +1,290 @@
+#!/usr/bin/env python3
+"""Benchmark icontract against deal when used together with hypothesis."""
+
+import math
+import os
+import sys
+import timeit
+from typing import List
+
+import deal
+import dpcontracts
+import hypothesis
+import hypothesis.strategies
+import hypothesis.extra.dpcontracts
+import tabulate
+
+import icontract
+import icontract.integration.with_hypothesis
+
+
+def benchmark_icontract_assume_preconditions(arg_count: int = 1) -> None:
+    """Benchmark the Hypothesis testing with icontract and rejection sampling."""
+    count = 0
+
+    if arg_count == 1:
+        @icontract.require(lambda a: a > 0)
+        def some_func(a: int) -> None:
+            nonlocal count
+            count += 1
+            pass
+
+        assume_preconditions = icontract.integration.with_hypothesis.make_assume_preconditions(some_func)
+
+        @hypothesis.settings(suppress_health_check=(hypothesis.HealthCheck.filter_too_much,))
+        @hypothesis.given(a=hypothesis.strategies.integers())
+        def execute(a: int) -> None:
+            assume_preconditions(a)
+            some_func(a)
+
+    elif arg_count == 2:
+        @icontract.require(lambda a: a > 0)
+        @icontract.require(lambda b: b > 0)
+        def some_func(a: int, b: int) -> None:
+            nonlocal count
+            count += 1
+            pass
+
+        assume_preconditions = icontract.integration.with_hypothesis.make_assume_preconditions(some_func)
+
+        @hypothesis.settings(suppress_health_check=(hypothesis.HealthCheck.filter_too_much,))
+        @hypothesis.given(a=hypothesis.strategies.integers(), b=hypothesis.strategies.integers())
+        def execute(a: int, b: int) -> None:
+            assume_preconditions(a=a, b=b)
+            some_func(a, b)
+
+    elif arg_count == 3:
+        @icontract.require(lambda a: a > 0)
+        @icontract.require(lambda b: b > 0)
+        @icontract.require(lambda c: c > 0)
+        def some_func(a: int, b: int, c: int) -> None:
+            nonlocal count
+            count += 1
+            pass
+
+        assume_preconditions = icontract.integration.with_hypothesis.make_assume_preconditions(some_func)
+
+        @hypothesis.settings(suppress_health_check=(hypothesis.HealthCheck.filter_too_much,))
+        @hypothesis.given(
+            a=hypothesis.strategies.integers(),
+            b=hypothesis.strategies.integers(),
+            c=hypothesis.strategies.integers())
+        def execute(a: int, b: int, c: int) -> None:
+            assume_preconditions(a=a, b=b, c=c)
+            some_func(a, b, c)
+    else:
+        raise NotImplementedError("arg_count {}".format(arg_count))
+
+    execute()
+
+    # Assert the count of function executions for fair tests
+    assert count == 100
+
+
+def benchmark_icontract_inferred_strategies(arg_count: int = 1) -> None:
+    """Benchmark the Hypothesis testing with icontract and inferred search strategies."""
+    count = 0
+
+    if arg_count == 1:
+        @icontract.require(lambda a: a > 0)
+        def some_func(a: int) -> None:
+            nonlocal count
+            count += 1
+            pass
+    elif arg_count == 2:
+        @icontract.require(lambda a: a > 0)
+        @icontract.require(lambda b: b > 0)
+        def some_func(a: int, b: int) -> None:
+            nonlocal count
+            count += 1
+            pass
+    elif arg_count == 3:
+        @icontract.require(lambda a: a > 0)
+        @icontract.require(lambda b: b > 0)
+        @icontract.require(lambda c: c > 0)
+        def some_func(a: int, b: int, c: int) -> None:
+            nonlocal count
+            count += 1
+            pass
+    else:
+        raise NotImplementedError("arg_count {}".format(arg_count))
+
+    icontract.integration.with_hypothesis.test_with_inferred_strategies(some_func)
+
+    # Assert the count of function executions for fair tests
+    assert count == 100
+
+
+def benchmark_dpcontracts(arg_count: int = 1) -> None:
+    """Benchmark the Hypothesis testing with dpcontracts."""
+    count = 0
+
+    if arg_count == 1:
+        @dpcontracts.require("some dummy contract", lambda args: args.a > 0)
+        def some_func(a: int) -> None:
+            nonlocal count
+            count += 1
+            pass
+
+        @hypothesis.settings(suppress_health_check=(hypothesis.HealthCheck.filter_too_much,))
+        @hypothesis.given(a=hypothesis.strategies.integers())
+        def execute(a: int) -> None:
+            hypothesis.extra.dpcontracts.fulfill(some_func)(a)
+
+    elif arg_count == 2:
+        @dpcontracts.require("some dummy contract", lambda args: args.a > 0)
+        @dpcontracts.require("some dummy contract", lambda args: args.b > 0)
+        def some_func(a: int, b: int) -> None:
+            nonlocal count
+            count += 1
+            pass
+
+        @hypothesis.settings(suppress_health_check=(hypothesis.HealthCheck.filter_too_much,))
+        @hypothesis.given(a=hypothesis.strategies.integers(), b=hypothesis.strategies.integers())
+        def execute(a: int, b: int) -> None:
+            hypothesis.extra.dpcontracts.fulfill(some_func)(a, b)
+
+    elif arg_count == 3:
+        @dpcontracts.require("some dummy contract", lambda args: args.a > 0)
+        @dpcontracts.require("some dummy contract", lambda args: args.b > 0)
+        @dpcontracts.require("some dummy contract", lambda args: args.c > 0)
+        def some_func(a: int, b: int, c: int) -> None:
+            nonlocal count
+            count += 1
+            pass
+
+        @hypothesis.settings(suppress_health_check=(hypothesis.HealthCheck.filter_too_much,))
+        @hypothesis.given(
+            a=hypothesis.strategies.integers(),
+            b=hypothesis.strategies.integers(),
+            c=hypothesis.strategies.integers())
+        def execute(a: int, b: int, c: int) -> None:
+            hypothesis.extra.dpcontracts.fulfill(some_func)(a, b, c)
+
+    else:
+        raise NotImplementedError("arg_count {}".format(arg_count))
+
+    execute()
+
+    # Assert the count of function executions for fair tests
+    assert count == 100
+
+
+def benchmark_deal(arg_count: int = 1) -> None:
+    """Benchmark the Hypothesis testing with deal."""
+    count = 0
+
+    if arg_count == 1:
+        @deal.pre(lambda _: _.a > 0)
+        def some_func(a: int) -> None:
+            nonlocal count
+            count += 1
+            pass
+
+        # Deal draws a certain number of samples and rejects samples from this fixed set.
+        # Therefore we need to double the number of samples for deal to get approximately the same number of
+        # tested cases.
+        for case in deal.cases(some_func, count=200):
+            case()
+
+    elif arg_count == 2:
+        @deal.pre(lambda _: _.a > 0)
+        @deal.pre(lambda _: _.b > 0)
+        def some_func(a: int, b: int) -> None:
+            nonlocal count
+            count += 1
+            pass
+
+        # Deal draws a certain number of samples and rejects samples from this fixed set.
+        # Therefore we need to increase the number of samples for deal to get approximately the same number of
+        # tested cases.
+        for case in deal.cases(some_func, count=400):
+            case()
+
+    elif arg_count == 3:
+        @deal.pre(lambda _: _.a > 0)
+        @deal.pre(lambda _: _.b > 0)
+        @deal.pre(lambda _: _.c > 0)
+        def some_func(a: int, b: int, c: int) -> None:
+            nonlocal count
+            count += 1
+            pass
+
+        # Deal draws a certain number of samples and rejects samples from this fixed set.
+        # Therefore we need to increase the number of samples for deal to get approximately the same number of
+        # tested cases.
+        for case in deal.cases(some_func, count=800):
+            case()
+    else:
+        raise NotImplementedError("arg_count {}".format(arg_count))
+
+    # TODO: document this in Readme
+    # (mristin, 2020-12-07)
+    # We can not assert the exact number as it is too unstable and makes the script break.
+    # We inspected the number of executions manually and looked OK.
+    # assert abs(count - 100) < 50, "Expected the function to be called about 100 times, but got: {}".format(count)
+
+
+def writeln_utf8(text: str = "") -> None:
+    """
+    Write the text to STDOUT using UTF-8 encoding followed by a new-line character.
+
+    We can not use ``print()`` as we can not rely on the correct encoding in Windows.
+    See: https://stackoverflow.com/questions/31469707/changing-the-locale-preferred-encoding-in-python-3-in-windows
+    """
+    sys.stdout.buffer.write(text.encode('utf-8'))
+    sys.stdout.buffer.write(os.linesep.encode('utf-8'))
+
+
+def measure_functions() -> None:
+    # yapf: disable
+    funcs = [
+        'benchmark_icontract_inferred_strategies',
+        'benchmark_icontract_assume_preconditions',
+        'benchmark_dpcontracts',
+        'benchmark_deal',
+    ]
+    # yapf: enable
+
+    durations = [0.0] * len(funcs)
+
+    number = 10
+    for arg_count in [1, 2, 3]:
+        for i, func in enumerate(funcs):
+            duration = timeit.timeit(
+                "{}(arg_count={})".format(func, arg_count),
+                setup="from __main__ import {}".format(func),
+                number=number)
+
+            durations[i] = duration
+
+        table = []  # type: List[List[str]]
+
+        for func, duration in zip(funcs, durations):
+            # yapf: disable
+            table.append([
+                '`{}`'.format(func),
+                '{:.2f} s'.format(duration),
+                '{:.2f} ms'.format(duration * 1000 / number),
+                '{:.0f}%'.format(duration * 100 / durations[0])
+            ])
+            # yapf: enable
+
+        # yapf: disable
+        table_str = tabulate.tabulate(
+            table,
+            headers=['Case', 'Total time', 'Time per run', 'Relative time per run'],
+            colalign=('left', 'right', 'right', 'right'),
+            tablefmt='rst')
+        # yapf: enable
+
+        writeln_utf8()
+        writeln_utf8("Argument count: {}".format(arg_count))
+        writeln_utf8(table_str)
+
+
+if __name__ == "__main__":
+    writeln_utf8("Benchmarking Hypothesis testing:")
+    writeln_utf8('')
+    measure_functions()
+# TODO: include the benchmark in the readme