# run_pandas_benchmark.py
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
import os
import argparse
from subprocess import Popen, DEVNULL, TimeoutExpired
# Driver script: runs every pandas benchmark script against every data file,
# one child process at a time, for a configurable number of iterations.

# Interpreter used to launch each benchmark script (resolved through PATH).
PYTHON = "python"
# Directory holding the single-DataFrame input files.
DATA_DIR = "benchmarks/data"
# Directory holding the right-hand inputs for the join/merge benchmark.
MULTI_DATA_DIR = "benchmarks/data/multi"
# Wall-clock limit for a single benchmark process, in seconds (20 minutes).
TIMEOUT_SECONDS = 60 * 20

# (script, logfile) pairs for benchmarks that take one ``--path`` argument,
# listed in the order they are run within an iteration.
SINGLE_FILE_BENCHMARKS = (
    ("benchmarks/pandas/arithmetic_benchmark.py",
     "benchmark-results/pandas-arithmetic.log"),
    ("benchmarks/pandas/groupby_benchmark.py",
     "benchmark-results/pandas-groupby.log"),
    ("benchmarks/pandas/io_benchmark.py",
     "benchmark-results/pandas-io.log"),
    ("benchmarks/pandas/df_op_benchmark.py",
     "benchmark-results/pandas-df-op.log"),
)
JOIN_MERGE_SCRIPT = "benchmarks/pandas/join_merge_benchmark.py"
JOIN_MERGE_LOGFILE = "benchmark-results/pandas-join-merge.log"


def parse_args(argv=None):
    """Parse the command line and return the argparse namespace.

    Args:
        argv: Argument list to parse; ``None`` means ``sys.argv[1:]``.

    Returns:
        Namespace whose ``n`` attribute is the number of iterations to run.
    """
    parser = argparse.ArgumentParser(description='run benchmarks')
    # const=1 makes a bare ``--N`` behave like the default; without it
    # argparse stores None and the iteration loop fails in range(None).
    parser.add_argument('--N', dest='n', default=1, const=1, nargs='?',
                        type=int,
                        help='number of test iterations to run')
    return parser.parse_args(argv)


def list_data_files(directory):
    """Return the sorted names of the regular files directly in *directory*.

    Subdirectories are skipped: ``benchmarks/data`` contains the ``multi``
    directory, which must not be handed to a benchmark as a data file.
    Sorting makes the run order reproducible, since ``os.listdir`` returns
    entries in arbitrary order.

    Raises:
        OSError: If *directory* does not exist or cannot be read.
    """
    return sorted(
        name for name in os.listdir(directory)
        if os.path.isfile(os.path.join(directory, name))
    )


def build_commands(files, multi_files):
    """Build the argv lists for one full benchmark iteration.

    Args:
        files: File names located in ``DATA_DIR``.
        multi_files: File names located in ``MULTI_DATA_DIR``.

    Returns:
        A list of argv lists: each single-file benchmark over every entry of
        *files*, followed by the join/merge benchmark over every
        (left, right) pair from *files* x *multi_files*.
    """
    commands = []
    for script, logfile in SINGLE_FILE_BENCHMARKS:
        for name in files:
            commands.append([PYTHON, script,
                             "--path", "{}/{}".format(DATA_DIR, name),
                             "--logfile", logfile])
    for left in files:
        for right in multi_files:
            commands.append([PYTHON, JOIN_MERGE_SCRIPT,
                             "--left", "{}/{}".format(DATA_DIR, left),
                             # Right-hand files were listed from the multi
                             # directory, so the path must point there.
                             "--right",
                             "{}/{}".format(MULTI_DATA_DIR, right),
                             "--logfile", JOIN_MERGE_LOGFILE])
    return commands


def run_benchmark(command, timeout=TIMEOUT_SECONDS):
    """Run one benchmark command, killing it if it exceeds *timeout*.

    The child's stdout and stderr are discarded.

    Args:
        command: argv list passed to ``Popen``.
        timeout: Seconds to wait before the child is killed.

    Returns:
        The child's return code.
    """
    proc = Popen(command, stdout=DEVNULL, stderr=DEVNULL)
    try:
        proc.wait(timeout)
    except TimeoutExpired:
        proc.kill()
        # Reap the killed child so it does not linger as a zombie.
        proc.wait()
    return proc.returncode


def main(argv=None):
    """Run every benchmark over every data file for the requested iterations."""
    args = parse_args(argv)
    # Both listings are loop-invariant, so they are taken once up front; this
    # also reports a missing data directory before any benchmark starts.
    files = list_data_files(DATA_DIR)
    multi_df_files = list_data_files(MULTI_DATA_DIR)
    commands = build_commands(files, multi_df_files)
    for _ in range(args.n):
        for command in commands:
            run_benchmark(command)


if __name__ == "__main__":
    main()