-
Notifications
You must be signed in to change notification settings - Fork 43
Home
Waylon Flinn edited this page Jan 8, 2016 · 14 revisions
- Ubuntu 14.04.3
- Intel® Core™ i7 CPU 860 @ 2.80GHz × 8
- GeForce GTX 970/PCIe/SSE2
Version 0.6.0
TAP version 13
ok 1 128x128 . 128x128
# 316 ops/sec ±4.80% n = 51 µ = 3ms
ok 2 128x256 . 256x128
# 280 ops/sec ±6.15% n = 40 µ = 4ms
ok 3 256x256 . 256x256
# 171 ops/sec ±14.79% n = 47 µ = 6ms
ok 4 512x256 . 256x512
# 101 ops/sec ±6.68% n = 50 µ = 10ms
ok 5 256x512 . 512x256
# 139 ops/sec ±3.64% n = 49 µ = 7ms
ok 6 512x512 . 512x512
# 61.61 ops/sec ±3.14% n = 42 µ = 16ms
ok 7 513x513 . 513x513
# 52.92 ops/sec ±8.82% n = 49 µ = 19ms
ok 8 1024x512 . 512x1024
# 34.99 ops/sec ±4.86% n = 38 µ = 29ms
ok 9 512x1024 . 1024x512
# 52.03 ops/sec ±2.66% n = 47 µ = 19ms
ok 10 1024x1024 . 1024x1024
# 23.27 ops/sec ±12.70% n = 34 µ = 43ms
ok 11 2048x2048 . 2048x2048
# 4.89 ops/sec ±1.82% n = 17 µ = 204ms
1..11
# tests 11
# pass 11
# ok
- Python 2.7.6 (`python --version`)
- NumPy 1.8.2 (`python -c "import numpy; print(numpy.__version__)"`)
- OpenBLAS 0.2.8-6ubuntu1 (`apt-cache show libopenblas-dev`)

`export OMP_NUM_THREADS=8`
TAP version 13
ok 1 128x128 . 128.128
# 5534.11 ops/sec n = 50 µ = 0.18ms
ok 2 128x256 . 256.128
# 2634.22 ops/sec n = 50 µ = 0.38ms
ok 3 256x256 . 256.256
# 886.88 ops/sec n = 50 µ = 1.13ms
ok 4 512x256 . 256.512
# 212.78 ops/sec n = 50 µ = 4.70ms
ok 5 256x512 . 512.256
# 449.14 ops/sec n = 50 µ = 2.23ms
ok 6 512x512 . 512.512
# 115.72 ops/sec n = 50 µ = 8.64ms
ok 7 1024x512 . 512.1024
# 28.10 ops/sec n = 50 µ = 35.58ms
ok 8 1024x512 . 512.1024
# 28.16 ops/sec n = 50 µ = 35.51ms
ok 9 1024x1024 . 1024.1024
# 14.61 ops/sec n = 50 µ = 68.44ms
ok 10 2048x2048 . 2048.2048
# 1.80 ops/sec n = 50 µ = 555.40ms
1..9
# tests 9
# pass 9
# ok
Same configuration as the first benchmark above, but with a mid-range graphics card in place of the GTX 970.
- GeForce GTX 465/PCIe/SSE2
TAP version 13
ok 1 128x128 . 128x128
# 294 ops/sec ±3.97% n = 52 µ = 3ms
ok 2 128x256 . 256x128
# 229 ops/sec ±7.38% n = 33 µ = 4ms
ok 3 256x256 . 256x256
# 131 ops/sec ±4.28% n = 44 µ = 8ms
ok 4 512x256 . 256x512
# 54.99 ops/sec ±12.39% n = 42 µ = 18ms
ok 5 256x512 . 512x256
# 94.22 ops/sec ±8.23% n = 46 µ = 11ms
ok 6 512x512 . 512x512
# 42.01 ops/sec ±2.98% n = 40 µ = 24ms
ok 7 513x513 . 513x513
# 34.54 ops/sec ±8.46% n = 39 µ = 29ms
ok 8 1024x512 . 512x1024
# 18.32 ops/sec ±6.98% n = 35 µ = 55ms
ok 9 512x1024 . 1024x512
# 33.26 ops/sec ±5.28% n = 39 µ = 30ms
ok 10 1024x1024 . 1024x1024
# 11.76 ops/sec ±2.89% n = 24 µ = 85ms
ok 11 2048x2048 . 2048x2048
# 2.15 ops/sec ±1.48% n = 10 µ = 465ms
1..11
# tests 11
# pass 11
# ok