- cmake >= 3.8
- g++ >= 9.2
- nvcc >= 11.0
export GAS_HOME=$PWD
mkdir build
cd build
cmake ..
make # -j6
- benchmarks
cd examples/benchmark
# cpi can be replaced with L0-i-cache or L1-i-cache
cd cpi
make
./benchmark
- hgemm (requires Turing devices)
cd examples/hgemm
make
./run.sh
- sgemm
cd examples/sgemm
make
./run.sh
If cmake cannot find ANTLR, copy bin/antlr-4.7.2-complete.jar to /usr/local/lib/antlr-4.7.2-complete.jar