Skip to content

Commit

Permalink
Added support for sm_52 target and flush denormals to zero for small performance boost.
Browse files Browse the repository at this point in the history
  • Loading branch information
maddyscientist committed Oct 14, 2014
1 parent de8253f commit 36b5a00
Showing 1 changed file with 5 additions and 1 deletion.
6 changes: 5 additions & 1 deletion src/Makefile
Expand Up @@ -26,7 +26,7 @@ RPATH =
LIBXGPU = libxgpu.dll
else

-NVCCFLAGS = -Xcompiler -D_REENTRANT -Xcompiler -Wall -Xcompiler -Wno-unused-function
+NVCCFLAGS = -Xcompiler -D_REENTRANT -Xcompiler -Wall -Xcompiler -Wno-unused-function -ftz=true

ifneq ($(strip $(OSTYPE)),osx)
NVCCFLAGS += -Xcompiler -fopenmp
Expand Down Expand Up @@ -55,6 +55,10 @@ ifeq ($(strip $(CUDA_ARCH)),sm_50)
NVCCFLAGS += -maxrregcount=72
endif

+ifeq ($(strip $(CUDA_ARCH)),sm_52)
+NVCCFLAGS += -maxrregcount=72
+endif

#NVCCFLAGS += -Xptxas -dlcm=cg # disable L1 cache

# Possibly (re-)build xgpu_version.h
Expand Down

0 comments on commit 36b5a00

Please sign in to comment.