-
Notifications
You must be signed in to change notification settings - Fork 2
/
CMakeLists.txt
115 lines (85 loc) · 4.56 KB
/
CMakeLists.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
cmake_minimum_required(VERSION 3.5)
project(amsfilter-samples)
set(CMAKE_MODULE_PATH ${CMAKE_MODULE_PATH} "${CMAKE_SOURCE_DIR}/cmake/Modules/" "${CMAKE_CURRENT_SOURCE_DIR}/cmake/Modules")
#set(CMAKE_VERBOSE_MAKEFILE ON)
set(CMAKE_CXX_STANDARD 14)
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -std=c++14 -fext-numeric-literals -Wall -Wno-deprecated -Wno-endif-labels -Wno-unused-function")
# Database Template Library (DTL)
include_directories(thirdparty/dtl/src)
include_directories(thirdparty/dtl/thirdparty)
# The target architecture.
set(TARGET_ARCH "native")
# Include the AMS-Filter.
set(AMSFILTER_NO_MAGIC 0) # Disables MAGIC addressing.
set(AMSFILTER_PARTIAL_BUILD 0) # Compiles only a small number of filters.
add_subdirectory(thirdparty/dtl/amsfilter amsfilter)
include_directories(thirdparty/dtl/amsfilter/src)
include_directories(thirdparty/dtl/amsfilter/thirdparty)
set_target_properties(amsfilter PROPERTIES COMPILE_FLAGS "-march=${TARGET_ARCH}")
set(LIBS
pthread
numa
)
#===------------------------------------------------------------------------===#
# CUDA
#===------------------------------------------------------------------------===#
find_package(CUDA 9)
if (CUDA_FOUND)
message("CUDA found")
# avoid implicitly synchronization with other streams
set(CUDA_NVCC_FLAGS --default-stream per-thread)
set(CUDA_NVCC_FLAGS ${CUDA_NVCC_FLAGS} --restrict --std=c++14 -Xcompiler -D__CORRECT_ISO_CPP11_MATH_H_PROTO -D_MWAITXINTRIN_H_INCLUDED)
set(CUDA_NVCC_FLAGS ${CUDA_NVCC_FLAGS} --source-in-ptx)
set(CUDA_NVCC_FLAGS ${CUDA_NVCC_FLAGS} -Xptxas -dlcm=ca)
# enable NVCC warnings
set(CUDA_NVCC_FLAGS ${CUDA_NVCC_FLAGS} -Xcompiler -Wall)
# the target architecture(s) - (see https://en.wikipedia.org/wiki/CUDA#GPUs_supported)
# set(CUDA_NVCC_FLAGS ${CUDA_NVCC_FLAGS} --generate-code arch=compute_52,code=sm_52) # e.g. GTX 970
# set(CUDA_NVCC_FLAGS ${CUDA_NVCC_FLAGS} --generate-code arch=compute_60,code=sm_60) # e.g. Tesla P100
set(CUDA_NVCC_FLAGS ${CUDA_NVCC_FLAGS} --generate-code arch=compute_61,code=sm_61) # e.g. GTX 1080Ti
# don't show deprecation warnings (which are a lot with CUDA 9)
set(CUDA_NVCC_FLAGS ${CUDA_NVCC_FLAGS} -Wno-deprecated-declarations)
set(CUDA_NVCC_FLAGS_DEBUG -g --generate-line-info --keep -DDEBUG)
set(CUDA_NVCC_FLAGS_RELEASE -O3 --use_fast_math -DNDEBUG)
set(CUDA_PROPAGATE_HOST_FLAGS OFF)
set(CUDA_SEPARABLE_COMPILATION OFF)
include_directories(/usr/local/cuda/include)
set(LIBS ${LIBS} cudart)
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -DHAVE_CUDA")
else()
message("CUDA found")
endif()
cuda_add_executable(amsfilter_lite_sample src/amsfilter_lite_sample.cpp)
set_target_properties(amsfilter_lite_sample
PROPERTIES CUDA_SEPARABLE_COMPILATION ON)
set_target_properties(amsfilter_lite_sample PROPERTIES COMPILE_FLAGS "-march=${TARGET_ARCH}")
target_link_libraries(amsfilter_lite_sample ${LIBS} amsfilter)
cuda_add_executable(amsfilter_parameterization src/amsfilter_parameterization.cpp)
set_target_properties(amsfilter_parameterization
PROPERTIES CUDA_SEPARABLE_COMPILATION ON)
set_target_properties(amsfilter_parameterization PROPERTIES COMPILE_FLAGS "-march=${TARGET_ARCH}")
target_link_libraries(amsfilter_parameterization ${LIBS} amsfilter)
cuda_add_executable(benchmark_device src/benchmark_device.cpp)
set_target_properties(benchmark_device
PROPERTIES CUDA_SEPARABLE_COMPILATION ON)
set_target_properties(benchmark_device PROPERTIES COMPILE_FLAGS "-march=${TARGET_ARCH}")
target_link_libraries(benchmark_device ${LIBS} amsfilter)
cuda_add_executable(benchmark_device_raw src/benchmark_device_raw.cu)
set_target_properties(benchmark_device_raw
PROPERTIES CUDA_SEPARABLE_COMPILATION ON)
set_target_properties(benchmark_device_raw PROPERTIES COMPILE_FLAGS "-march=${TARGET_ARCH}")
target_link_libraries(benchmark_device_raw ${LIBS} amsfilter)
cuda_add_executable(benchmark_host src/benchmark_host.cpp)
set_target_properties(benchmark_host
PROPERTIES CUDA_SEPARABLE_COMPILATION ON)
set_target_properties(benchmark_host PROPERTIES COMPILE_FLAGS "-march=${TARGET_ARCH}")
target_link_libraries(benchmark_host ${LIBS} amsfilter)
cuda_add_executable(benchmark_coproc src/benchmark_coproc.cpp)
set_target_properties(benchmark_coproc
PROPERTIES CUDA_SEPARABLE_COMPILATION ON)
set_target_properties(benchmark_coproc PROPERTIES COMPILE_FLAGS "-march=${TARGET_ARCH}")
target_link_libraries(benchmark_coproc ${LIBS} amsfilter)
# Include local CMake file.
if(EXISTS "${CMAKE_CURRENT_SOURCE_DIR}/CMakeListsLocal.cmake")
include(CMakeListsLocal.cmake)
endif()