forked from LLNL/RAJAPerf
-
Notifications
You must be signed in to change notification settings - Fork 0
/
CMakeLists.txt
234 lines (188 loc) · 7.67 KB
/
CMakeLists.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
###############################################################################
# Copyright (c) 2017-23, Lawrence Livermore National Security, LLC
# and RAJA Performance Suite project contributors.
# See the RAJAPerf/LICENSE file for details.
#
# SPDX-License-Identifier: (BSD-3-Clause)
###############################################################################
# C is required for googletest to find Threads
project(RAJAPerfSuite LANGUAGES CXX C)
if (ENABLE_HIP)
cmake_minimum_required(VERSION 3.23)
else()
cmake_minimum_required(VERSION 3.20)
endif()
option(ENABLE_RAJA_SEQUENTIAL "Run sequential variants of RAJA kernels. Disable
this, and all other variants, to run _only_ raw C loops." On)
option(ENABLE_KOKKOS "Include Kokkos implementations of the kernels in the RAJA Perfsuite" Off)
#
# Note: the BLT build system is inheritted by RAJA and is initialized by RAJA
#
if (PERFSUITE_ENABLE_WARNINGS)
set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wall -Wextra -Werror")
endif()
if (ENABLE_KOKKOS)
set(CMAKE_CXX_STANDARD 17)
set(BLT_CXX_STD c++17)
else()
set(CMAKE_CXX_STANDARD 14)
set(BLT_CXX_STD c++14)
endif()
include(blt/SetupBLT.cmake)
#
# Define RAJA PERFSUITE settings...
#
cmake_dependent_option(RAJA_PERFSUITE_ENABLE_TESTS "Enable RAJA Perf Suite Tests" On "ENABLE_TESTS" Off)
if (ENABLE_TESTS)
set(RAJA_ENABLE_TESTS Off CACHE BOOL "")
set(CAMP_ENABLE_TESTS Off CACHE BOOL "")
endif()
cmake_dependent_option(RAJA_PERFSUITE_ENABLE_MPI "Build with MPI" On "ENABLE_MPI" Off)
cmake_dependent_option(RAJA_PERFSUITE_ENABLE_OPENMP5_SCAN "Build OpenMP scan variants" Off "ENABLE_OPENMP" Off)
#
# Define RAJA settings...
#
set(RAJA_ENABLE_TESTS Off CACHE BOOL "")
set(RAJA_ENABLE_EXAMPLES Off CACHE BOOL "")
set(RAJA_ENABLE_EXERCISES Off CACHE BOOL "")
set(ENABLE_DOCUMENTATION Off CACHE BOOL "")
set(ENABLE_TBB Off CACHE BOOL "")
set(RAJA_USE_CHRONO On CACHE BOOL "")
set(RAJA_PERFSUITE_GPU_BLOCKSIZES "" CACHE STRING "Comma separated list of GPU block sizes, ex '256,1024'")
set(RAJA_RANGE_ALIGN 4)
set(RAJA_RANGE_MIN_LENGTH 32)
set(RAJA_DATA_ALIGN 64)
string(LENGTH "${RAJA_PERFSUITE_GPU_BLOCKSIZES}" BLOCKSIZES_LENGTH)
if (BLOCKSIZES_LENGTH GREATER 0)
message(STATUS "Using gpu block size(s): ${RAJA_PERFSUITE_GPU_BLOCKSIZES}")
else()
message(STATUS "Using default gpu block size(s)")
endif()
# exclude RAJA make targets from top-level build...
add_subdirectory(tpl/RAJA)
get_property(RAJA_INCLUDE_DIRS DIRECTORY tpl/RAJA PROPERTY INCLUDE_DIRECTORIES)
include_directories(${RAJA_INCLUDE_DIRS})
set(CAMP_ENABLE_TESTS Off CACHE BOOL "")
if (ENABLE_RAJA_SEQUENTIAL)
add_definitions(-DRUN_RAJA_SEQ)
endif ()
if (ENABLE_OPENMP)
add_definitions(-DRUN_OPENMP)
endif ()
set(RAJA_PERFSUITE_VERSION_MAJOR 2023)
set(RAJA_PERFSUITE_VERSION_MINOR 06)
set(RAJA_PERFSUITE_VERSION_PATCHLEVEL 0)
set(RAJA_PERFSUITE_DEPENDS RAJA)
if (RAJA_PERFSUITE_ENABLE_MPI)
list(APPEND RAJA_PERFSUITE_DEPENDS mpi)
endif()
if (ENABLE_OPENMP)
list(APPEND RAJA_PERFSUITE_DEPENDS openmp)
endif()
if (ENABLE_CUDA)
list(APPEND RAJA_PERFSUITE_DEPENDS cuda)
endif()
# Kokkos requires hipcc as the CMAKE_CXX_COMPILER for HIP AMD/VEGA GPU
# platforms, whereas RAJAPerf Suite uses blt/CMake FindHIP to set HIP compiler.
# Separate RAJAPerf Suite and Kokkos handling of HIP compilers
if ((ENABLE_HIP) AND (NOT ENABLE_KOKKOS))
message(STATUS "HIP version: ${hip_VERSION}")
if("${hip_VERSION}" VERSION_LESS "3.5")
message(FATAL_ERROR "Trying to use HIP/ROCm version ${hip_VERSION}. RAJA Perf Suite requires HIP/ROCm version 3.5 or newer. ")
endif()
list(APPEND RAJA_PERFSUITE_DEPENDS blt::hip)
list(APPEND RAJA_PERFSUITE_DEPENDS blt::hip_runtime)
endif()
#
# Are we using Caliper
#
set(RAJA_PERFSUITE_USE_CALIPER off CACHE BOOL "")
if (RAJA_PERFSUITE_USE_CALIPER)
find_package(caliper REQUIRED)
list(APPEND RAJA_PERFSUITE_DEPENDS caliper)
add_definitions(-DRAJA_PERFSUITE_USE_CALIPER)
message(STATUS "Using Caliper")
find_package(adiak REQUIRED)
# use ${adiak_LIBRARIES} since version could have adiak vs adiak::adiak export
list(APPEND RAJA_PERFSUITE_DEPENDS ${adiak_LIBRARIES})
if (ENABLE_CUDA)
# Adiak will propagate -pthread from spectrum mpi from a spack install of Caliper with +mpi; and needs to be handled even if RAJAPerf is non MPI program
# We should delegate to BLT to handle unguarded -pthread from any dependencies, but currently BLT doesn't
set_target_properties(${adiak_LIBRARIES} PROPERTIES INTERFACE_COMPILE_OPTIONS "$<$<NOT:$<COMPILE_LANGUAGE:CUDA>>:-pthread>;$<$<COMPILE_LANGUAGE:CUDA>:-Xcompiler=-pthread>")
# the following for adiak-0.2.2
if (TARGET adiak::mpi)
set_target_properties(adiak::mpi PROPERTIES INTERFACE_COMPILE_OPTIONS "$<$<NOT:$<COMPILE_LANGUAGE:CUDA>>:-pthread>;$<$<COMPILE_LANGUAGE:CUDA>:-Xcompiler=-pthread>")
endif ()
endif ()
message(STATUS "Caliper includes : ${caliper_INCLUDE_DIR}")
message(STATUS "Adiak includes : ${adiak_INCLUDE_DIRS}")
include_directories(${caliper_INCLUDE_DIR})
include_directories(${adiak_INCLUDE_DIRS})
endif ()
set(RAJAPERF_BUILD_SYSTYPE $ENV{SYS_TYPE})
set(RAJAPERF_BUILD_HOST $ENV{HOSTNAME})
if (ENABLE_CUDA)
if (ENABLE_KOKKOS)
set(CMAKE_CUDA_STANDARD 17)
set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} -restrict --extended-lambda --expt-relaxed-constexpr")
else()
set(CMAKE_CUDA_STANDARD 14)
set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} -restrict --expt-extended-lambda --expt-relaxed-constexpr")
endif()
set(RAJAPERF_COMPILER "${CUDA_NVCC_EXECUTABLE}")
list(APPEND RAJAPERF_COMPILER ${CMAKE_CXX_COMPILER})
set(RAJAPERF_COMPILER_OPTIONS "${CUDA_NVCC_FLAGS}")
elseif (ENABLE_HIP)
set(RAJAPERF_COMPILER "${HIP_HIPCC_EXECUTABLE}")
list(APPEND RAJAPERF_COMPILER ${CMAKE_CXX_COMPILER})
set(RAJAPERF_COMPILER_OPTIONS "${HIP_HIPCC_FLAGS}")
else()
set(RAJAPERF_COMPILER "${CMAKE_CXX_COMPILER}")
string(TOUPPER ${CMAKE_BUILD_TYPE} RAJAPERF_BUILD_TYPE)
set(RAJAPERF_COMPILER_OPTIONS "${CMAKE_CXX_FLAGS_${RAJAPERF_BUILD_TYPE}}")
list(APPEND RAJAPERF_COMPILER_OPTIONS ${CMAKE_CXX_FLAGS})
endif()
configure_file(${CMAKE_SOURCE_DIR}/src/rajaperf_config.hpp.in
${CMAKE_CURRENT_BINARY_DIR}/include/rajaperf_config.hpp)
include_directories($<BUILD_INTERFACE:${PROJECT_BINARY_DIR}/include>)
# Make sure RAJA flags propagate (we need to do some tidying to
# remove project-specific CMake variables that are no longer needed)
set (CUDA_NVCC_FLAGS ${RAJA_NVCC_FLAGS})
#
# Each directory in the perf suite has its own CMakeLists.txt file.
# ENABLE_KOKKOS is A RAJAPerf Suite Option
if(ENABLE_KOKKOS)
add_definitions(-DRUN_KOKKOS)
if(ENABLE_HIP)
set(Kokkos_ENABLE_HIP ON CACHE BOOL "Kokkos builds for AMD HIP set the
Kokkos_ENABLE_HIP variable to ON")
endif()
if(ENABLE_TARGET_OPENMP)
set(Kokkos_ENABLE_OPENMPTARGET ON CACHE BOOL "Docstring")
if(NOT CMAKE_BUILD_TYPE MATCHES Debug)
if(NOT EXPERIMENTAL_BUILD)
message(FATAL_ERROR "Kokkos builds with OpenMPTarget require a Debug build to succeed at the moment. Rebuild with CMAKE_BUILD_TYPE=Debug. If you're a compiler developer, rebuild with -DEXPERIMENTAL_BUILD=ON")
endif()
endif()
endif()
# ENABLE_CUDA IS A RAJA PERFSUITE OPTION
if(ENABLE_CUDA)
set(Kokkos_ENABLE_CUDA ON CACHE BOOL "Docstring")
set(Kokkos_ENABLE_CUDA_LAMBDA ON CACHE BOOL "Docstring")
enable_language(CUDA)
endif()
if(ENABLE_OPENMP)
set(Kokkos_ENABLE_OPENMP ON CACHE BOOL "Docstring")
endif()
add_subdirectory(tpl/kokkos)
get_property(KOKKOS_INCLUDE_DIRS DIRECTORY tpl/kokkos PROPERTY INCLUDE_DIRECTORIES)
include_directories(${KOKKOS_INCLUDE_DIRS})
list(APPEND RAJA_PERFSUITE_DEPENDS kokkos)
endif()
add_subdirectory(src)
if (RAJA_PERFSUITE_ENABLE_TESTS)
add_subdirectory(test)
endif()
if (RAJA_PERFSUITE_ENABLE_DOCUMENTATION)
add_subdirectory(docs)
endif ()