forked from reger-men/HPL_GPU
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathCMakeLists.txt
234 lines (213 loc) · 8.77 KB
/
CMakeLists.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
cmake_minimum_required( VERSION 3.0 FATAL_ERROR )
project( hplhip VERSION 0.1.0 LANGUAGES CXX )
# current Git branch
EXECUTE_PROCESS(
COMMAND git rev-parse --abbrev-ref HEAD
WORKING_DIRECTORY ${CMAKE_SOURCE_DIR}
OUTPUT_VARIABLE HPLHIP_GIT_BRANCH
OUTPUT_STRIP_TRAILING_WHITESPACE
)
# Git hash
EXECUTE_PROCESS(
COMMAND git log -1 --format=%h
WORKING_DIRECTORY ${CMAKE_SOURCE_DIR}
OUTPUT_VARIABLE HPLHIP_GIT_HASH
OUTPUT_STRIP_TRAILING_WHITESPACE
)
find_package(OpenMP)
# Add rocM root dir to CMAKE_PREFIX_PATH, usually /opt/rocm
if(NOT DEFINED ROCM_PATH)
if(DEFINED ENV{ROCM_PATH})
set(ROCM_PATH $ENV{ROCM_PATH})
else()
set(ROCM_PATH "/opt/rocm")
endif()
endif()
list(APPEND CMAKE_PREFIX_PATH ${ROCM_PATH})
set(CMAKE_MODULE_PATH "${ROCM_PATH}/hip/cmake" ${CMAKE_MODULE_PATH})
set(CMAKE_MODULE_PATH "${ROCM_PATH}/share/rocm/cmake" ${CMAKE_MODULE_PATH})
include(ROCMCheckTargetIds)
find_package( HIP REQUIRED )
find_package( rocblas REQUIRED )
# switch compiler and linker on non-Windows
# if(NOT WIN32)
# set(CMAKE_CXX_COMPILER ${HIP_HIPCC_EXECUTABLE})
# set(CMAKE_CXX_LINKER ${HIP_HIPCC_EXECUTABLE})
# endif()
option(ROCM "based on ROCm framework" ON)
option(PDFACT_OMP "pdfact with openmp" ON)
set( CMAKE_CXX_STANDARD 14 )
set(CMAKE_CXX_FLAGS_DEBUG "${CMAKE_CXX_FLAGS_DEBUG} -O0")
set(CMAKE_CXX_FLAGS_RELEASE "${CMAKE_CXX_FLAGS_RELEASE} -O3")
list(APPEND HIP_HIPCC_FLAGS "-O3 --std=c++14")
list(APPEND CMAKE_HOST_FLAGS "-O3;-march=native;--std=c++14;")
ADD_DEFINITIONS(-DHPL_COPY_L=1)
ADD_DEFINITIONS(-DHPL_NO_MPI_DATATYPE=1)
ADD_DEFINITIONS(-DHPL_PROGRESS_REPORT=1)
file(COPY ${CMAKE_CURRENT_SOURCE_DIR}/HPL.dat
DESTINATION ${CMAKE_CURRENT_BINARY_DIR})
file(COPY ${CMAKE_CURRENT_SOURCE_DIR}/scripts/mpirun_xhplhip.sh
DESTINATION ${CMAKE_CURRENT_BINARY_DIR})
file(COPY ${CMAKE_CURRENT_SOURCE_DIR}/scripts/run_xhplhip.sh
DESTINATION ${CMAKE_CURRENT_BINARY_DIR})
file(COPY ${CMAKE_CURRENT_SOURCE_DIR}/scripts/hostfile
DESTINATION ${CMAKE_CURRENT_BINARY_DIR})
# don't need MPI C++ bindings, now deprecated
if(NOT DEFINED MPI_DIR)
if(DEFINED ENV{MPI_DIR})
set(MPI_DIR $ENV{MPI_DIR})
list(APPEND CMAKE_PREFIX_PATH ${MPI_DIR})
include_directories(${MPI_DIR}/include)
endif()
else()
list(APPEND CMAKE_PREFIX_PATH ${MPI_DIR})
include_directories(${MPI_DIR}/include)
endif()
set( MPI_CXX_SKIP_MPICXX ON )
find_package( MPI REQUIRED )
# search for rocRAND/hipRAND-config.cmake in CMAKE_PREFIX_PATH
find_package(rocrand)
if (rocrand_FOUND)
message(STATUS "Found rocRAND version ${rocrand_VERSION}")
set(HPLHIP_DEVRAND_INCLUDE_DIRS "${rocrand_INCLUDE_DIRS}")
set(HPLHIP_USE_ROCRAND 1)
else ()
find_package(hiprand)
if (hiprand_FOUND)
message(STATUS "Found hipRAND version ${hiprand_VERSION}")
set(HPLHIP_DEVRAND_INCLUDE_DIRS "${hiprand_INCLUDE_DIRS}")
set(HPLHIP_USE_HIPRAND 1)
else ()
message(FATAL_ERROR "Didn't find any device random generators")
endif ()
endif ()
if(NOT DEFINED BLAS_DIR)
if(DEFINED ENV{BLAS_DIR})
set(BLAS_DIR $ENV{BLAS_DIR})
list(APPEND CMAKE_PREFIX_PATH ${BLAS_DIR})
endif()
else()
list(APPEND CMAKE_PREFIX_PATH ${BLAS_DIR})
endif()
find_library(BLAS_LIBRARIES NAMES blis openblas
PATHS ${BLAS_DIR}
HINTS ${BLAS_DIR}/lib/zen3 ${BLAS_DIR}/lib
NO_DEFAULT_PATH)
if (BLAS_LIBRARIES)
message(STATUS "Found BLAS: ${BLAS_LIBRARIES}")
else()
message(STATUS "BLAS NOT Found: ${BLAS_LIBRARIES}")
find_package(BLAS REQUIRED)
endif()
# find_package( BLAS REQUIRED )
# append math library, if found
find_library(MATH_LIBRARY m)
if( MATH_LIBRARY )
# OpenBLAS needs to link C math library (usually -lm) but MKL doesn't
set(BLAS_LIBRARIES ${BLAS_LIBRARIES} ${MATH_LIBRARY})
endif( MATH_LIBRARY )
file(GLOB_RECURSE hpl_device_source RELATIVE ${CMAKE_CURRENT_SOURCE_DIR} "testing/backend/HPL_backendHIP.cpp")
# Flag source files as hip source files
foreach(i ${hpl_device_source})
set_source_files_properties(${i} PROPERTIES HIP_SOURCE_PROPERTY_FORMAT TRUE)
endforeach()
if(ROCM)
if(PDFACT_OMP)
ADD_DEFINITIONS(-DPDFACT_OMP=1)
endif(PDFACT_OMP)
ADD_DEFINITIONS(-DROCM=1)
set(hpl_host_source ${hpl_host_source} src/pgesv/HPL_pdgesvK2_HIP.cpp)
else()
set(hpl_host_source ${hpl_host_source} src/pgesv/HPL_pdgesvK2.cpp src/pgesv/HPL_pdgesv0.cpp)
endif(ROCM)
set(hpl_host_source ${hpl_host_source}
testing/ptest/HPL_pddriver.cpp
testing/ptest/HPL_pdinfo.cpp testing/ptest/HPL_pdtest.cpp
testing/pmatgen/HPL_pdmatgen.cpp testing/matgen/HPL_jumpit.cpp
testing/matgen/HPL_rand.cpp testing/matgen/HPL_setran.cpp
testing/matgen/HPL_xjumpm.cpp testing/matgen/HPL_lmul.cpp
testing/matgen/HPL_ladd.cpp
src/auxil/HPL_dlamch.cpp src/auxil/HPL_fprintf.cpp src/grid/HPL_grid_exit.cpp
src/grid/HPL_all_reduce.cpp src/grid/HPL_broadcast.cpp
src/grid/HPL_grid_info.cpp src/grid/HPL_grid_init.cpp src/grid/HPL_max.cpp
src/grid/HPL_min.cpp src/grid/HPL_sum.cpp src/grid/HPL_barrier.cpp
src/pauxil/HPL_pdlamch.cpp src/pauxil/HPL_numroc.cpp src/pauxil/HPL_numrocI.cpp
src/pauxil/HPL_pdlange.cpp src/pauxil/HPL_indxg2p.cpp src/pauxil/HPL_infog2l.cpp
src/pfact/HPL_pdpancrN.cpp src/pfact/HPL_pdpancrT.cpp
src/pfact/HPL_pdpanllN.cpp src/pfact/HPL_pdpanllT.cpp
src/pfact/HPL_pdpanrlN.cpp src/pfact/HPL_pdpanrlT.cpp
src/pfact/HPL_pdrpancrN.cpp src/pfact/HPL_pdrpancrT.cpp
src/pfact/HPL_pdrpanllN.cpp src/pfact/HPL_pdrpanllT.cpp
src/pfact/HPL_pdrpanrlN.cpp src/pfact/HPL_pdrpanrlT.cpp
src/pgesv/HPL_pdupdateNT.cpp
src/pgesv/HPL_pdupdateNN.cpp src/pgesv/HPL_pdupdateTN.cpp src/pgesv/HPL_pdupdateTT.cpp
src/pgesv/HPL_pdupdateTN.cpp src/pgesv/HPL_pdupdateTT.cpp
src/pauxil/HPL_pwarn.cpp src/comm/HPL_bcast.cpp src/comm/HPL_blong.cpp
src/comm/HPL_blonM.cpp src/comm/HPL_bidir.cpp src/comm/HPL_1ring.cpp src/comm/HPL_2ring.cpp
src/comm/HPL_1rinM.cpp src/comm/HPL_2rinM.cpp src/comm/HPL_packL.cpp
src/comm/HPL_sdrv.cpp src/comm/HPL_send.cpp src/pgesv/HPL_pdlaswp00N.cpp
src/comm/HPL_recv.cpp src/grid/HPL_reduce.cpp src/comm/HPL_binit.cpp
src/comm/HPL_bwait.cpp src/comm/HPL_copyL.cpp
src/pgesv/HPL_pdlaswp00T.cpp src/pgesv/HPL_pdlaswp01N.cpp
src/pgesv/HPL_pdlaswp01T.cpp
src/pgesv/HPL_pdupdateNT.cpp
src/pfact/HPL_pdrpanllN.cpp src/pfact/HPL_pdrpanllT.cpp
src/pfact/HPL_pdrpanrlN.cpp src/pfact/HPL_pdrpanrlT.cpp
src/pauxil/HPL_dlaswp00N.cpp
src/pauxil/HPL_dlaswp01N.cpp
src/pauxil/HPL_dlaswp01T.cpp
src/pauxil/HPL_dlaswp02N.cpp
src/pauxil/HPL_dlaswp03N.cpp
src/pauxil/HPL_dlaswp03T.cpp
src/pauxil/HPL_dlaswp04N.cpp
src/pauxil/HPL_dlaswp04T.cpp
src/pauxil/HPL_dlaswp05N.cpp src/pauxil/HPL_dlaswp05T.cpp
src/pauxil/HPL_dlaswp06N.cpp
src/pauxil/HPL_dlaswp06T.cpp
src/pauxil/HPL_dlaswp10N.cpp
src/pfact/HPL_dlocmax.cpp
src/pfact/HPL_dlocswpN.cpp src/pfact/HPL_dlocswpT.cpp src/pgesv/HPL_equil.cpp
src/pfact/HPL_pdfact.cpp src/pauxil/HPL_pabort.cpp src/pfact/HPL_pdmxswp.cpp
src/pgesv/HPL_pipid.cpp src/pgesv/HPL_plindx0.cpp
src/pgesv/HPL_plindx1.cpp src/pgesv/HPL_plindx10.cpp
src/pgesv/HPL_rollN.cpp src/pgesv/HPL_rollT.cpp
src/pgesv/HPL_spreadN.cpp src/pgesv/HPL_spreadT.cpp
src/pgesv/HPL_logsort.cpp src/pgesv/HPL_perm.cpp
src/pgesv/HPL_pdgesv.cpp
src/pgesv/HPL_pdtrsv.cpp
src/blas/HPL_idamax.cpp
src/blas/HPL_daxpy.cpp src/blas/HPL_dscal.cpp src/blas/HPL_dswap.cpp
src/blas/HPL_dger.cpp src/blas/HPL_dtrsm.cpp src/blas/HPL_dtrsv.cpp
src/blas/HPL_dgemm.cpp src/blas/HPL_dgemv.cpp src/blas/HPL_dcopy.cpp
src/auxil/HPL_dlacpy.cpp src/auxil/HPL_dlatcpy.cpp
testing/ptimer/HPL_ptimer_walltime.cpp testing/ptimer/HPL_ptimer.cpp
testing/ptimer/HPL_ptimer_cputime.cpp
testing/timer/HPL_timer_walltime.cpp testing/timer/HPL_timer.cpp
testing/timer/HPL_timer_cputime.cpp
src/panel/HPL_pdpanel_new.cpp src/panel/HPL_pdpanel_init.cpp
src/panel/HPL_pdpanel_free.cpp src/panel/HPL_pdpanel_disp.cpp
testing/backend/HPL_backendWrapper.cpp
testing/backend/HPL_backendCPU.cpp
testing/backend/HPL_backendCommon.cpp
)
if(COMMAND rocm_check_target_ids)
set(DEFAULT_AMDGPU_TARGETS "gfx900:xnack-;gfx906:xnack-;gfx908:xnack-;gfx908:xnack+;gfx90a:xnack-;gfx90a:xnack+")
else()
set(DEFAULT_AMDGPU_TARGETS "gfx900;gfx906;gfx908;gfx908")
endif()
set(TARGETS "${DEFAULT_AMDGPU_TARGETS}" CACHE STRING "List of specific machine types for library to target")
# AMD targets
foreach(target ${TARGETS})
list(APPEND HIP_HIPCC_FLAGS "--amdgpu-target=${target}")
endforeach()
hip_add_executable( xhplhip ${hpl_device_source} ${hpl_host_source})
target_compile_options(xhplhip PRIVATE ${CMAKE_HOST_FLAGS})
target_include_directories( xhplhip PUBLIC hip:device
# ${HIP_ROOT_DIR}/include
${HPLHIP_DEVRAND_INCLUDE_DIRS}
$<BUILD_INTERFACE:${CMAKE_CURRENT_SOURCE_DIR}/include>
$<INSTALL_INTERFACE:include>
)
target_link_libraries( xhplhip roc::rocblas roc::rocrand ${BLAS_LIBRARIES} ${MPI_CXX_LIBRARIES} OpenMP::OpenMP_CXX)
configure_file( include/hplhip_config.hin ${CMAKE_CURRENT_SOURCE_DIR}/include/hplhip_config.h @ONLY NEWLINE_STYLE LF )
install(TARGETS xhplhip RUNTIME DESTINATION bin)