|
# add_offload_test_device_code(<test_filename> <test_name>)
#
# Registers custom build rules that compile the device source
# ${CMAKE_CURRENT_SOURCE_DIR}/<test_filename> into one binary per enabled GPU
# target, written to ${CMAKE_CURRENT_BINARY_DIR}:
#   <test_name>.nvptx64.bin  when OFFLOAD_TEST_TARGET_NVIDIA is true
#   <test_name>.amdgpu.bin   when OFFLOAD_TEST_TARGET_AMDGPU is true
# Every output path is appended to BIN_PATHS.
#
# This is a macro, so BIN_PATHS is updated directly in the caller's scope;
# SRC_PATH, BIN_PATH and OFFLOAD_TEST_CUDA_PATH_FLAG are left set there too.
#
# Reads: OFFLOAD_TEST_TARGET_NVIDIA, OFFLOAD_TEST_TARGET_AMDGPU,
#        LIBOMPTARGET_DEP_CUDA_ARCH, LIBOMPTARGET_DEP_AMDGPU_ARCH, CUDA_ROOT.
#
# Example:
#   add_offload_test_device_code(foo.c foo)
macro(add_offload_test_device_code test_filename test_name)
  message(STATUS "Building Offload API device code for test '${test_name}'")
  set(SRC_PATH "${CMAKE_CURRENT_SOURCE_DIR}/${test_filename}")

  # Build for NVPTX
  if(OFFLOAD_TEST_TARGET_NVIDIA)
    # Only pass --cuda-path when a CUDA installation root is known; an empty
    # "--cuda-path=" is not a usable path. Unquoted below, the empty value
    # expands to no argument at all.
    set(OFFLOAD_TEST_CUDA_PATH_FLAG "")
    if(CUDA_ROOT)
      set(OFFLOAD_TEST_CUDA_PATH_FLAG "--cuda-path=${CUDA_ROOT}")
    endif()

    set(BIN_PATH "${CMAKE_CURRENT_BINARY_DIR}/${test_name}.nvptx64.bin")
    add_custom_command(
      OUTPUT "${BIN_PATH}"
      COMMAND
        "${CMAKE_C_COMPILER}" --target=nvptx64-nvidia-cuda
        "-march=${LIBOMPTARGET_DEP_CUDA_ARCH}"
        ${OFFLOAD_TEST_CUDA_PATH_FLAG}
        "${SRC_PATH}" -o "${BIN_PATH}"
      DEPENDS "${SRC_PATH}"
      VERBATIM
    )
    list(APPEND BIN_PATHS "${BIN_PATH}")
  endif()

  # Build for AMDGPU
  if(OFFLOAD_TEST_TARGET_AMDGPU)
    set(BIN_PATH "${CMAKE_CURRENT_BINARY_DIR}/${test_name}.amdgpu.bin")
    add_custom_command(
      OUTPUT "${BIN_PATH}"
      COMMAND
        "${CMAKE_C_COMPILER}" --target=amdgcn-amd-amdhsa -nogpulib
        "-mcpu=${LIBOMPTARGET_DEP_AMDGPU_ARCH}"
        "${SRC_PATH}" -o "${BIN_PATH}"
      DEPENDS "${SRC_PATH}"
      VERBATIM
    )
    list(APPEND BIN_PATHS "${BIN_PATH}")
  endif()

  # TODO: Build for host CPU
endmacro()
|
29 | 34 |
|
30 | 35 |
|
# Decide what device targets to build for. LibomptargetGetDependencies is
# included at the top-level so the GPUs present on the system are already
# detected.
#
# A non-empty OFFLOAD_TESTS_FORCE_<VENDOR>_ARCH enables that target with the
# given architecture regardless of detection; otherwise the target is enabled
# only when a matching GPU was found and the plugin is being built.
set(OFFLOAD_TESTS_FORCE_NVIDIA_ARCH "" CACHE STRING
  "Force building of NVPTX device code for Offload unit tests with the given arch, e.g. sm_61")
set(OFFLOAD_TESTS_FORCE_AMDGPU_ARCH "" CACHE STRING
  "Force building of AMDGPU device code for Offload unit tests with the given arch, e.g. gfx1030")

# CUDA_ROOT is the parent directory of the toolkit's bin directory.
find_package(CUDAToolkit QUIET)
if(CUDAToolkit_FOUND)
  get_filename_component(CUDA_ROOT "${CUDAToolkit_BIN_DIR}" DIRECTORY)
endif()

if(OFFLOAD_TESTS_FORCE_NVIDIA_ARCH)
  set(LIBOMPTARGET_DEP_CUDA_ARCH "${OFFLOAD_TESTS_FORCE_NVIDIA_ARCH}")
  set(OFFLOAD_TEST_TARGET_NVIDIA ON)
  if(NOT CUDA_ROOT)
    message(WARNING
      "OFFLOAD_TESTS_FORCE_NVIDIA_ARCH is set but no CUDA toolkit was located; "
      "NVPTX device code for the Offload unit tests may fail to build.")
  endif()
elseif(LIBOMPTARGET_FOUND_NVIDIA_GPU AND CUDA_ROOT
       AND "cuda" IN_LIST LIBOMPTARGET_PLUGINS_TO_BUILD)
  # NOTE(review): LIBOMPTARGET_DEP_CUDA_ARCH is not assigned on this path; it
  # is presumably provided by the top-level GPU detection - confirm.
  set(OFFLOAD_TEST_TARGET_NVIDIA ON)
endif()

if(OFFLOAD_TESTS_FORCE_AMDGPU_ARCH)
  set(LIBOMPTARGET_DEP_AMDGPU_ARCH "${OFFLOAD_TESTS_FORCE_AMDGPU_ARCH}")
  set(OFFLOAD_TEST_TARGET_AMDGPU ON)
elseif(LIBOMPTARGET_FOUND_AMDGPU_GPU
       AND LIBOMPTARGET_AMDGPU_DETECTED_ARCH_LIST
       AND "amdgpu" IN_LIST LIBOMPTARGET_PLUGINS_TO_BUILD)
  # Use the first detected architecture. The non-empty check above keeps
  # list(GET) from raising a configure error on an empty list.
  list(GET LIBOMPTARGET_AMDGPU_DETECTED_ARCH_LIST 0 LIBOMPTARGET_DEP_AMDGPU_ARCH)
  set(OFFLOAD_TEST_TARGET_AMDGPU ON)
endif()
| 62 | + |
# Register the device-code build rules for each test source. Every call
# appends the binaries it produces to BIN_PATHS.
foreach(device_test IN ITEMS foo bar)
  add_offload_test_device_code(${device_test}.c ${device_test})
endforeach()

# Aggregate target depending on every device binary collected in BIN_PATHS.
add_custom_target(LibomptUnitTestsDeviceBins DEPENDS ${BIN_PATHS})

# Publish the directory containing the device binaries to the parent scope.
set(OFFLOAD_TEST_DEVICE_CODE_PATH "${CMAKE_CURRENT_BINARY_DIR}" PARENT_SCOPE)
|
0 commit comments