mirror of
https://github.com/Kitware/CMake.git
synced 2026-02-18 05:01:50 -06:00
The `native` architecture compiles for the host's GPUs, but our CI jobs
may may run on hosts with GPUs newer than supported by their version of
the CUDA toolkit. Add an undocumented environment variable to tell
CMake to clamp the native architecture to that supported by the toolkit.
Without this, we may try to compile for architectures not supported by
the CUDA Toolkit, which fails. Since commit d1b48bfabd (CUDA: Add
support for CUDA_ARCHITECTURES=native, 2022-03-04), our CUDA 9.2 CI job
fails when it runs on a CI host with a GPU architecture newer than that
CUDA 9.2 supports. Clamping the architecture level fixes that.
Do not document this clamp behavior publicly, at least for now.
Users can be responsible for building with a CUDA toolkit recent
enough to support their host's GPUs.
Issue: #22375
107 lines
4.2 KiB
CMake
107 lines
4.2 KiB
CMake
# See supported GPUs on Wikipedia
|
|
# https://en.wikipedia.org/wiki/CUDA#GPUs_supported
|
|
|
|
# Initial set based on CUDA 7.0.
|
|
set(CMAKE_CUDA_ARCHITECTURES_ALL 20 21 30 35 37 50 52 53)
|
|
set(CMAKE_CUDA_ARCHITECTURES_ALL_MAJOR 20 30 35 50)
|
|
|
|
if(CMAKE_CUDA_COMPILER_TOOLKIT_VERSION VERSION_GREATER_EQUAL 8.0)
|
|
list(APPEND CMAKE_CUDA_ARCHITECTURES_ALL 60 61 62)
|
|
list(APPEND CMAKE_CUDA_ARCHITECTURES_ALL_MAJOR 60)
|
|
endif()
|
|
|
|
if(CMAKE_CUDA_COMPILER_TOOLKIT_VERSION VERSION_GREATER_EQUAL 9.0)
|
|
if(NOT CMAKE_CUDA_COMPILER_ID STREQUAL "Clang" OR CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL 6.0)
|
|
list(APPEND CMAKE_CUDA_ARCHITECTURES_ALL 70 72)
|
|
list(APPEND CMAKE_CUDA_ARCHITECTURES_ALL_MAJOR 70)
|
|
endif()
|
|
|
|
list(REMOVE_ITEM CMAKE_CUDA_ARCHITECTURES_ALL 20 21)
|
|
list(REMOVE_ITEM CMAKE_CUDA_ARCHITECTURES_ALL_MAJOR 20 21)
|
|
endif()
|
|
|
|
if(CMAKE_CUDA_COMPILER_TOOLKIT_VERSION VERSION_GREATER_EQUAL 10.0
|
|
AND (NOT CMAKE_CUDA_COMPILER_ID STREQUAL "Clang" OR CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL 8.0))
|
|
list(APPEND CMAKE_CUDA_ARCHITECTURES_ALL 75)
|
|
endif()
|
|
|
|
if(CMAKE_CUDA_COMPILER_TOOLKIT_VERSION VERSION_GREATER_EQUAL 11.0)
|
|
if(NOT CMAKE_CUDA_COMPILER_ID STREQUAL "Clang" OR CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL 11.0)
|
|
list(APPEND CMAKE_CUDA_ARCHITECTURES_ALL 80)
|
|
list(APPEND CMAKE_CUDA_ARCHITECTURES_ALL_MAJOR 80)
|
|
endif()
|
|
|
|
list(REMOVE_ITEM CMAKE_CUDA_ARCHITECTURES_ALL 30)
|
|
list(REMOVE_ITEM CMAKE_CUDA_ARCHITECTURES_ALL_MAJOR 30)
|
|
endif()
|
|
|
|
if(CMAKE_CUDA_COMPILER_TOOLKIT_VERSION VERSION_GREATER_EQUAL 11.1
|
|
AND (NOT CMAKE_CUDA_COMPILER_ID STREQUAL "Clang" OR CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL 13.0))
|
|
list(APPEND CMAKE_CUDA_ARCHITECTURES_ALL 86)
|
|
endif()
|
|
|
|
if(CMAKE_CUDA_COMPILER_TOOLKIT_VERSION VERSION_GREATER_EQUAL 11.4
|
|
AND (NOT CMAKE_CUDA_COMPILER_ID STREQUAL "Clang"))
|
|
list(APPEND CMAKE_CUDA_ARCHITECTURES_ALL 87)
|
|
endif()
|
|
|
|
# FIXME(#23161): Detect architectures early since we test them during
|
|
# compiler detection. We already have code to detect them later during
|
|
# compiler testing, so we should not need to do this here.
|
|
if(NOT CMAKE_GENERATOR MATCHES "Visual Studio")
|
|
set(_CUDA_ARCHS_EXE "${CMAKE_PLATFORM_INFO_DIR}/CMakeDetermineCUDACompilerArchs.bin")
|
|
execute_process(
|
|
COMMAND "${_CUDA_NVCC_EXECUTABLE}" -o "${_CUDA_ARCHS_EXE}" --cudart=static "${CMAKE_ROOT}/Modules/CMakeCUDACompilerABI.cu"
|
|
RESULT_VARIABLE _CUDA_ARCHS_RESULT
|
|
OUTPUT_VARIABLE _CUDA_ARCHS_OUTPUT
|
|
ERROR_VARIABLE _CUDA_ARCHS_OUTPUT
|
|
)
|
|
if(_CUDA_ARCHS_RESULT EQUAL 0)
|
|
execute_process(
|
|
COMMAND "${_CUDA_ARCHS_EXE}"
|
|
RESULT_VARIABLE _CUDA_ARCHS_RESULT
|
|
OUTPUT_VARIABLE _CUDA_ARCHS_OUTPUT
|
|
ERROR_VARIABLE _CUDA_ARCHS_OUTPUT
|
|
OUTPUT_STRIP_TRAILING_WHITESPACE
|
|
)
|
|
endif()
|
|
if(_CUDA_ARCHS_RESULT EQUAL 0)
|
|
if("$ENV{CMAKE_CUDA_ARCHITECTURES_NATIVE_CLAMP}")
|
|
# Undocumented hook used by CMake's CI.
|
|
# Clamp native architecture to version range supported by this CUDA.
|
|
list(GET CMAKE_CUDA_ARCHITECTURES_ALL 0 _CUDA_ARCH_MIN)
|
|
list(GET CMAKE_CUDA_ARCHITECTURES_ALL -1 _CUDA_ARCH_MAX)
|
|
set(_CUDA_ARCHITECTURES_NATIVE "")
|
|
foreach(_CUDA_ARCH IN LISTS _CUDA_ARCHS_OUTPUT)
|
|
if(_CUDA_ARCH LESS _CUDA_ARCH_MIN)
|
|
set(_CUDA_ARCH "${_CUDA_ARCH_MIN}")
|
|
endif()
|
|
if(_CUDA_ARCH GREATER _CUDA_ARCH_MAX)
|
|
set(_CUDA_ARCH "${_CUDA_ARCH_MAX}")
|
|
endif()
|
|
list(APPEND _CUDA_ARCHITECTURES_NATIVE ${_CUDA_ARCH})
|
|
endforeach()
|
|
unset(_CUDA_ARCH)
|
|
unset(_CUDA_ARCH_MIN)
|
|
unset(_CUDA_ARCH_MAX)
|
|
else()
|
|
set(_CUDA_ARCHITECTURES_NATIVE "${_CUDA_ARCHS_OUTPUT}")
|
|
endif()
|
|
list(REMOVE_DUPLICATES _CUDA_ARCHITECTURES_NATIVE)
|
|
else()
|
|
if (NOT _CUDA_ARCHS_RESULT MATCHES "[0-9]+")
|
|
set(_CUDA_ARCHS_STATUS " (${_CUDA_ARCHS_RESULT})")
|
|
else()
|
|
set(_CUDA_ARCHS_STATUS "")
|
|
endif()
|
|
string(REPLACE "\n" "\n " _CUDA_ARCHS_OUTPUT " ${_CUDA_ARCHS_OUTPUT}")
|
|
file(APPEND ${CMAKE_BINARY_DIR}${CMAKE_FILES_DIRECTORY}/CMakeError.log
|
|
"Detecting the CUDA native architecture(s) failed with "
|
|
"the following output:\n${_CUDA_ARCHS_OUTPUT}\n\n")
|
|
set(_CUDA_ARCHS_OUTPUT "")
|
|
endif()
|
|
unset(_CUDA_ARCHS_EXE)
|
|
unset(_CUDA_ARCHS_RESULT)
|
|
unset(_CUDA_ARCHS_OUTPUT)
|
|
endif()
|