mirror of
https://github.com/Kitware/CMake.git
synced 2026-05-13 01:29:02 -05:00
Merge branch 'cuda-thread-flags' into release-3.13
Merge-request: !2512
This commit is contained in:
@@ -208,7 +208,9 @@ if(THREADS_FOUND AND NOT TARGET Threads::Threads)
|
||||
add_library(Threads::Threads INTERFACE IMPORTED)
|
||||
|
||||
if(THREADS_HAVE_PTHREAD_ARG)
|
||||
set_property(TARGET Threads::Threads PROPERTY INTERFACE_COMPILE_OPTIONS "-pthread")
|
||||
set_property(TARGET Threads::Threads
|
||||
PROPERTY INTERFACE_COMPILE_OPTIONS "$<$<COMPILE_LANGUAGE:CUDA>:SHELL:-Xcompiler -pthread>"
|
||||
"$<$<NOT:$<COMPILE_LANGUAGE:CUDA>>:-pthread>")
|
||||
endif()
|
||||
|
||||
if(CMAKE_THREAD_LIBS_INIT)
|
||||
|
||||
@@ -25,6 +25,23 @@ cmLinkLineDeviceComputer::~cmLinkLineDeviceComputer()
|
||||
{
|
||||
}
|
||||
|
||||
static bool cmLinkItemValidForDevice(std::string const& item)
|
||||
{
|
||||
// Valid items are:
|
||||
// * Non-flags (does not start with '-')
|
||||
// * Specific flags --library, --library-path, -l, -L
|
||||
// For example:
|
||||
// * 'cublas_device' => pass-along
|
||||
// * '--library pthread' => pass-along
|
||||
// * '-lpthread' => pass-along
|
||||
// * '-pthread' => drop
|
||||
// * '-a' => drop
|
||||
return (!cmHasLiteralPrefix(item, "-") || //
|
||||
cmHasLiteralPrefix(item, "-l") || //
|
||||
cmHasLiteralPrefix(item, "-L") || //
|
||||
cmHasLiteralPrefix(item, "--library"));
|
||||
}
|
||||
|
||||
std::string cmLinkLineDeviceComputer::ComputeLinkLibraries(
|
||||
cmComputeLinkInformation& cli, std::string const& stdLibString)
|
||||
{
|
||||
@@ -69,7 +86,7 @@ std::string cmLinkLineDeviceComputer::ComputeLinkLibraries(
|
||||
}
|
||||
out +=
|
||||
this->ConvertToOutputFormat(this->ConvertToLinkReference(item.Value));
|
||||
} else {
|
||||
} else if (cmLinkItemValidForDevice(item.Value)) {
|
||||
out += item.Value;
|
||||
}
|
||||
|
||||
|
||||
@@ -4,5 +4,6 @@ ADD_TEST_MACRO(Cuda.ConsumeCompileFeatures CudaConsumeCompileFeatures)
|
||||
ADD_TEST_MACRO(Cuda.ObjectLibrary CudaObjectLibrary)
|
||||
ADD_TEST_MACRO(Cuda.MixedStandardLevels MixedStandardLevels)
|
||||
ADD_TEST_MACRO(Cuda.ToolkitInclude CudaToolkitInclude)
|
||||
ADD_TEST_MACRO(Cuda.ProperDeviceLibraries ProperDeviceLibraries)
|
||||
ADD_TEST_MACRO(Cuda.ProperLinkFlags ProperLinkFlags)
|
||||
ADD_TEST_MACRO(Cuda.WithC CudaWithC)
|
||||
|
||||
@@ -0,0 +1,45 @@
|
||||
cmake_minimum_required(VERSION 3.13)
|
||||
project(ProperDeviceLibraries CXX CUDA)
|
||||
|
||||
string(APPEND CMAKE_CUDA_FLAGS " -gencode arch=compute_35,code=compute_35 -gencode arch=compute_35,code=sm_35")
|
||||
set(CMAKE_CUDA_STANDARD 11)
|
||||
|
||||
set(THREADS_PREFER_PTHREAD_FLAG ON)
|
||||
find_package(Threads)
|
||||
|
||||
add_executable(ProperDeviceLibraries main.cu)
|
||||
set_target_properties(ProperDeviceLibraries
|
||||
PROPERTIES CUDA_SEPARABLE_COMPILATION ON)
|
||||
|
||||
add_library(UseThreadsMixed SHARED use_pthreads.cxx use_pthreads.cu)
|
||||
target_link_libraries(UseThreadsMixed Threads::Threads)
|
||||
|
||||
add_library(UseThreadsCuda SHARED use_pthreads.cu)
|
||||
target_link_libraries(UseThreadsCuda Threads::Threads)
|
||||
|
||||
target_link_libraries(ProperDeviceLibraries PRIVATE UseThreadsMixed UseThreadsCuda)
|
||||
|
||||
if(THREADS_HAVE_PTHREAD_ARG AND CMAKE_USE_PTHREADS_INIT)
|
||||
add_library(UseExplicitPThreadsFlag SHARED use_pthreads.cu)
|
||||
target_compile_options(UseExplicitPThreadsFlag PUBLIC "-Xcompiler=-pthread")
|
||||
target_link_libraries(UseExplicitPThreadsFlag PUBLIC "-pthread")
|
||||
|
||||
add_library(UseExplicitLThreadsFlag SHARED use_pthreads.cu)
|
||||
target_compile_options(UseExplicitLThreadsFlag PUBLIC "-Xcompiler=-pthread")
|
||||
target_link_libraries(UseExplicitLThreadsFlag PUBLIC "-lpthread")
|
||||
|
||||
add_library(UseExplicitLongThreadsFlag SHARED use_pthreads.cu)
|
||||
target_link_libraries(UseExplicitLongThreadsFlag PUBLIC "--library pthread")
|
||||
|
||||
target_link_libraries(ProperDeviceLibraries PRIVATE UseExplicitPThreadsFlag UseExplicitLThreadsFlag UseExplicitLongThreadsFlag)
|
||||
endif()
|
||||
|
||||
if(CMAKE_CUDA_COMPILER_VERSION VERSION_LESS 10.0.0)
|
||||
#CUDA 10 removed the cublas_device library
|
||||
target_link_libraries(ProperDeviceLibraries PRIVATE cublas_device)
|
||||
endif()
|
||||
|
||||
if(APPLE)
|
||||
# Help the static cuda runtime find the driver (libcuda.dylib) at runtime.
|
||||
set_property(TARGET ProperDeviceLibraries PROPERTY BUILD_RPATH ${CMAKE_CUDA_IMPLICIT_LINK_DIRECTORIES})
|
||||
endif()
|
||||
+9
@@ -3,6 +3,15 @@
|
||||
#include <cuda_runtime.h>
|
||||
#include <iostream>
|
||||
|
||||
#if defined(USE_THREADS_POSIX) && defined(HAVE_PTHREAD_H)
|
||||
|
||||
# include <pthread.h>
|
||||
static int verify_linking_to_pthread()
|
||||
{
|
||||
return static_cast<int>(pthread_self());
|
||||
}
|
||||
#endif
|
||||
|
||||
// this test only makes sense for versions of CUDA that ship
|
||||
// static libraries that have separable compilation device symbols
|
||||
#if __CUDACC_VER_MAJOR__ <= 9
|
||||
@@ -0,0 +1,9 @@
|
||||
|
||||
#if defined(USE_THREADS_POSIX) && defined(HAVE_PTHREAD_H)
|
||||
|
||||
# include <pthread.h>
|
||||
static int verify_linking_to_pthread_cuda()
|
||||
{
|
||||
return static_cast<int>(pthread_self());
|
||||
}
|
||||
#endif
|
||||
@@ -0,0 +1,9 @@
|
||||
|
||||
#if defined(USE_THREADS_POSIX) && defined(HAVE_PTHREAD_H)
|
||||
|
||||
# include <pthread.h>
|
||||
static int verify_linking_to_pthread_cxx()
|
||||
{
|
||||
return static_cast<int>(pthread_self());
|
||||
}
|
||||
#endif
|
||||
@@ -3,7 +3,6 @@ ADD_TEST_MACRO(CudaOnly.CircularLinkLine CudaOnlyCircularLinkLine)
|
||||
ADD_TEST_MACRO(CudaOnly.EnableStandard CudaOnlyEnableStandard)
|
||||
ADD_TEST_MACRO(CudaOnly.ExportPTX CudaOnlyExportPTX)
|
||||
ADD_TEST_MACRO(CudaOnly.GPUDebugFlag CudaOnlyGPUDebugFlag)
|
||||
ADD_TEST_MACRO(CudaOnly.LinkSystemDeviceLibraries CudaOnlyLinkSystemDeviceLibraries)
|
||||
ADD_TEST_MACRO(CudaOnly.ResolveDeviceSymbols CudaOnlyResolveDeviceSymbols)
|
||||
ADD_TEST_MACRO(CudaOnly.SeparateCompilation CudaOnlySeparateCompilation)
|
||||
ADD_TEST_MACRO(CudaOnly.WithDefs CudaOnlyWithDefs)
|
||||
|
||||
@@ -1,15 +0,0 @@
|
||||
cmake_minimum_required(VERSION 3.8)
|
||||
project(LinkSystemDeviceLibraries CUDA)
|
||||
|
||||
string(APPEND CMAKE_CUDA_FLAGS " -gencode arch=compute_35,code=compute_35 -gencode arch=compute_35,code=sm_35")
|
||||
set(CMAKE_CUDA_STANDARD 11)
|
||||
|
||||
add_executable(CudaOnlyLinkSystemDeviceLibraries main.cu)
|
||||
set_target_properties( CudaOnlyLinkSystemDeviceLibraries
|
||||
PROPERTIES CUDA_SEPARABLE_COMPILATION ON)
|
||||
target_link_libraries( CudaOnlyLinkSystemDeviceLibraries PRIVATE cublas_device)
|
||||
|
||||
if(APPLE)
|
||||
# Help the static cuda runtime find the driver (libcuda.dylib) at runtime.
|
||||
set_property(TARGET CudaOnlyLinkSystemDeviceLibraries PROPERTY BUILD_RPATH ${CMAKE_CUDA_IMPLICIT_LINK_DIRECTORIES})
|
||||
endif()
|
||||
Reference in New Issue
Block a user