Browse Source

Merge topic 'cuda-thread-flags'

2cc050b53b CUDA: Add test for device linking when host linking uses threads
83c13ca44f FindThreads: Pass -pthread to CUDA compiler through -Xcompiler
cf92fd9ae9 Merge branch 'cuda-filter-device-link-items' into cuda-thread-flags
e768d96c74 CUDA: Filter out host link flags during device linking

Acked-by: Kitware Robot <kwrobot@kitware.com>
Acked-by: Kelly (KT) Thompson <kgt@lanl.gov>
Merge-request: !2512
pull/324/head
Brad King 7 years ago
committed by Kitware Robot
parent
commit
69275d3b6a
  1. 4
      Modules/FindThreads.cmake
  2. 19
      Source/cmLinkLineDeviceComputer.cxx
  3. 1
      Tests/Cuda/CMakeLists.txt
  4. 45
      Tests/Cuda/ProperDeviceLibraries/CMakeLists.txt
  5. 9
      Tests/Cuda/ProperDeviceLibraries/main.cu
  6. 9
      Tests/Cuda/ProperDeviceLibraries/use_pthreads.cu
  7. 9
      Tests/Cuda/ProperDeviceLibraries/use_pthreads.cxx
  8. 1
      Tests/CudaOnly/CMakeLists.txt
  9. 15
      Tests/CudaOnly/LinkSystemDeviceLibraries/CMakeLists.txt

4
Modules/FindThreads.cmake

@ -209,7 +209,9 @@ if(THREADS_FOUND AND NOT TARGET Threads::Threads)
add_library(Threads::Threads INTERFACE IMPORTED)
if(THREADS_HAVE_PTHREAD_ARG)
set_property(TARGET Threads::Threads PROPERTY INTERFACE_COMPILE_OPTIONS "-pthread")
set_property(TARGET Threads::Threads
PROPERTY INTERFACE_COMPILE_OPTIONS "$<$<COMPILE_LANGUAGE:CUDA>:SHELL:-Xcompiler -pthread>"
"$<$<NOT:$<COMPILE_LANGUAGE:CUDA>>:-pthread>")
endif()
if(CMAKE_THREAD_LIBS_INIT)

19
Source/cmLinkLineDeviceComputer.cxx

@ -25,6 +25,23 @@ cmLinkLineDeviceComputer::~cmLinkLineDeviceComputer()
{
}
// Decide whether a raw link item is kept or dropped by the caller.
//
// An item is kept when it is not a flag at all (it does not begin with '-'),
// or when it is one of the library-selection flags -l, -L, --library or
// --library-path (the last one is covered by the "--library" prefix test).
// Every other flag is rejected.
//
//   'cublas_device'     => kept
//   '--library pthread' => kept
//   '-lpthread'         => kept
//   '-pthread'          => dropped
//   '-a'                => dropped
static bool cmLinkItemValidForDevice(std::string const& item)
{
  // Non-flags are always acceptable.
  if (!cmHasLiteralPrefix(item, "-")) {
    return true;
  }
  // Among flags, only the library name/path selectors are acceptable.
  return cmHasLiteralPrefix(item, "-l") || cmHasLiteralPrefix(item, "-L") ||
    cmHasLiteralPrefix(item, "--library");
}
std::string cmLinkLineDeviceComputer::ComputeLinkLibraries(
cmComputeLinkInformation& cli, std::string const& stdLibString)
{
@ -69,7 +86,7 @@ std::string cmLinkLineDeviceComputer::ComputeLinkLibraries(
}
out +=
this->ConvertToOutputFormat(this->ConvertToLinkReference(item.Value));
} else {
} else if (cmLinkItemValidForDevice(item.Value)) {
out += item.Value;
}

1
Tests/Cuda/CMakeLists.txt

@ -4,5 +4,6 @@ ADD_TEST_MACRO(Cuda.ConsumeCompileFeatures CudaConsumeCompileFeatures)
ADD_TEST_MACRO(Cuda.ObjectLibrary CudaObjectLibrary)
ADD_TEST_MACRO(Cuda.MixedStandardLevels MixedStandardLevels)
ADD_TEST_MACRO(Cuda.ToolkitInclude CudaToolkitInclude)
ADD_TEST_MACRO(Cuda.ProperDeviceLibraries ProperDeviceLibraries)
ADD_TEST_MACRO(Cuda.ProperLinkFlags ProperLinkFlags)
ADD_TEST_MACRO(Cuda.WithC CudaWithC)

45
Tests/Cuda/ProperDeviceLibraries/CMakeLists.txt

@ -0,0 +1,45 @@
# Test project: an executable with CUDA separable compilation that links
# against shared libraries which in turn link to threads, both through the
# Threads::Threads imported target and through explicit link flags.
cmake_minimum_required(VERSION 3.13)
project(ProperDeviceLibraries CXX CUDA)

# Generate code for compute capability 3.5.
string(APPEND CMAKE_CUDA_FLAGS " -gencode arch=compute_35,code=compute_35 -gencode arch=compute_35,code=sm_35")
set(CMAKE_CUDA_STANDARD 11)

# Ask FindThreads to prefer the -pthread flag over a plain library name.
set(THREADS_PREFER_PTHREAD_FLAG ON)
find_package(Threads)

# NOTE(review): use_pthreads.cu/.cxx and main.cu guard their pthread calls
# behind USE_THREADS_POSIX and HAVE_PTHREAD_H; nothing in this file defines
# those macros -- confirm whether that is intended.

add_executable(ProperDeviceLibraries main.cu)
set_target_properties(ProperDeviceLibraries
  PROPERTIES CUDA_SEPARABLE_COMPILATION ON)

# Libraries that pick up threads through the imported target.  PUBLIC keeps
# the transitive behavior of the keyword-less signature while matching the
# keyword style used by every other target_link_libraries call below.
add_library(UseThreadsMixed SHARED use_pthreads.cxx use_pthreads.cu)
target_link_libraries(UseThreadsMixed PUBLIC Threads::Threads)

add_library(UseThreadsCuda SHARED use_pthreads.cu)
target_link_libraries(UseThreadsCuda PUBLIC Threads::Threads)

target_link_libraries(ProperDeviceLibraries PRIVATE UseThreadsMixed UseThreadsCuda)

if(THREADS_HAVE_PTHREAD_ARG AND CMAKE_USE_PTHREADS_INIT)
  # Libraries that spell the thread dependency out as raw link items, one
  # per flag form: -pthread, -lpthread and "--library pthread".
  add_library(UseExplicitPThreadsFlag SHARED use_pthreads.cu)
  target_compile_options(UseExplicitPThreadsFlag PUBLIC "-Xcompiler=-pthread")
  target_link_libraries(UseExplicitPThreadsFlag PUBLIC "-pthread")

  add_library(UseExplicitLThreadsFlag SHARED use_pthreads.cu)
  target_compile_options(UseExplicitLThreadsFlag PUBLIC "-Xcompiler=-pthread")
  target_link_libraries(UseExplicitLThreadsFlag PUBLIC "-lpthread")

  add_library(UseExplicitLongThreadsFlag SHARED use_pthreads.cu)
  target_link_libraries(UseExplicitLongThreadsFlag PUBLIC "--library pthread")

  target_link_libraries(ProperDeviceLibraries PRIVATE UseExplicitPThreadsFlag UseExplicitLThreadsFlag UseExplicitLongThreadsFlag)
endif()

if(CMAKE_CUDA_COMPILER_VERSION VERSION_LESS 10.0.0)
  # CUDA 10 removed the cublas_device library.
  target_link_libraries(ProperDeviceLibraries PRIVATE cublas_device)
endif()

if(APPLE)
  # Help the static cuda runtime find the driver (libcuda.dylib) at runtime.
  set_property(TARGET ProperDeviceLibraries PROPERTY BUILD_RPATH ${CMAKE_CUDA_IMPLICIT_LINK_DIRECTORIES})
endif()

9
Tests/CudaOnly/LinkSystemDeviceLibraries/main.cu → Tests/Cuda/ProperDeviceLibraries/main.cu

@ -3,6 +3,15 @@
#include <cuda_runtime.h>
#include <iostream>
// Only compiled when both HAVE_PTHREAD_H and USE_THREADS_POSIX are defined.
#if defined(HAVE_PTHREAD_H) && defined(USE_THREADS_POSIX)
#  include <pthread.h>
// Calls pthread_self() and returns the calling thread's id converted to int.
static int verify_linking_to_pthread()
{
  pthread_t const self = pthread_self();
  return static_cast<int>(self);
}
#endif
// This test only makes sense for versions of CUDA that ship
// static libraries that have separable compilation device symbols.
#if __CUDACC_VER_MAJOR__ <= 9

9
Tests/Cuda/ProperDeviceLibraries/use_pthreads.cu

@ -0,0 +1,9 @@
// This file contributes code only when both HAVE_PTHREAD_H and
// USE_THREADS_POSIX are defined; otherwise it preprocesses to nothing.
#if defined(HAVE_PTHREAD_H) && defined(USE_THREADS_POSIX)
#  include <pthread.h>
// Calls pthread_self() and returns the calling thread's id converted to int.
static int verify_linking_to_pthread_cuda()
{
  pthread_t const self = pthread_self();
  return static_cast<int>(self);
}
#endif

9
Tests/Cuda/ProperDeviceLibraries/use_pthreads.cxx

@ -0,0 +1,9 @@
// This file contributes code only when both HAVE_PTHREAD_H and
// USE_THREADS_POSIX are defined; otherwise it preprocesses to nothing.
#if defined(HAVE_PTHREAD_H) && defined(USE_THREADS_POSIX)
#  include <pthread.h>
// Calls pthread_self() and returns the calling thread's id converted to int.
static int verify_linking_to_pthread_cxx()
{
  pthread_t const self = pthread_self();
  return static_cast<int>(self);
}
#endif

1
Tests/CudaOnly/CMakeLists.txt

@ -3,7 +3,6 @@ ADD_TEST_MACRO(CudaOnly.CircularLinkLine CudaOnlyCircularLinkLine)
ADD_TEST_MACRO(CudaOnly.EnableStandard CudaOnlyEnableStandard)
ADD_TEST_MACRO(CudaOnly.ExportPTX CudaOnlyExportPTX)
ADD_TEST_MACRO(CudaOnly.GPUDebugFlag CudaOnlyGPUDebugFlag)
ADD_TEST_MACRO(CudaOnly.LinkSystemDeviceLibraries CudaOnlyLinkSystemDeviceLibraries)
ADD_TEST_MACRO(CudaOnly.ResolveDeviceSymbols CudaOnlyResolveDeviceSymbols)
ADD_TEST_MACRO(CudaOnly.SeparateCompilation CudaOnlySeparateCompilation)
ADD_TEST_MACRO(CudaOnly.WithDefs CudaOnlyWithDefs)

15
Tests/CudaOnly/LinkSystemDeviceLibraries/CMakeLists.txt

@ -1,15 +0,0 @@
# CUDA-only test project: one executable built with separable compilation
# and linked against the cublas_device library.
cmake_minimum_required(VERSION 3.8)
project(LinkSystemDeviceLibraries CUDA)

# Generate code for compute capability 3.5.
set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} -gencode arch=compute_35,code=compute_35 -gencode arch=compute_35,code=sm_35")
set(CMAKE_CUDA_STANDARD 11)

add_executable(CudaOnlyLinkSystemDeviceLibraries main.cu)
set_property(TARGET CudaOnlyLinkSystemDeviceLibraries
  PROPERTY CUDA_SEPARABLE_COMPILATION ON)
target_link_libraries(CudaOnlyLinkSystemDeviceLibraries PRIVATE cublas_device)

if(APPLE)
  # Help the static cuda runtime find the driver (libcuda.dylib) at runtime.
  set_property(TARGET CudaOnlyLinkSystemDeviceLibraries
    PROPERTY BUILD_RPATH ${CMAKE_CUDA_IMPLICIT_LINK_DIRECTORIES})
endif()
Loading…
Cancel
Save