# 3.18 is the real floor for this file: the cuda_std_11 meta-feature needs
# CMake 3.17 and CMAKE_CUDA_ARCHITECTURES needs CMake 3.18.
cmake_minimum_required(VERSION 3.18)
project(SeparateCompilation LANGUAGES CUDA)

# Goal for this example:
# Build a static library that defines multiple methods and kernels that
# use each other.
# After that, confirm that we can call those methods from dynamic libraries
# and executables.
# We complicate the matter by also testing that multiple static libraries,
# all containing CUDA separable compilation code, link properly.

set(CMAKE_CUDA_ARCHITECTURES 30 35 50 52)

# Set the directory-wide default *before* creating the target so that it
# initializes the CUDA_SEPARABLE_COMPILATION property of CUDASeparateLibA.
set(CMAKE_CUDA_SEPARABLE_COMPILATION ON)
add_library(CUDASeparateLibA STATIC
  file1.cu
  file2.cu
  file3.cu
)
target_compile_features(CUDASeparateLibA PRIVATE cuda_std_11)

# Verify that the variable really initialized the target property.
get_property(sep_comp TARGET CUDASeparateLibA PROPERTY CUDA_SEPARABLE_COMPILATION)
if(NOT sep_comp)
  message(FATAL_ERROR "CUDA_SEPARABLE_COMPILATION not initialized")
endif()

# Remove the default again; the targets created below get the property
# through the explicit set_target_properties() calls further down.
unset(CMAKE_CUDA_SEPARABLE_COMPILATION)

if(CMAKE_CUDA_SIMULATE_ID STREQUAL "MSVC")
  # Test adding a flag that is not in our CUDA flag table for VS.
  if(NOT CMAKE_CUDA_COMPILER_VERSION VERSION_LESS 8)
    string(APPEND CMAKE_CUDA_FLAGS " --ftemplate-depth 50")
  endif()
  # Test adding a flag that nvcc should pass to the host compiler.
  target_compile_options(CUDASeparateLibA PRIVATE -Xcompiler=-bigobj)
endif()

# Having file4/file5 in a shared library causes serious problems
# with the nvcc linker: it will generate bad entries that will
# cause a segv when trying to run the executable. Keep this library STATIC.
add_library(CUDASeparateLibB STATIC
  file4.cu
  file5.cu
)
target_compile_features(CUDASeparateLibB PRIVATE cuda_std_11)
target_link_libraries(CUDASeparateLibB PRIVATE CUDASeparateLibA)

add_executable(CudaOnlySeparateCompilation main.cu)
target_link_libraries(CudaOnlySeparateCompilation PRIVATE CUDASeparateLibB)
set_target_properties(CudaOnlySeparateCompilation
  PROPERTIES
    CUDA_STANDARD 11
    CUDA_STANDARD_REQUIRED TRUE
)

set_target_properties(CUDASeparateLibA CUDASeparateLibB
  PROPERTIES
    CUDA_SEPARABLE_COMPILATION ON
    POSITION_INDEPENDENT_CODE ON
)

if(CMAKE_GENERATOR MATCHES "^Visual Studio")
  # Visual Studio CUDA integration will not perform device linking
  # on a target that itself does not have GenerateRelocatableDeviceCode
  # enabled.
  set_target_properties(CudaOnlySeparateCompilation
    PROPERTIES
      CUDA_SEPARABLE_COMPILATION ON
  )
endif()

if(APPLE)
  # Help the static CUDA runtime find the driver (libcuda.dylib) at runtime.
  set_property(TARGET CudaOnlySeparateCompilation
    PROPERTY BUILD_RPATH ${CMAKE_CUDA_IMPLICIT_LINK_DIRECTORIES})
endif()