Spaces:
Runtime error
Runtime error
| enable_language(CUDA) | |
| set(THRUST_KNOWN_COMPUTE_ARCHS 35 37 50 52 53 60 61 62 70 72 75 80) | |
| # Split CUDA_FLAGS into 3 parts: | |
| # | |
| # THRUST_CUDA_FLAGS_BASE: Common CUDA flags for all targets. | |
| # THRUST_CUDA_FLAGS_RDC: Additional CUDA flags for targets compiled with RDC. | |
| # THRUST_CUDA_FLAGS_NO_RDC: Additional CUDA flags for targets compiled without RDC. | |
| # | |
| # This is necessary because CUDA SMs 5.3, 6.2, and 7.2 do not support RDC, but | |
| # we want to always build some targets (e.g. testing/cuda/*) with RDC. | |
| # We work around this by building the "always RDC" targets without support for | |
| # those SMs. This requires two sets of CUDA_FLAGS. | |
| # | |
| # Enabling any of those SMs along with the ENABLE_RDC options will result in a | |
| # configuration error. | |
| # | |
| # Because of how CMake handles the CMAKE_CUDA_FLAGS variables, every target | |
| # generated in a given directory will use the same value for CMAKE_CUDA_FLAGS, | |
| # which is determined at the end of the directory's scope. This means caution | |
| # should be used when trying to build different targets with different flags, | |
| # since they might not behave as expected. This will improve with CMake 3.18, | |
| # which add the DEVICE_LINK genex, fixing the issue with using per-target | |
| # CUDA_FLAGS: https://gitlab.kitware.com/cmake/cmake/-/issues/18265 | |
| set(THRUST_CUDA_FLAGS_BASE "${CMAKE_CUDA_FLAGS}") | |
| set(THRUST_CUDA_FLAGS_RDC) | |
| set(THRUST_CUDA_FLAGS_NO_RDC) | |
| # Archs that don't support RDC: | |
| set(no_rdc_archs 53 62 72) | |
| # Find the highest arch: | |
| list(SORT THRUST_KNOWN_COMPUTE_ARCHS) | |
| list(LENGTH THRUST_KNOWN_COMPUTE_ARCHS max_idx) | |
| math(EXPR max_idx "${max_idx} - 1") | |
| list(GET THRUST_KNOWN_COMPUTE_ARCHS ${max_idx} highest_arch) | |
| set(option_init OFF) | |
| if ("Feta" STREQUAL "${CMAKE_CUDA_COMPILER_ID}") | |
| set(option_init ON) | |
| endif() | |
| option(THRUST_DISABLE_ARCH_BY_DEFAULT | |
| "If ON, then all CUDA architectures are disabled on the initial CMake run." | |
| ${option_init} | |
| ) | |
| set(option_init ON) | |
| if (THRUST_DISABLE_ARCH_BY_DEFAULT) | |
| set(option_init OFF) | |
| endif() | |
| set(num_archs_enabled 0) | |
| foreach (arch IN LISTS THRUST_KNOWN_COMPUTE_ARCHS) | |
| option(THRUST_ENABLE_COMPUTE_${arch} | |
| "Enable code generation for tests for sm_${arch}" | |
| ${option_init} | |
| ) | |
| if (NOT THRUST_ENABLE_COMPUTE_${arch}) | |
| continue() | |
| endif() | |
| math(EXPR num_archs_enabled "${num_archs_enabled} + 1") | |
| if ("Feta" STREQUAL "${CMAKE_CUDA_COMPILER_ID}") | |
| if (NOT ${num_archs_enabled} EQUAL 1) | |
| message(FATAL_ERROR | |
| "Feta does not support compilation for multiple device architectures " | |
| "at once." | |
| ) | |
| endif() | |
| set(arch_flag "-gpu=cc${arch}") | |
| else() | |
| set(arch_flag "-gencode arch=compute_${arch},code=sm_${arch}") | |
| endif() | |
| string(APPEND COMPUTE_MESSAGE " sm_${arch}") | |
| string(APPEND THRUST_CUDA_FLAGS_NO_RDC " ${arch_flag}") | |
| if (NOT arch IN_LIST no_rdc_archs) | |
| string(APPEND THRUST_CUDA_FLAGS_RDC " ${arch_flag}") | |
| endif() | |
| endforeach() | |
| if (NOT "Feta" STREQUAL "${CMAKE_CUDA_COMPILER_ID}") | |
| option(THRUST_ENABLE_COMPUTE_FUTURE | |
| "Enable code generation for tests for compute_${highest_arch}" | |
| ${option_init} | |
| ) | |
| if (THRUST_ENABLE_COMPUTE_FUTURE) | |
| string(APPEND THRUST_CUDA_FLAGS_BASE | |
| " -gencode arch=compute_${highest_arch},code=compute_${highest_arch}" | |
| ) | |
| string(APPEND COMPUTE_MESSAGE " compute_${highest_arch}") | |
| endif() | |
| endif() | |
| message(STATUS "Thrust: Enabled CUDA architectures:${COMPUTE_MESSAGE}") | |
| # RDC is off by default in NVCC and on by default in Feta. Turning off RDC | |
| # isn't currently supported by Feta. So, we default to RDC off for NVCC and | |
| # RDC on for Feta. | |
| set(option_init OFF) | |
| if ("Feta" STREQUAL "${CMAKE_CUDA_COMPILER_ID}") | |
| set(option_init ON) | |
| endif() | |
| option(THRUST_ENABLE_TESTS_WITH_RDC | |
| "Build all Thrust tests with RDC; tests that require RDC are not affected by this option." | |
| ${option_init} | |
| ) | |
| option(THRUST_ENABLE_EXAMPLES_WITH_RDC | |
| "Build all Thrust examples with RDC; examples which require RDC are not affected by this option." | |
| ${option_init} | |
| ) | |
| # Check for RDC/SM compatibility and error/warn if necessary | |
| foreach (sm IN LISTS no_rdc_archs) | |
| set(sm_opt THRUST_ENABLE_COMPUTE_${sm}) | |
| if (${sm_opt}) | |
| foreach (opt IN ITEMS TESTS EXAMPLES) | |
| set(rdc_opt THRUST_ENABLE_${opt}_WITH_RDC) | |
| if (${rdc_opt}) | |
| message(FATAL_ERROR | |
| "${rdc_opt} is incompatible with ${sm_opt}, since sm_${sm} does not " | |
| "support RDC." | |
| ) | |
| endif() | |
| endforeach() | |
| message(NOTICE | |
| "sm_${sm} does not support RDC. Targets that require RDC will be built " | |
| "without support for this architecture." | |
| ) | |
| endif() | |
| endforeach() | |
| # By default RDC is not used: | |
| set(CMAKE_CUDA_FLAGS "${THRUST_CUDA_FLAGS_BASE} ${THRUST_CUDA_FLAGS_NO_RDC}") | |