| 
									
										
										
										
											2023-01-21 05:32:57 +08:00
										 |  |  | # Copyright (c) 2017 - 2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 | 
					
						
							| 
									
										
										
										
											2022-04-24 03:02:38 +08:00
										 |  |  | # SPDX-License-Identifier: BSD-3-Clause
 | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  | #
 | 
					
						
							| 
									
										
										
										
											2022-04-24 03:02:38 +08:00
										 |  |  | # Redistribution and use in source and binary forms, with or without
 | 
					
						
							|  |  |  | # modification, are permitted provided that the following conditions are met:
 | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  | #
 | 
					
						
							| 
									
										
										
										
											2022-04-24 03:02:38 +08:00
										 |  |  | # 1. Redistributions of source code must retain the above copyright notice, this
 | 
					
						
							|  |  |  | # list of conditions and the following disclaimer.
 | 
					
						
							|  |  |  | #
 | 
					
						
							|  |  |  | # 2. Redistributions in binary form must reproduce the above copyright notice,
 | 
					
						
							|  |  |  | # this list of conditions and the following disclaimer in the documentation
 | 
					
						
							|  |  |  | # and/or other materials provided with the distribution.
 | 
					
						
							|  |  |  | #
 | 
					
						
							|  |  |  | # 3. Neither the name of the copyright holder nor the names of its
 | 
					
						
							|  |  |  | # contributors may be used to endorse or promote products derived from
 | 
					
						
							|  |  |  | # this software without specific prior written permission.
 | 
					
						
							|  |  |  | #
 | 
					
						
							|  |  |  | # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 | 
					
						
							|  |  |  | # AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 | 
					
						
							|  |  |  | # IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 | 
					
						
							|  |  |  | # DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
 | 
					
						
							|  |  |  | # FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 | 
					
						
							|  |  |  | # DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
 | 
					
						
							|  |  |  | # SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
 | 
					
						
							|  |  |  | # CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
 | 
					
						
							|  |  |  | # OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  | # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 | 
					
						
							|  |  |  | 
 | 
					
						
							# Pick the default for the native CMake CUDA flow. It is OFF only when the
							# CUDA compiler is not clang and CMake is older than 3.12.4; ON otherwise.
							set(CUTLASS_NATIVE_CUDA_INIT ON)
							if(NOT (CUDA_COMPILER MATCHES "[Cc]lang") AND CMAKE_VERSION VERSION_LESS 3.12.4)
							  set(CUTLASS_NATIVE_CUDA_INIT OFF)
							endif()

							# User-visible switch, seeded from the default computed above.
							set(
							  CUTLASS_NATIVE_CUDA
							  ${CUTLASS_NATIVE_CUDA_INIT}
							  CACHE BOOL
							  "Utilize the CMake native CUDA flow"
							  )

							# For backward compatibility, allow use of CUDA_PATH: when the environment
							# provides neither CUDACXX nor CUDA_BIN_PATH, CUDACXX is pointed at the nvcc
							# below CUDA_PATH.
							if(DEFINED ENV{CUDA_PATH})
							  if(NOT DEFINED ENV{CUDACXX} AND NOT DEFINED ENV{CUDA_BIN_PATH})
							    set(ENV{CUDACXX} $ENV{CUDA_PATH}/bin/nvcc)
							  endif()
							endif()
 | 
					
						
							|  |  |  | 
 | 
					
						
							# Bring up the CUDA toolchain through the selected flow and make sure that
							# CUDA_VERSION and CMAKE_CUDA_COMPILER_VERSION are both populated afterwards.
							if(NOT CUTLASS_NATIVE_CUDA)

							  # Legacy flow: locate the toolkit with the FindCUDA module.
							  find_package(CUDA REQUIRED)

							  # Mirror CUDA_VERSION into the native-flow version variable when it is unset.
							  if(NOT CMAKE_CUDA_COMPILER_VERSION)
							    set(CMAKE_CUDA_COMPILER_VERSION ${CUDA_VERSION})
							  endif()

							else()

							  # Native flow: CUDA is enabled as a regular CMake language.
							  enable_language(CUDA)

							  # Fill in the FindCUDA-style variables that the code below reads.
							  if(NOT CUDA_TOOLKIT_ROOT_DIR)
							    # Two directory levels above the CUDA compiler binary.
							    get_filename_component(CUDA_TOOLKIT_ROOT_DIR "${CMAKE_CUDA_COMPILER}/../.." ABSOLUTE)
							  endif()
							  if(NOT CUDA_VERSION)
							    set(CUDA_VERSION ${CMAKE_CUDA_COMPILER_VERSION})
							  endif()

							endif()

							# Configuration stops here for toolkits older than 9.2.
							if(CUDA_VERSION VERSION_LESS 9.2)
							  message(FATAL_ERROR "CUDA 9.2+ Required, Found ${CUDA_VERSION}.")
							endif()

							# In the legacy flow, or whenever the CUDA compiler is clang, record the nvcc
							# found below the toolkit root as CMAKE_CUDA_COMPILER and report it.
							if(CUDA_COMPILER MATCHES "[Cc]lang" OR NOT CUTLASS_NATIVE_CUDA)
							  set(CMAKE_CUDA_COMPILER ${CUDA_TOOLKIT_ROOT_DIR}/bin/nvcc)
							  message(STATUS "CUDA Compiler: ${CMAKE_CUDA_COMPILER}")
							endif()
 | 
					
						
							|  |  |  | 
 | 
					
						
							# Locate the CUDA runtime library. NO_DEFAULT_PATH keeps the search inside the
							# toolkit we are building against; system locations are never consulted.
							find_library(
							  CUDART_LIBRARY cudart
							  PATHS ${CUDA_TOOLKIT_ROOT_DIR}
							  PATH_SUFFIXES lib/x86_64-linux-gnu lib/x64 lib64 lib
							  NO_DEFAULT_PATH
							  )

							# Expose the runtime as the imported target `cudart` (alias nvidia::cudart),
							# unless a target of that name already exists.
							if(TARGET cudart)

							  message(STATUS "CUDART: Already Found")

							elseif(CUDART_LIBRARY)

							  message(STATUS "CUDART: ${CUDART_LIBRARY}")

							  # On Windows the .lib found under lib/x64 is linked statically even though
							  # the code lives in a .dll; the .dll is loaded at run time from the PATH
							  # search. That is why the imported target is STATIC there.
							  if(NOT WIN32)
							    add_library(cudart SHARED IMPORTED GLOBAL)
							  else()
							    add_library(cudart STATIC IMPORTED GLOBAL)
							  endif()

							  add_library(nvidia::cudart ALIAS cudart)

							  set_target_properties(cudart PROPERTIES IMPORTED_LOCATION "${CUDART_LIBRARY}")

							else()

							  message(STATUS "CUDART: Not Found")

							endif()
 | 
					
						
							|  |  |  | 
 | 
					
						
							# Locate the CUDA driver library (`cuda`). The search is restricted to the
							# toolkit we are building against (NO_DEFAULT_PATH); the toolkit's stubs
							# directories are tried after the regular library directories.
							find_library(
							  CUDA_DRIVER_LIBRARY cuda
							  PATHS ${CUDA_TOOLKIT_ROOT_DIR}
							  PATH_SUFFIXES lib/x86_64-linux-gnu lib/x64 lib64 lib lib64/stubs lib/stubs
							  NO_DEFAULT_PATH
							  )

							# Expose the driver as the imported target `cuda_driver` (alias
							# nvidia::cuda_driver), unless a target of that name already exists.
							if(TARGET cuda_driver)

							  message(STATUS "CUDA Driver: Already Found")

							elseif(CUDA_DRIVER_LIBRARY)

							  message(STATUS "CUDA Driver: ${CUDA_DRIVER_LIBRARY}")

							  # On Windows the .lib found under lib/x64 is linked statically even though
							  # the code lives in a .dll; the .dll is loaded at run time from the PATH
							  # search. That is why the imported target is STATIC there.
							  if(NOT WIN32)
							    add_library(cuda_driver SHARED IMPORTED GLOBAL)
							  else()
							    add_library(cuda_driver STATIC IMPORTED GLOBAL)
							  endif()

							  add_library(nvidia::cuda_driver ALIAS cuda_driver)

							  set_target_properties(cuda_driver PROPERTIES IMPORTED_LOCATION "${CUDA_DRIVER_LIBRARY}")

							else()

							  message(STATUS "CUDA Driver: Not Found")

							endif()
 | 
					
						
							|  |  |  | 
 | 
					
						
							# Locate the NVRTC library. NO_DEFAULT_PATH keeps the search inside the
							# toolkit we are building against; system locations are never consulted.
							# lib/x86_64-linux-gnu is searched first, exactly as the cudart and driver
							# searches in this file do, so all three libraries resolve from the same
							# directory layout.
							find_library(
							  NVRTC_LIBRARY nvrtc
							  PATHS
							  ${CUDA_TOOLKIT_ROOT_DIR}
							  PATH_SUFFIXES
							  lib/x86_64-linux-gnu
							  lib/x64
							  lib64
							  lib
							  NO_DEFAULT_PATH
							  )

							# Expose NVRTC as the imported target `nvrtc` (alias nvidia::nvrtc), unless a
							# target of that name already exists.
							if(NOT TARGET nvrtc AND NVRTC_LIBRARY)

							  message(STATUS "NVRTC: ${NVRTC_LIBRARY}")

							  if(WIN32)
							    # Even though we're linking against a .dll, in Windows you statically link
							    # against the .lib file found under lib/x64. The .dll will be loaded at
							    # runtime automatically from the PATH search.
							    add_library(nvrtc STATIC IMPORTED GLOBAL)
							  else()
							    add_library(nvrtc SHARED IMPORTED GLOBAL)
							  endif()

							  add_library(nvidia::nvrtc ALIAS nvrtc)

							  set_property(
							    TARGET nvrtc
							    PROPERTY IMPORTED_LOCATION
							    ${NVRTC_LIBRARY}
							    )

							elseif(TARGET nvrtc)

							  message(STATUS "NVRTC: Already Found")

							else()

							  message(STATUS "NVRTC: Not Found")

							endif()
 | 
					
						
							|  |  |  | 
 | 
					
						
							# Add the CUDA include directories as SYSTEM include paths explicitly: some
							# platforms (e.g. Visual Studio) do not put them on the system include paths
							# by default.
							include_directories(
							  SYSTEM
							  ${CUDA_INCLUDE_DIRS}
							  )
 | 
					
						
							|  |  |  | 
 | 
					
						
							# Marks CUDA sources as C++ when the CUDA compiler is clang.
							#
							# Usage:
							#   cutlass_correct_source_file_language_property([<file>...])
							#
							# Every argument whose name ends in ".cu" gets its LANGUAGE source-file
							# property set to CXX; all other arguments are left alone. When CUDA_COMPILER
							# does not match "[Cc]lang" the function does nothing.
							function(cutlass_correct_source_file_language_property)
							  if(CUDA_COMPILER MATCHES "[Cc]lang")
							    foreach(File ${ARGN})
							      # The backslash is doubled so that the regex engine receives "\." and
							      # matches a literal dot. A single backslash is consumed by CMake's own
							      # string escaping and would turn the dot into "any character".
							      if(File MATCHES "\\.cu$")
							        set_source_files_properties(${File} PROPERTIES LANGUAGE CXX)
							      endif()
							    endforeach()
							  endif()
							endfunction()
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-04-24 03:02:38 +08:00
										 # Unity (combined-source) builds default to ON for MSVC or when
										 # CUTLASS_LIBRARY_KERNELS matches "all", and to OFF otherwise.
										 set(CUTLASS_UNITY_BUILD_ENABLED_INIT OFF)
										 if(MSVC OR CUTLASS_LIBRARY_KERNELS MATCHES "all")
										   set(CUTLASS_UNITY_BUILD_ENABLED_INIT ON)
										 endif()

										 set(
										   CUTLASS_UNITY_BUILD_ENABLED
										   ${CUTLASS_UNITY_BUILD_ENABLED_INIT}
										   CACHE BOOL
										   "Enable combined source compilation"
										   )

										 # Default number of sources per unity file: 8 for MSVC, 16 everywhere else.
										 set(CUTLASS_UNITY_BUILD_BATCH_SIZE_INIT 16)
										 if(MSVC)
										   set(CUTLASS_UNITY_BUILD_BATCH_SIZE_INIT 8)
										 endif()

										 set(
										   CUTLASS_UNITY_BUILD_BATCH_SIZE
										   ${CUTLASS_UNITY_BUILD_BATCH_SIZE_INIT}
										   CACHE STRING
										   "Batch size for unified source files"
										   )
 | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-04-08 04:51:25 +08:00
										 # Batches CUDA sources into generated "unity" files.
										 #
										 # Usage:
										 #   cutlass_unify_source_files(<out_var> [BATCH_SOURCES <bool>] [BATCH_SIZE <n>] [<arg>...])
										 #
										 #   <out_var>      Name of the variable, set in the caller's scope, that
										 #                  receives the resulting argument list.
										 #   BATCH_SOURCES  If true and BATCH_SIZE is absent, the batch size is taken
										 #                  from CUTLASS_UNITY_BUILD_BATCH_SIZE.
										 #   BATCH_SIZE     Maximum number of .cu files included by one unity file.
										 #
										 # When CUTLASS_UNITY_BUILD_ENABLED is true and the batch size is greater than
										 # 1, every argument ending in ".cu" is replaced by generated files in
										 # CMAKE_CURRENT_BINARY_DIR, each of which #includes up to <n> of the originals
										 # by absolute path. The remaining arguments are kept, in order, ahead of the
										 # generated files. In every other case the arguments are returned unchanged.
										 #
										 # NOTE: the generated file name embeds ${NAME}, which is not a parameter of
										 # this function; it resolves to whatever NAME is in the calling scope.
										 function(cutlass_unify_source_files TARGET_ARGS_VAR)

										   set(options)
										   set(oneValueArgs BATCH_SOURCES BATCH_SIZE)
										   set(multiValueArgs)
										   cmake_parse_arguments(_ "${options}" "${oneValueArgs}" "${multiValueArgs}" ${ARGN})

										   if (NOT DEFINED TARGET_ARGS_VAR)
										     message(FATAL_ERROR "TARGET_ARGS_VAR parameter is required")
										   endif()

										   if (__BATCH_SOURCES AND NOT DEFINED __BATCH_SIZE)
										     set(__BATCH_SIZE ${CUTLASS_UNITY_BUILD_BATCH_SIZE})
										   endif()

										   if (CUTLASS_UNITY_BUILD_ENABLED AND DEFINED __BATCH_SIZE AND __BATCH_SIZE GREATER 1)

										     set(CUDA_FILE_ARGS)
										     set(TARGET_SOURCE_ARGS)

										     # Separate the .cu files from everything else. The loop variable is
										     # referenced by name so that its value is dereferenced exactly once, and
										     # the backslash is doubled so the regex engine sees a literal dot.
										     foreach(ARG ${__UNPARSED_ARGUMENTS})
										       if(ARG MATCHES "\\.cu$")
										         list(APPEND CUDA_FILE_ARGS ${ARG})
										       else()
										         list(APPEND TARGET_SOURCE_ARGS ${ARG})
										       endif()
										     endforeach()

										     list(LENGTH CUDA_FILE_ARGS NUM_CUDA_FILE_ARGS)
										     while(NUM_CUDA_FILE_ARGS GREATER 0)
										       # Take the next batch from the front of the list.
										       list(SUBLIST CUDA_FILE_ARGS 0 ${__BATCH_SIZE} CUDA_FILE_BATCH)

										       # The file name carries the first 12 hex digits of the SHA256 of the
										       # batch's file list.
										       string(SHA256 CUDA_FILE_BATCH_HASH "${CUDA_FILE_BATCH}")
										       string(SUBSTRING ${CUDA_FILE_BATCH_HASH} 0 12 CUDA_FILE_BATCH_HASH)
										       set(BATCH_FILE ${CMAKE_CURRENT_BINARY_DIR}/${NAME}.unity.${CUDA_FILE_BATCH_HASH}.cu)
										       message(STATUS "Generating ${BATCH_FILE}")

										       # Assemble the whole unity file in memory first.
										       set(BATCH_CONTENT "// Unity File - Auto Generated!\n")
										       foreach(CUDA_FILE ${CUDA_FILE_BATCH})
										         get_filename_component(CUDA_FILE_ABS_PATH "${CUDA_FILE}" ABSOLUTE)
										         string(APPEND BATCH_CONTENT "#include \"${CUDA_FILE_ABS_PATH}\"\n")
										       endforeach()

										       # Only touch the file when its content changes, so that re-running
										       # CMake does not update the timestamp of an up-to-date unity file.
										       set(EXISTING_BATCH_CONTENT)
										       if(EXISTS "${BATCH_FILE}")
										         file(READ "${BATCH_FILE}" EXISTING_BATCH_CONTENT)
										       endif()
										       if(NOT "${EXISTING_BATCH_CONTENT}" STREQUAL "${BATCH_CONTENT}")
										         file(WRITE "${BATCH_FILE}" "${BATCH_CONTENT}")
										       endif()

										       list(APPEND TARGET_SOURCE_ARGS ${BATCH_FILE})

										       # Stop once the batch just written consumed everything that was left.
										       if (NUM_CUDA_FILE_ARGS LESS_EQUAL __BATCH_SIZE)
										         break()
										       endif()

										       # Drop the consumed batch and continue with the remainder.
										       list(SUBLIST CUDA_FILE_ARGS ${__BATCH_SIZE} -1 CUDA_FILE_ARGS)
										       list(LENGTH CUDA_FILE_ARGS NUM_CUDA_FILE_ARGS)
										     endwhile()

										   else()

										     set(TARGET_SOURCE_ARGS ${__UNPARSED_ARGUMENTS})

										   endif()

										   set(${TARGET_ARGS_VAR} ${TARGET_SOURCE_ARGS} PARENT_SCOPE)

										 endfunction()
 | 
					
						
							# Creates a library target from the given sources using the active CUDA flow.
							#
							# Usage:
							#   cutlass_add_library(<name> [SKIP_GENCODE_FLAGS] [EXPORT_NAME <export>] [<source>...])
							#
							#   <name>              Name of the target to create.
							#   SKIP_GENCODE_FLAGS  Do not call cutlass_apply_cuda_gencode_flags() on the target.
							#   EXPORT_NAME         When given, the alias nvidia::cutlass::<export> is created
							#                       and the target's EXPORT_NAME property is set to <export>.
							#
							# All remaining arguments go through cutlass_unify_source_files() and are then
							# handed to add_library() (native flow or clang) or cuda_add_library().
							function(cutlass_add_library NAME)

							  set(options SKIP_GENCODE_FLAGS)
							  set(oneValueArgs EXPORT_NAME)
							  set(multiValueArgs)
							  cmake_parse_arguments(_ "${options}" "${oneValueArgs}" "${multiValueArgs}" ${ARGN})

							  cutlass_unify_source_files(TARGET_SOURCE_ARGS ${__UNPARSED_ARGUMENTS})

							  # "[Cc]lang" is the pattern used by the toolchain detection code and by
							  # cutlass_correct_source_file_language_property(), so "Clang" and "clang"
							  # select the same branch here as they do there.
							  if(CUTLASS_NATIVE_CUDA OR CUDA_COMPILER MATCHES "[Cc]lang")
							    cutlass_correct_source_file_language_property(${TARGET_SOURCE_ARGS})
							    # NOTE(review): the trailing "" adds an empty source argument; presumably it
							    # lets the call succeed when no sources are listed yet - confirm.
							    add_library(${NAME} ${TARGET_SOURCE_ARGS} "")
							  else()
							    set(CUDA_LINK_LIBRARIES_KEYWORD PRIVATE)
							    cuda_add_library(${NAME} ${TARGET_SOURCE_ARGS} "")
							  endif()

							  cutlass_apply_standard_compile_options(${NAME})
							  if (NOT __SKIP_GENCODE_FLAGS)
							    cutlass_apply_cuda_gencode_flags(${NAME})
							  endif()

							  target_compile_features(
							   ${NAME}
							   INTERFACE
							   cxx_std_11
							   )

							  if(__EXPORT_NAME)
							    add_library(nvidia::cutlass::${__EXPORT_NAME} ALIAS ${NAME})
							    set_target_properties(${NAME} PROPERTIES EXPORT_NAME ${__EXPORT_NAME})
							  endif()

							endfunction()
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-04-08 04:51:25 +08:00
										 # Creates an executable target from the given sources using the active CUDA flow.
										 #
										 # Usage:
										 #   cutlass_add_executable(<name> [<source>...])
										 #
										 #   <name>  Name of the target to create.
										 #
										 # The sources go through cutlass_unify_source_files() and are then handed to
										 # add_executable() (native flow or clang) or cuda_add_executable(). The
										 # standard compile options and CUDA gencode flags are applied to the target.
										 function(cutlass_add_executable NAME)

										   set(options)
										   set(oneValueArgs)
										   set(multiValueArgs)
										   cmake_parse_arguments(_ "${options}" "${oneValueArgs}" "${multiValueArgs}" ${ARGN})

										   cutlass_unify_source_files(TARGET_SOURCE_ARGS ${__UNPARSED_ARGUMENTS})

										   # "[Cc]lang" is the pattern used by the toolchain detection code and by
										   # cutlass_correct_source_file_language_property(), so "Clang" and "clang"
										   # select the same branch here as they do there.
										   if(CUTLASS_NATIVE_CUDA OR CUDA_COMPILER MATCHES "[Cc]lang")
										     cutlass_correct_source_file_language_property(${TARGET_SOURCE_ARGS})
										     add_executable(${NAME} ${TARGET_SOURCE_ARGS})
										   else()
										     set(CUDA_LINK_LIBRARIES_KEYWORD PRIVATE)
										     cuda_add_executable(${NAME} ${TARGET_SOURCE_ARGS})
										   endif()

										   cutlass_apply_standard_compile_options(${NAME})
										   cutlass_apply_cuda_gencode_flags(${NAME})

										   target_compile_features(
										    ${NAME}
										    INTERFACE
										    cxx_std_11
										    )

										 endfunction()
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-04-08 04:51:25 +08:00
										 # Adds sources to an existing target.
										 #
										 # Usage:
										 #   cutlass_target_sources(<name> [<arg>...])
										 #
										 # The arguments are passed through cutlass_unify_source_files(), then through
										 # cutlass_correct_source_file_language_property(), and finally forwarded to
										 # target_sources() for <name>.
										 function(cutlass_target_sources NAME)

										   # No options or keyword arguments are declared, so every argument ends up
										   # in __UNPARSED_ARGUMENTS.
										   cmake_parse_arguments(_ "" "" "" ${ARGN})

										   cutlass_unify_source_files(TARGET_SOURCE_ARGS ${__UNPARSED_ARGUMENTS})
										   cutlass_correct_source_file_language_property(${TARGET_SOURCE_ARGS})

										   target_sources(
										     ${NAME}
										     ${TARGET_SOURCE_ARGS}
										     )

										 endfunction()
 |