2023-01-21 05:32:57 +08:00
|
|
|
# Copyright (c) 2017 - 2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
|
2022-04-24 03:02:38 +08:00
|
|
|
# SPDX-License-Identifier: BSD-3-Clause
|
2018-09-19 07:58:03 +08:00
|
|
|
#
|
2022-04-24 03:02:38 +08:00
|
|
|
# Redistribution and use in source and binary forms, with or without
|
|
|
|
# modification, are permitted provided that the following conditions are met:
|
2018-09-19 07:58:03 +08:00
|
|
|
#
|
2022-04-24 03:02:38 +08:00
|
|
|
# 1. Redistributions of source code must retain the above copyright notice, this
|
|
|
|
# list of conditions and the following disclaimer.
|
|
|
|
#
|
|
|
|
# 2. Redistributions in binary form must reproduce the above copyright notice,
|
|
|
|
# this list of conditions and the following disclaimer in the documentation
|
|
|
|
# and/or other materials provided with the distribution.
|
|
|
|
#
|
|
|
|
# 3. Neither the name of the copyright holder nor the names of its
|
|
|
|
# contributors may be used to endorse or promote products derived from
|
|
|
|
# this software without specific prior written permission.
|
|
|
|
#
|
|
|
|
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
|
|
|
# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
|
|
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
|
|
|
|
# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
|
|
|
|
# FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
|
|
|
|
# DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
|
|
|
|
# SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
|
|
|
|
# CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
|
|
|
|
# OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
2018-09-19 07:58:03 +08:00
|
|
|
# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
|
2023-08-08 08:50:32 +08:00
|
|
|
# Require a Python 3 interpreter, version 3.5 or newer; configuration stops
# with an error if no suitable interpreter can be found.
find_package(Python3 3.5 REQUIRED COMPONENTS Interpreter)
|
|
|
|
|
2019-11-20 08:55:34 +08:00
|
|
|
#
# Sources for CUTLASS Profiler Tool
#

# Opt in to the NEW behavior of policy CMP0112 (target file component
# generator expressions do not add target dependencies). This is set before
# the cutlass_profiler target is declared later in this file.
cmake_policy(SET CMP0112 NEW)

# Source files handed to cutlass_add_executable() for the cutlass_profiler
# target. Order is kept exactly as originally listed.
set(CUTLASS_TOOLS_PROFILER_SOURCES
  # Entry point, option handling, reporting and shared utilities
  src/main.cpp
  src/cutlass_profiler.cu
  src/options.cu
  src/performance_report.cpp
  src/enumerated_types.cpp
  src/gpu_timer.cpp
  src/device_allocation.cu
  src/device_context.cu
  src/cublas_helpers.cu
  src/cudnn_helpers.cpp
  src/problem_space.cpp

  # Per-operation profilers
  src/operation_profiler.cu
  src/gemm_operation_profiler.cu
  src/rank_k_operation_profiler.cu
  src/rank_2k_operation_profiler.cu
  src/trmm_operation_profiler.cu
  src/symm_operation_profiler.cu
  src/conv2d_operation_profiler.cu
  src/conv3d_operation_profiler.cu
  src/sparse_gemm_operation_profiler.cu
)
|
|
|
|
|
2019-11-20 08:55:34 +08:00
|
|
|
#
# Build target
#

# Declare the profiler executable from the source list defined earlier in
# this file. cutlass_add_executable() is a project helper defined outside this
# file; NOTE(review): presumably it wraps add_executable() - confirm.
cutlass_add_executable(
  cutlass_profiler
  ${CUTLASS_TOOLS_PROFILER_SOURCES}
)

# Namespaced alias so the executable can be referenced as
# nvidia::cutlass::profiler.
add_executable(nvidia::cutlass::profiler ALIAS cutlass_profiler)

# Name used for this target when it is exported ("profiler" instead of
# "cutlass_profiler").
set_target_properties(cutlass_profiler PROPERTIES EXPORT_NAME profiler)
|
|
|
|
|
|
|
|
#
# Include paths
#

# Headers under this directory's include/ folder are needed only to build the
# profiler itself, so they are added with PRIVATE visibility.
target_include_directories(
  cutlass_profiler
  PRIVATE
  ${CMAKE_CURRENT_LIST_DIR}/include
)
|
2019-11-20 08:55:34 +08:00
|
|
|
|
|
|
|
#
# Library dependencies
#

# All dependencies are PRIVATE: they are used to build the executable only.
# nvidia::cublas and nvidia::cudnn are linked only when CUTLASS_ENABLE_CUBLAS
# and CUTLASS_ENABLE_CUDNN, respectively, evaluate to true; otherwise the
# generator expressions expand to nothing.
# NOTE(review): cutlass_lib, cutlass_tools_util_includes, cudart and
# cuda_driver are presumably targets defined elsewhere in the project - confirm.
target_link_libraries(
  cutlass_profiler
  PRIVATE
  cutlass_lib
  cutlass_tools_util_includes
  $<$<BOOL:${CUTLASS_ENABLE_CUBLAS}>:nvidia::cublas>
  $<$<BOOL:${CUTLASS_ENABLE_CUDNN}>:nvidia::cudnn>
  cudart
  cuda_driver
)
|
|
|
|
|
|
|
|
# Install the profiler binary into the configured binary directory and record
# it in the NvidiaCutlass export set.
install(
  TARGETS cutlass_profiler
  EXPORT NvidiaCutlass
  RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR}
)
|
2020-11-20 13:25:25 +08:00
|
|
|
|
2023-09-27 05:24:26 +08:00
|
|
|
# Command-line option lists for the profiler test runs, one variable per
# operation kind. The suffix after CUTLASS_PROFILER_TEST_COMMAND_OPTIONS_
# matches a name listed under TEST_COMMAND_OPTIONS in the
# cutlass_add_executable_tests() call later in this file.
#
# Every list selects a single operation, restricts the provider to cutlass,
# names the verification providers for that operation, sets a junit output
# name and enables --print-kernel-before-running.
set(CUTLASS_PROFILER_TEST_COMMAND_OPTIONS_GEMM
  --operation=Gemm
  --providers=cutlass
  --verification-providers=cublas,device
  --junit-output=test_cutlass_profiler_gemm
  --print-kernel-before-running=true
)

set(CUTLASS_PROFILER_TEST_COMMAND_OPTIONS_CONV2D
  --operation=Conv2d
  --providers=cutlass
  --verification-providers=cudnn,device
  --junit-output=test_cutlass_profiler_conv2d
  --print-kernel-before-running=true
)

set(CUTLASS_PROFILER_TEST_COMMAND_OPTIONS_CONV3D
  --operation=Conv3d
  --providers=cutlass
  --verification-providers=cudnn,device,host
  --junit-output=test_cutlass_profiler_conv3d
  --print-kernel-before-running=true
)

set(CUTLASS_PROFILER_TEST_COMMAND_OPTIONS_SPGEMM
  --operation=SparseGemm
  --providers=cutlass
  --verification-providers=cublas,device,host
  --junit-output=test_cutlass_profiler_spgemm
  --print-kernel-before-running=true
)

set(CUTLASS_PROFILER_TEST_COMMAND_OPTIONS_RANK_K
  --operation=RankK
  --providers=cutlass
  --verification-providers=cublas
  --junit-output=test_cutlass_profiler_rank_k
  --print-kernel-before-running=true
)

set(CUTLASS_PROFILER_TEST_COMMAND_OPTIONS_RANK_2K
  --operation=Rank2K
  --providers=cutlass
  --verification-providers=cublas
  --junit-output=test_cutlass_profiler_rank_2k
  --print-kernel-before-running=true
)

set(CUTLASS_PROFILER_TEST_COMMAND_OPTIONS_TRMM
  --operation=Trmm
  --providers=cutlass
  --verification-providers=device,host
  --junit-output=test_cutlass_profiler_trmm
  --print-kernel-before-running=true
)

set(CUTLASS_PROFILER_TEST_COMMAND_OPTIONS_SYMM
  --operation=Symm
  --providers=cutlass
  --verification-providers=cublas,host
  --junit-output=test_cutlass_profiler_symm
  --print-kernel-before-running=true
)
|
2022-04-24 03:02:38 +08:00
|
|
|
|
2020-11-20 13:25:25 +08:00
|
|
|
# Register profiler test runs for the cutlass_profiler executable under the
# test name test_profiler.
#
# Each entry under TEST_COMMAND_OPTIONS is the suffix of one
# CUTLASS_PROFILER_TEST_COMMAND_OPTIONS_<suffix> variable set earlier in this
# file, and TEST_COMMAND_OPTIONS_PREFIX carries the shared prefix.
# NOTE(review): cutlass_add_executable_tests() is defined outside this file;
# presumably it joins prefix + suffix to look up each option list, attaches
# the tests to the test_all target via DEPENDEES, and skips the install rule
# for the executable when DISABLE_EXECUTABLE_INSTALL_RULE is given - confirm
# against the helper's definition.
cutlass_add_executable_tests(
  test_profiler cutlass_profiler
  DEPENDEES test_all
  TEST_COMMAND_OPTIONS
    GEMM
    CONV2D
    CONV3D
    SPGEMM
    RANK_K
    RANK_2K
    TRMM
    SYMM
  TEST_COMMAND_OPTIONS_PREFIX
    CUTLASS_PROFILER_TEST_COMMAND_OPTIONS_
  DISABLE_EXECUTABLE_INSTALL_RULE
)
|
2022-11-19 22:02:15 +08:00
|
|
|
|