# Copyright (c) 2017-2021, NVIDIA CORPORATION. All rights reserved. # # Redistribution and use in source and binary forms, with or without modification, are permitted # provided that the following conditions are met: # * Redistributions of source code must retain the above copyright notice, this list of # conditions and the following disclaimer. # * Redistributions in binary form must reproduce the above copyright notice, this list of # conditions and the following disclaimer in the documentation and/or other materials # provided with the distribution. # * Neither the name of the NVIDIA CORPORATION nor the names of its contributors may be used # to endorse or promote products derived from this software without specific prior written # permission. # # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR # IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND # FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE # FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, # BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; # OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, # STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. # # Sources for CUTLASS Profiler Tool # set(CUTLASS_TOOLS_PROFILER_SOURCES src/main.cpp src/cutlass_profiler.cu src/options.cu src/performance_report.cpp src/enumerated_types.cpp src/gpu_timer.cpp src/device_allocation.cu src/device_context.cu src/cublas_helpers.cu src/cudnn_helpers.cpp src/problem_space.cpp src/operation_profiler.cu src/gemm_operation_profiler.cu src/conv2d_operation_profiler.cu src/conv3d_operation_profiler.cu src/sparse_gemm_operation_profiler.cu ) # # Build target # cutlass_add_executable( cutlass_profiler ${CUTLASS_TOOLS_PROFILER_SOURCES} ) add_executable(nvidia::cutlass::profiler ALIAS cutlass_profiler) set_target_properties(cutlass_profiler PROPERTIES EXPORT_NAME profiler) # # Include paths # target_include_directories( cutlass_profiler PRIVATE ${CMAKE_CURRENT_LIST_DIR}/src ) # # Library dependencies # target_link_libraries( cutlass_profiler PRIVATE cutlass_lib cutlass_tools_util_includes $<$:nvidia::cublas> $<$:nvidia::cudnn> cudart ) install( TARGETS cutlass_profiler EXPORT NvidiaCutlass RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR} ) set(CUTLASS_PROFILER_TEST_COMMAND_OPTIONS_GEMM --operation=Gemm --providers=cutlass --verification-providers=cublas,device --junit-output=test_cutlass_profiler_gemm) set(CUTLASS_PROFILER_TEST_COMMAND_OPTIONS_CONV2D --operation=Conv2d --providers=cutlass --verification-providers=cudnn,device --junit-output=test_cutlass_profiler_conv2d) set(CUTLASS_PROFILER_TEST_COMMAND_OPTIONS_CONV3D --operation=Conv3d --providers=cutlass --verification-providers=cudnn,device,host --junit-output=test_cutlass_profiler_conv3d) set(CUTLASS_PROFILER_TEST_COMMAND_OPTIONS_SPGEMM --operation=SparseGemm --providers=cutlass --verification-providers=cublas,device,host --junit-output=test_cutlass_profiler_spgemm) cutlass_add_executable_tests( test_profiler cutlass_profiler DEPENDEES test_all TEST_COMMAND_OPTIONS CUTLASS_PROFILER_TEST_COMMAND_OPTIONS_GEMM CUTLASS_PROFILER_TEST_COMMAND_OPTIONS_CONV2D CUTLASS_PROFILER_TEST_COMMAND_OPTIONS_CONV3D CUTLASS_PROFILER_TEST_COMMAND_OPTIONS_SPGEMM DISABLE_EXECUTABLE_INSTALL_RULE )