| 
									
										
										
										
											2022-04-24 03:02:38 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | # Copyright (c) 2017 - 2022 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 | 
					
						
							|  |  |  | # SPDX-License-Identifier: BSD-3-Clause
 | 
					
						
							|  |  |  | #
 | 
					
						
							|  |  |  | # Redistribution and use in source and binary forms, with or without
 | 
					
						
							|  |  |  | # modification, are permitted provided that the following conditions are met:
 | 
					
						
							|  |  |  | #
 | 
					
						
							|  |  |  | # 1. Redistributions of source code must retain the above copyright notice, this
 | 
					
						
							|  |  |  | # list of conditions and the following disclaimer.
 | 
					
						
							| 
									
										
										
										
											2018-09-19 07:58:03 +08:00
										 |  |  | #
 | 
					
						
							| 
									
										
										
										
											2022-04-24 03:02:38 +08:00
										 |  |  | # 2. Redistributions in binary form must reproduce the above copyright notice,
 | 
					
						
							|  |  |  | # this list of conditions and the following disclaimer in the documentation
 | 
					
						
							|  |  |  | # and/or other materials provided with the distribution.
 | 
					
						
							| 
									
										
										
										
											2018-09-19 07:58:03 +08:00
										 |  |  | #
 | 
					
						
							| 
									
										
										
										
											2022-04-24 03:02:38 +08:00
										 |  |  | # 3. Neither the name of the copyright holder nor the names of its
 | 
					
						
							|  |  |  | # contributors may be used to endorse or promote products derived from
 | 
					
						
							|  |  |  | # this software without specific prior written permission.
 | 
					
						
							|  |  |  | #
 | 
					
						
							|  |  |  | # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 | 
					
						
							|  |  |  | # AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 | 
					
						
							|  |  |  | # IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 | 
					
						
							|  |  |  | # DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
 | 
					
						
							|  |  |  | # FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 | 
					
						
							|  |  |  | # DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
 | 
					
						
							|  |  |  | # SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
 | 
					
						
							|  |  |  | # CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
 | 
					
						
							|  |  |  | # OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 | 
					
						
							| 
									
										
										
										
											2018-09-19 07:58:03 +08:00
										 |  |  | # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-04-24 03:02:38 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  | set(CUTLASS_EXAMPLES_COMMON_SOURCE_DIR ${CMAKE_CURRENT_SOURCE_DIR}/common)
 | 
					
						
							| 
									
										
										
										
											2019-03-21 01:49:17 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-11-20 13:25:25 +08:00
										 |  |  | add_custom_target(cutlass_examples)
 | 
					
						
							|  |  |  | add_custom_target(test_examples)
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-04-08 04:51:25 +08:00
										 |  |  | function(cutlass_example_add_executable NAME)
 | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  |   set(options)
 | 
					
						
							| 
									
										
										
										
											2021-07-23 12:40:53 +08:00
										 |  |  |   set(oneValueArgs DISABLE_TESTS)
 | 
					
						
							| 
									
										
										
										
											2020-11-20 13:25:25 +08:00
										 |  |  |   set(multiValueArgs DEPENDS DEPENDEES TEST_COMMAND_OPTIONS)
 | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  |   cmake_parse_arguments(_ "${options}" "${oneValueArgs}" "${multiValueArgs}" ${ARGN})
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-07-23 12:40:53 +08:00
										 |  |  |   if (NOT DEFINED __DISABLE_TESTS)
 | 
					
						
							|  |  |  |     set(__DISABLE_TESTS OFF)
 | 
					
						
							|  |  |  |   endif()
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-04-08 04:51:25 +08:00
										 |  |  |   cutlass_add_executable(${NAME} ${__UNPARSED_ARGUMENTS})
 | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-11-20 13:25:25 +08:00
										 |  |  |   add_dependencies(cutlass_examples ${NAME})
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  |   target_link_libraries( | 
					
						
							|  |  |  |     ${NAME}
 | 
					
						
							|  |  |  |     PRIVATE
 | 
					
						
							|  |  |  |     CUTLASS
 | 
					
						
							|  |  |  |     cutlass_tools_util_includes
 | 
					
						
							| 
									
										
										
										
											2021-12-18 05:04:43 +08:00
										 |  |  |     $<$<BOOL:${CUTLASS_ENABLE_CUBLAS}>:nvidia::cublas>
 | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  |     )
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   target_include_directories( | 
					
						
							|  |  |  |     ${NAME}
 | 
					
						
							|  |  |  |     PRIVATE
 | 
					
						
							|  |  |  |     ${CUTLASS_EXAMPLES_COMMON_SOURCE_DIR}
 | 
					
						
							|  |  |  |     )
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-11-20 13:25:25 +08:00
										 |  |  |   install( | 
					
						
							|  |  |  |     TARGETS ${NAME}
 | 
					
						
							|  |  |  |     RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR}
 | 
					
						
							| 
									
										
										
										
											2020-06-16 01:47:01 +08:00
										 |  |  |     )
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-11-20 13:25:25 +08:00
										 |  |  |   cutlass_add_executable_tests( | 
					
						
							|  |  |  |     test_examples_${NAME} ${NAME}
 | 
					
						
							|  |  |  |     DEPENDS ${__DEPENDS}
 | 
					
						
							|  |  |  |     DEPENDEES test_examples ${__DEPENDEES}
 | 
					
						
							|  |  |  |     TEST_COMMAND_OPTIONS ${__TEST_COMMAND_OPTIONS}
 | 
					
						
							|  |  |  |     DISABLE_EXECUTABLE_INSTALL_RULE
 | 
					
						
							| 
									
										
										
										
											2021-07-23 12:40:53 +08:00
										 |  |  |     DISABLE_TESTS ${__DISABLE_TESTS}
 | 
					
						
							| 
									
										
										
										
											2020-11-20 13:25:25 +08:00
										 |  |  |     )
 | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-11-20 13:25:25 +08:00
										 |  |  | endfunction()
 | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | foreach(EXAMPLE | 
					
						
							|  |  |  |   00_basic_gemm
 | 
					
						
							|  |  |  |   01_cutlass_utilities
 | 
					
						
							|  |  |  |   02_dump_reg_shmem
 | 
					
						
							|  |  |  |   03_visualize_layout
 | 
					
						
							|  |  |  |   04_tile_iterator
 | 
					
						
							|  |  |  |   05_batched_gemm
 | 
					
						
							|  |  |  |   06_splitK_gemm
 | 
					
						
							|  |  |  |   07_volta_tensorop_gemm
 | 
					
						
							| 
									
										
										
										
											2020-04-08 04:51:25 +08:00
										 |  |  |   08_turing_tensorop_gemm
 | 
					
						
							| 
									
										
										
										
											2020-11-20 13:25:25 +08:00
										 |  |  |   09_turing_tensorop_conv2dfprop
 | 
					
						
							| 
									
										
										
										
											2020-04-08 04:51:25 +08:00
										 |  |  |   10_planar_complex
 | 
					
						
							|  |  |  |   11_planar_complex_array
 | 
					
						
							| 
									
										
										
										
											2020-06-09 07:17:35 +08:00
										 |  |  |   12_gemm_bias_relu
 | 
					
						
							| 
									
										
										
										
											2022-03-24 02:52:54 +08:00
										 |  |  |   13_two_tensor_op_fusion
 | 
					
						
							| 
									
										
										
										
											2020-09-24 05:00:58 +08:00
										 |  |  |   14_ampere_tf32_tensorop_gemm
 | 
					
						
							|  |  |  |   15_ampere_sparse_tensorop_gemm
 | 
					
						
							| 
									
										
										
										
											2021-02-26 22:58:26 +08:00
										 |  |  |   16_ampere_tensorop_conv2dfprop
 | 
					
						
							|  |  |  |   17_fprop_per_channel_bias
 | 
					
						
							| 
									
										
										
										
											2021-07-23 12:40:53 +08:00
										 |  |  |   18_ampere_fp64_tensorop_affine2_gemm
 | 
					
						
							|  |  |  |   19_tensorop_canonical
 | 
					
						
							|  |  |  |   20_simt_canonical
 | 
					
						
							|  |  |  |   21_quaternion_gemm
 | 
					
						
							|  |  |  |   22_quaternion_conv
 | 
					
						
							| 
									
										
										
										
											2021-09-21 04:34:47 +08:00
										 |  |  |   23_ampere_gemm_operand_reduction_fusion
 | 
					
						
							| 
									
										
										
										
											2021-11-20 05:26:35 +08:00
										 |  |  |   24_gemm_grouped
 | 
					
						
							|  |  |  |   25_ampere_fprop_mainloop_fusion
 | 
					
						
							|  |  |  |   26_ampere_wgrad_mainloop_fusion
 | 
					
						
							|  |  |  |   27_ampere_3xtf32_fast_accurate_tensorop_gemm
 | 
					
						
							|  |  |  |   28_ampere_3xtf32_fast_accurate_tensorop_fprop
 | 
					
						
							|  |  |  |   29_ampere_3xtf32_fast_accurate_tensorop_complex_gemm
 | 
					
						
							| 
									
										
										
										
											2022-03-24 02:52:54 +08:00
										 |  |  |   30_wgrad_split_k
 | 
					
						
							| 
									
										
										
										
											2022-04-24 03:02:38 +08:00
										 |  |  |   31_basic_syrk
 | 
					
						
							|  |  |  |   32_basic_trmm
 | 
					
						
							|  |  |  |   33_ampere_3xtf32_tensorop_symm
 | 
					
						
							| 
									
										
										
										
											2022-03-24 02:52:54 +08:00
										 |  |  |   34_transposed_conv2d
 | 
					
						
							| 
									
										
										
										
											2022-04-24 03:02:38 +08:00
										 |  |  |   35_gemm_softmax
 | 
					
						
							|  |  |  |   36_gather_scatter_fusion
 | 
					
						
							| 
									
										
										
										
											2022-09-04 06:48:46 +08:00
										 |  |  |   37_gemm_layernorm_gemm_fusion
 | 
					
						
							|  |  |  |   38_syr2k_grouped
 | 
					
						
							|  |  |  |   39_gemm_permute
 | 
					
						
							|  |  |  |   41_multi_head_attention
 | 
					
						
							| 
									
										
										
										
											2020-11-20 13:25:25 +08:00
										 |  |  |   )
 | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  |   add_subdirectory(${EXAMPLE})
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | endforeach()
 |