| 
									
										
										
										
											2023-09-27 23:18:30 +08:00
										 |  |  | /*************************************************************************************************** | 
					
						
							| 
									
										
										
										
											2024-01-17 03:37:22 +08:00
										 |  |  |  * Copyright (c) 2023 - 2024 NVIDIA CORPORATION & AFFILIATES. All rights reserved. | 
					
						
							| 
									
										
										
										
											2023-09-27 23:18:30 +08:00
										 |  |  |  * SPDX-License-Identifier: BSD-3-Clause | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * Redistribution and use in source and binary forms, with or without | 
					
						
							|  |  |  |  * modification, are permitted provided that the following conditions are met: | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * 1. Redistributions of source code must retain the above copyright notice, this | 
					
						
							|  |  |  |  * list of conditions and the following disclaimer. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * 2. Redistributions in binary form must reproduce the above copyright notice, | 
					
						
							|  |  |  |  * this list of conditions and the following disclaimer in the documentation | 
					
						
							|  |  |  |  * and/or other materials provided with the distribution. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * 3. Neither the name of the copyright holder nor the names of its | 
					
						
							|  |  |  |  * contributors may be used to endorse or promote products derived from | 
					
						
							|  |  |  |  * this software without specific prior written permission. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | 
					
						
							|  |  |  |  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | 
					
						
							|  |  |  |  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE | 
					
						
							|  |  |  |  * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE | 
					
						
							|  |  |  |  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL | 
					
						
							|  |  |  |  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR | 
					
						
							|  |  |  |  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER | 
					
						
							|  |  |  |  * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, | 
					
						
							|  |  |  |  * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE | 
					
						
							|  |  |  |  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  **************************************************************************************************/ | 
					
						
							|  |  |  | /*! \file | 
					
						
							|  |  |  |     \brief Unit tests for conversion operators. | 
					
						
							|  |  |  | */ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #include "../common/cutlass_unit_test.h" | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #include "cutlass/numeric_conversion.h" | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #include "cutlass/layout/matrix.h" | 
					
						
							|  |  |  | #include "cutlass/util/host_tensor.h" | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | ///////////////////////////////////////////////////////////////////////////////////////////////// | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | namespace test { | 
					
						
							|  |  |  | namespace core { | 
					
						
							|  |  |  | namespace kernel { | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /// Simple conversion function | 
					
						
							|  |  |  | template <typename Destination, typename Source, int Count> | 
					
						
							|  |  |  | __global__ void convert( | 
					
						
							|  |  |  |   cutlass::Array<Destination, Count> *destination, | 
					
						
							|  |  |  |   cutlass::Array<Source, Count> const *source) { | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   cutlass::FastNumericArrayConverter<Destination, Source, Count> convert; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   *destination = convert(*source); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | ///////////////////////////////////////////////////////////////////////////////////////////////// | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | template <typename Destination, typename Source, int Count> | 
					
						
							|  |  |  | void run_test_integer_range_limited() { | 
					
						
							|  |  |  |   const int kN = Count; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   dim3 grid(1, 1); | 
					
						
							|  |  |  |   dim3 block(1, 1); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   cutlass::HostTensor<Destination, cutlass::layout::RowMajor> destination({1, kN}); | 
					
						
							|  |  |  |   cutlass::HostTensor<Source, cutlass::layout::RowMajor> source({1, kN}); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   for (int i = 0; i < kN; ++i) { | 
					
						
							| 
									
										
										
										
											2024-08-30 11:11:06 +08:00
										 |  |  |     source.host_view().at({0, i}) = Source(i % 4); | 
					
						
							| 
									
										
										
										
											2023-09-27 23:18:30 +08:00
										 |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   source.sync_device(); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   convert<Destination, Source, kN><<< grid, block >>>( | 
					
						
							|  |  |  |     reinterpret_cast<cutlass::Array<Destination, kN> *>(destination.device_data()), | 
					
						
							|  |  |  |     reinterpret_cast<cutlass::Array<Source, kN> const *>(source.device_data()) | 
					
						
							|  |  |  |   ); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   destination.sync_host(); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   for (int i = 0; i < kN; ++i) { | 
					
						
							| 
									
										
										
										
											2024-08-30 11:11:06 +08:00
										 |  |  |     EXPECT_TRUE(float(destination.host_view().at({0, i})) == float(source.host_view().at({0, i}))); | 
					
						
							| 
									
										
										
										
											2023-09-27 23:18:30 +08:00
										 |  |  |   } | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | template <typename Destination, typename Source, int Count> | 
					
						
							|  |  |  | void run_test_integer_range_all() { | 
					
						
							|  |  |  |   const int kN = Count; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   dim3 grid(1, 1); | 
					
						
							|  |  |  |   dim3 block(1, 1); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   cutlass::HostTensor<Destination, cutlass::layout::RowMajor> destination({1, kN}); | 
					
						
							|  |  |  |   cutlass::HostTensor<Source, cutlass::layout::RowMajor> source({1, kN}); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-08-30 11:11:06 +08:00
										 |  |  |   int const kIntSourceMin = cutlass::platform::numeric_limits<Source>::lowest(); | 
					
						
							|  |  |  |   int const kIntSourceMax = cutlass::platform::numeric_limits<Source>::max(); | 
					
						
							| 
									
										
										
										
											2023-09-27 23:18:30 +08:00
										 |  |  |   int const kIntRange = kIntSourceMax - kIntSourceMin + 1; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   for (int i = 0; i < kN; ++i) { | 
					
						
							| 
									
										
										
										
											2024-08-30 11:11:06 +08:00
										 |  |  |     source.host_view().at({0, i}) = Source(kIntSourceMin + (i % kIntRange)); | 
					
						
							| 
									
										
										
										
											2024-10-10 03:33:27 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-27 23:18:30 +08:00
										 |  |  |   } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   source.sync_device(); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   convert<Destination, Source, kN><<< grid, block >>>( | 
					
						
							|  |  |  |     reinterpret_cast<cutlass::Array<Destination, kN> *>(destination.device_data()), | 
					
						
							|  |  |  |     reinterpret_cast<cutlass::Array<Source, kN> const *>(source.device_data()) | 
					
						
							|  |  |  |   ); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   destination.sync_host(); | 
					
						
							| 
									
										
										
										
											2023-11-02 23:09:05 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-27 23:18:30 +08:00
										 |  |  |   // Verify conversion | 
					
						
							|  |  |  |   bool passed = true; | 
					
						
							| 
									
										
										
										
											2024-10-10 03:33:27 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-27 23:18:30 +08:00
										 |  |  |   for (int i = 0; i < kN; ++i) { | 
					
						
							| 
									
										
										
										
											2024-08-30 11:11:06 +08:00
										 |  |  |     if(!(float(destination.host_view().at({0, i})) == float(source.host_view().at({0, i})))) { | 
					
						
							| 
									
										
										
										
											2023-09-27 23:18:30 +08:00
										 |  |  |       passed = false; | 
					
						
							|  |  |  |       break; | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |   } | 
					
						
							| 
									
										
										
										
											2024-10-10 03:33:27 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-27 23:18:30 +08:00
										 |  |  |   EXPECT_TRUE(passed) << " FastNumericArrayConverter failed"; | 
					
						
							| 
									
										
										
										
											2023-11-02 23:09:05 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-27 23:18:30 +08:00
										 |  |  |    // Print out results for the failed conversion. | 
					
						
							|  |  |  |    if (!passed) { | 
					
						
							|  |  |  |     for (int i = 0; i < kN; ++i) { | 
					
						
							| 
									
										
										
										
											2024-08-30 11:11:06 +08:00
										 |  |  |         std::cout << "source(" << float(source.host_view().at({0, i})) << ") -> " | 
					
						
							|  |  |  |                   << "destination ("<< float(destination.host_view().at({0, i})) << ")" << std::endl; | 
					
						
							| 
									
										
										
										
											2023-09-27 23:18:30 +08:00
										 |  |  |     } | 
					
						
							|  |  |  |    } | 
					
						
							|  |  |  |    std::flush(std::cout); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | } // namespace kernel | 
					
						
							|  |  |  | } // namespace core | 
					
						
							|  |  |  | } // namespace test | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | ///////////////////////////////////////////////////////////////////////////////////////////////// | 
					
						
							|  |  |  | TEST(FastNumericConversion, s32_to_f32) { | 
					
						
							|  |  |  |   int const kN = 4; | 
					
						
							|  |  |  |   using Source = int; | 
					
						
							|  |  |  |   using Destination = float; | 
					
						
							|  |  |  |   test::core::kernel::run_test_integer_range_limited<Destination, Source, kN>(); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-12-30 04:21:31 +08:00
										 |  |  | TEST(FastNumericConversion, s8_to_f32_array) { | 
					
						
							|  |  |  |   int const kN = 256; | 
					
						
							|  |  |  |   using Source = int8_t; | 
					
						
							|  |  |  |   using Destination = float; | 
					
						
							|  |  |  |   test::core::kernel::run_test_integer_range_all<Destination, Source, kN>(); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | TEST(FastNumericConversion, u8_to_f32_array) { | 
					
						
							|  |  |  |   int const kN = 256; | 
					
						
							|  |  |  |   using Source = uint8_t; | 
					
						
							|  |  |  |   using Destination = float; | 
					
						
							|  |  |  |   test::core::kernel::run_test_integer_range_all<Destination, Source, kN>(); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-09-27 23:18:30 +08:00
										 |  |  | TEST(FastNumericConversion, s8_to_f16_array) { | 
					
						
							|  |  |  |   int const kN = 256; | 
					
						
							|  |  |  |   using Source = int8_t; | 
					
						
							|  |  |  |   using Destination = cutlass::half_t; | 
					
						
							|  |  |  |   test::core::kernel::run_test_integer_range_all<Destination, Source, kN>(); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | TEST(FastNumericConversion, u8_to_f16_array) { | 
					
						
							|  |  |  |   int const kN = 256; | 
					
						
							|  |  |  |   using Source = uint8_t; | 
					
						
							|  |  |  |   using Destination = cutlass::half_t; | 
					
						
							|  |  |  |   test::core::kernel::run_test_integer_range_all<Destination, Source, kN>(); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | TEST(FastNumericConversion, u8_to_bf16_array) { | 
					
						
							|  |  |  |   int const kN = 256; | 
					
						
							|  |  |  |   using Source = uint8_t; | 
					
						
							|  |  |  |   using Destination = cutlass::bfloat16_t; | 
					
						
							|  |  |  |   test::core::kernel::run_test_integer_range_all<Destination, Source, kN>(); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | TEST(FastNumericConversion, s8_to_bf16_array) { | 
					
						
							|  |  |  |   int const kN = 256; | 
					
						
							|  |  |  |   using Source = int8_t; | 
					
						
							|  |  |  |   using Destination = cutlass::bfloat16_t; | 
					
						
							|  |  |  |   test::core::kernel::run_test_integer_range_all<Destination, Source, kN>(); | 
					
						
							|  |  |  | } | 
					
						
							| 
									
										
										
										
											2024-08-30 11:11:06 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | TEST(FastNumericConversion, s4_to_s8_array) { | 
					
						
							|  |  |  |   int const kN = 16; | 
					
						
							|  |  |  |   using Source = cutlass::int4b_t; | 
					
						
							|  |  |  |   using Destination = int8_t; | 
					
						
							|  |  |  |   test::core::kernel::run_test_integer_range_all<Destination, Source, kN>(); | 
					
						
							|  |  |  | } |