| 
									
										
										
										
											2023-01-24 09:55:28 +08:00
										 |  |  | /***************************************************************************************************
 | 
					
						
							|  |  |  |  * Copyright (c) 2017 - 2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved. | 
					
						
							|  |  |  |  * SPDX-License-Identifier: BSD-3-Clause | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * Redistribution and use in source and binary forms, with or without | 
					
						
							|  |  |  |  * modification, are permitted provided that the following conditions are met: | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * 1. Redistributions of source code must retain the above copyright notice, this | 
					
						
							|  |  |  |  * list of conditions and the following disclaimer. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * 2. Redistributions in binary form must reproduce the above copyright notice, | 
					
						
							|  |  |  |  * this list of conditions and the following disclaimer in the documentation | 
					
						
							|  |  |  |  * and/or other materials provided with the distribution. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * 3. Neither the name of the copyright holder nor the names of its | 
					
						
							|  |  |  |  * contributors may be used to endorse or promote products derived from | 
					
						
							|  |  |  |  * this software without specific prior written permission. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | 
					
						
							|  |  |  |  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | 
					
						
							|  |  |  |  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE | 
					
						
							|  |  |  |  * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE | 
					
						
							|  |  |  |  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL | 
					
						
							|  |  |  |  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR | 
					
						
							|  |  |  |  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER | 
					
						
							|  |  |  |  * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, | 
					
						
							|  |  |  |  * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE | 
					
						
							|  |  |  |  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  **************************************************************************************************/ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #include "cutlass_unit_test.h"
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-08-26 11:05:46 +08:00
										 |  |  | // C<uint32_t(something)>::value_type is not uint32_t for GCC 7.5.0.
 | 
					
						
							|  |  |  | // This test is thus disabled for GCC < 8.
 | 
					
						
							|  |  |  | #if defined(__GNUC__) && (__GNUC__ < 8)
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-01-24 09:55:28 +08:00
										 |  |  | #include <cutlass/trace.h>
 | 
					
						
							|  |  |  | #include <cute/swizzle.hpp>
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-08-26 11:05:46 +08:00
										 |  |  | namespace { // (anonymous)
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   // This function exists to work around a Clang 14 issue, in which
 | 
					
						
							|  |  |  |   // the compiler tries to instantiate code that lives inside the
 | 
					
						
							|  |  |  |   // "else" branch of an "if constexpr," even when the "else" branch
 | 
					
						
							|  |  |  |   // is false.  That triggers a spurious static_assert in MixedBits.
 | 
					
						
							|  |  |  |   // The work-around is to make the body of the "else" branch a
 | 
					
						
							|  |  |  |   // function, rather than leaving it in line.
 | 
					
						
							|  |  |  |   //
 | 
					
						
							|  |  |  |   // Some compilers strangely deduce the first two terms of
 | 
					
						
							|  |  |  |   // make_integer_sequence<uint32_t, 8> as C<false> and C<true>, and
 | 
					
						
							|  |  |  |   // the remaining terms as C<2>, C<3>, etc.  Making this function take
 | 
					
						
							|  |  |  |   // cute::integral_constant<uint32_t, S0_value>, etc. doesn't work
 | 
					
						
							|  |  |  |   // with those compilers.
 | 
					
						
							|  |  |  |   template<class S0_type, S0_type S0_value, | 
					
						
							|  |  |  |     class F0_type, F0_type F0_value, | 
					
						
							|  |  |  |     class S1_type, S1_type S1_value, | 
					
						
							|  |  |  |     class F1_type, F1_type F1_value> | 
					
						
							|  |  |  |   void clang14_workaround(cute::integral_constant<S0_type, S0_value>, | 
					
						
							|  |  |  |     cute::integral_constant<F0_type, F0_value>, | 
					
						
							|  |  |  |     cute::integral_constant<S1_type, S1_value>, | 
					
						
							|  |  |  |     cute::integral_constant<F1_type, F1_value>) | 
					
						
							|  |  |  |   { | 
					
						
							|  |  |  |     constexpr cute::C<static_cast<uint32_t>(S0_value)> S0{}; | 
					
						
							|  |  |  |     constexpr cute::C<static_cast<uint32_t>(F0_value)> F0{}; | 
					
						
							|  |  |  |     constexpr cute::C<static_cast<uint32_t>(S1_value)> S1{}; | 
					
						
							|  |  |  |     constexpr cute::C<static_cast<uint32_t>(F1_value)> F1{}; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     for (uint32_t d0 = 0; d0 < 8; ++d0) { | 
					
						
							|  |  |  |       if ((d0 & F0) != d0) { continue; }    // Skip repeats
 | 
					
						
							|  |  |  |       for (uint32_t d1 = 0; d1 < 8; ++d1) { | 
					
						
							|  |  |  |         if ((d1 & F1) != d1) { continue; }  // Skip repeats
 | 
					
						
							|  |  |  |         auto m0 = make_mixed_bits(S0, d0, F0); | 
					
						
							|  |  |  |         auto m1 = make_mixed_bits(S1, d1, F1); | 
					
						
							|  |  |  |         //print(m0); print(" & "); print(m1); print(" = "); print(m0 & m1); print("\n");
 | 
					
						
							|  |  |  |         EXPECT_EQ(uint32_t(m0 & m1), uint32_t(m0) & uint32_t(m1)); | 
					
						
							|  |  |  |         //print(m0); print(" | "); print(m1); print(" = "); print(m0 | m1); print("\n");
 | 
					
						
							|  |  |  |         EXPECT_EQ(uint32_t(m0 | m1), uint32_t(m0) | uint32_t(m1)); | 
					
						
							|  |  |  |         //print(m0); print(" ^ "); print(m1); print(" = "); print(m0 ^ m1); print("\n");
 | 
					
						
							|  |  |  |         EXPECT_EQ(uint32_t(m0 ^ m1), uint32_t(m0) ^ uint32_t(m1)); | 
					
						
							|  |  |  |       } | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |   } | 
					
						
							|  |  |  | } // namespace (anonymous)
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-01-24 09:55:28 +08:00
										 |  |  | TEST(CuTe_core, MixedBits) { | 
					
						
							|  |  |  |   using namespace cute; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   auto uzero = cute::integral_constant<uint32_t, 0>{}; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   for_each(make_integer_sequence<uint32_t, 8>{}, [&](auto S0) { | 
					
						
							|  |  |  |     for_each(make_integer_sequence<uint32_t, 8>{}, [&](auto F0) { | 
					
						
							|  |  |  |       for_each(make_integer_sequence<uint32_t, 8>{}, [&](auto S1) { | 
					
						
							|  |  |  |         for_each(make_integer_sequence<uint32_t, 8>{}, [&](auto F1) { | 
					
						
							|  |  |  |           if constexpr (decltype(S0 == uzero || S1 == uzero)::value) { | 
					
						
							|  |  |  |             return; | 
					
						
							|  |  |  |           } else if constexpr (decltype((S0 & F0) != uzero || (S1 & F1) != uzero)::value) { | 
					
						
							|  |  |  |             return; | 
					
						
							|  |  |  |           } else { | 
					
						
							| 
									
										
										
										
											2023-08-26 11:05:46 +08:00
										 |  |  |             clang14_workaround(S0, F0, S1, F1); | 
					
						
							| 
									
										
										
										
											2023-01-24 09:55:28 +08:00
										 |  |  |           } | 
					
						
							|  |  |  |         }); | 
					
						
							|  |  |  |       }); | 
					
						
							|  |  |  |     }); | 
					
						
							|  |  |  |   }); | 
					
						
							|  |  |  | } | 
					
						
							| 
									
										
										
										
											2023-08-26 11:05:46 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | TEST(CuTe_core, MakeIntegerSequence) { | 
					
						
							|  |  |  |   cute::for_each(cute::make_integer_sequence<uint32_t, 8>{}, [](auto c) { | 
					
						
							|  |  |  |     using c_type = decltype(c); | 
					
						
							|  |  |  |     constexpr auto c_value = c_type::value; | 
					
						
							|  |  |  |     using expected_type = cute::integral_constant<uint32_t, c_value>; | 
					
						
							|  |  |  |     static_assert(cute::is_same_v<c_type, expected_type>); | 
					
						
							|  |  |  |   }); | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #endif // defined(__GNUC__) && (__GNUC__ < 8)
 |