/*************************************************************************************************** * Copyright (c) 2017 - 2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved. * SPDX-License-Identifier: BSD-3-Clause * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions are met: * * 1. Redistributions of source code must retain the above copyright notice, this * list of conditions and the following disclaimer. * * 2. Redistributions in binary form must reproduce the above copyright notice, * this list of conditions and the following disclaimer in the documentation * and/or other materials provided with the distribution. * * 3. Neither the name of the copyright holder nor the names of its * contributors may be used to endorse or promote products derived from * this software without specific prior written permission. * * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. * **************************************************************************************************/ #include "cutlass_unit_test.h" #include #include template void test_complement(Layout const& layout, CoSizeHi const& cosize_hi) { using namespace cute; auto result = complement(layout, cosize_hi); CUTLASS_TRACE_HOST("complement( " << layout << ", " << cosize_hi << ") => " << result); // Post-condition on the domain size of the complement (1) EXPECT_GE( size(result), cosize_hi / size(filter(layout))); // Post-condition on the codomain size of the complement (2) EXPECT_LE(cosize(result), cute::ceil_div(cosize_hi, cosize(layout)) * cosize(layout)); // Post-condition on the codomain of the complement for (int i = 1; i < size(result); ++i) { EXPECT_LT(result(i-1), result(i)); // Ordered (3) for (int j = 0; j < size(layout); ++j) { EXPECT_NE(result(i), layout(j)); // Complemented (4) } } // Other observations EXPECT_LE(size(result),cosize(result)); // As a result of the ordered condition (3) EXPECT_GE(cosize(result), cosize_hi / size(filter(layout))); // As a result of (1) (2) and (5) if constexpr (is_static::value) { // If we can apply complement again EXPECT_EQ(size(complement(make_layout(layout,result))), 1); // There's no more codomain left over } } template void test_complement(Layout const& layout) { return test_complement(layout, cosize(layout)); } TEST(CuTe_core, Complement) { using namespace cute; CUTLASS_TRACE_HOST("-------------------------------"); CUTLASS_TRACE_HOST("COMPLEMENT"); CUTLASS_TRACE_HOST("-------------------------------"); { auto layout = Layout<_1,_0>{}; test_complement(layout); test_complement(layout, Int<2>{}); } { auto layout = Layout<_1,_1>{}; test_complement(layout); test_complement(layout, Int<2>{}); } { auto layout = Layout<_1,_2>{}; test_complement(layout, Int<1>{}); test_complement(layout, Int<2>{}); test_complement(layout, Int<8>{}); } { auto layout = Layout<_4,_0>{}; test_complement(layout, Int<1>{}); test_complement(layout, Int<2>{}); test_complement(layout, Int<8>{}); } { auto layout = Layout<_4,_1>{}; test_complement(layout, Int<1>{}); test_complement(layout, Int<2>{}); test_complement(layout, Int<8>{}); } { auto layout = Layout<_4,_2>{}; test_complement(layout, Int<1>{}); test_complement(layout); test_complement(layout, Int<16>{}); } { auto layout = Layout<_4,_4>{}; test_complement(layout, Int<1>{}); test_complement(layout); test_complement(layout, Int<17>{}); } { auto layout = Layout>{}; test_complement(layout); } { auto layout = Layout>{}; test_complement(layout); } { auto layout = Layout, Stride<_1,_4>>{}; test_complement(layout); } { auto layout = Layout, Stride<_8,_1,_64>>{}; test_complement(layout); } { auto layout = Layout, Stride<_8,_1,_0>>{}; test_complement(layout); test_complement(layout, Int<460>{}); } { auto layout = make_layout(Shape,Shape<_2, _2>>{}, Stride,Stride<_8,_32>>{}); test_complement(layout); } { auto layout = make_layout(Shape,Shape<_2, _2>>{}, Stride,Stride<_8,_4>>{}); test_complement(layout); } // Fails due to non-injective input //{ //auto layout = make_layout(Shape,Shape<_2, _2>>{}, // Stride,Stride<_8,_4>>{}); //test_complement(layout); //} { auto layout = Layout, Stride<_1,_6>>{}; test_complement(layout); } { auto layout = Layout, Stride<_1,_10>>{}; test_complement(layout); } { auto layout = Layout, Stride<_1,_16>>{}; test_complement(layout); } CUTLASS_TRACE_HOST("-------------------------------"); CUTLASS_TRACE_HOST("Dynamic shapes/strides"); CUTLASS_TRACE_HOST("-------------------------------"); { auto layout = make_layout(12); test_complement(layout, 1); test_complement(layout); test_complement(layout, 53); test_complement(layout, 128); } { auto layout = make_layout(12, 1); test_complement(layout, 1); test_complement(layout); test_complement(layout, 53); test_complement(layout, 128); } { auto layout = make_layout(12, Int<2>{}); test_complement(layout, 1); test_complement(layout); test_complement(layout, 53); test_complement(layout, 128); } { auto layout = make_layout(12, 2); test_complement(layout, 1); test_complement(layout); test_complement(layout, 53); test_complement(layout, 128); } { auto layout = make_layout(make_shape(3,6),make_stride(_1{}, _3{})); test_complement(layout); } { auto layout = make_layout(make_shape(3,6),make_stride(_1{}, _9{})); test_complement(layout); } { auto layout = make_layout(make_shape(3,6),make_stride(_1{}, _10{})); test_complement(layout); } { auto layout = make_layout(make_shape(make_shape(2,2), make_shape(2,2)), Stride,Stride<_8,_32>>{}); test_complement(layout); } }