remove redundant hardcoded packing configs in mixed dtype gemm (#1894)

Co-authored-by: Siyuan Fu <siyuanf@nvidia.com>
This commit is contained in:
Lain 2024-10-23 11:24:09 -07:00 committed by GitHub
parent 12626bcfe4
commit be692b48b0
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -1291,24 +1291,6 @@ private:
return Int<cute::gcd(Cosize, 32 / cute::min(sizeof_bits_v<SrcType>, sizeof_bits_v<DstType>))>{};
}
};
template <int Cosize> struct select_packing<cutlass::float_e4m3_t, cutlass::bfloat16_t, Cosize> {
static constexpr auto value() { return Int<cute::gcd(Cosize, 2)>{}; }
};
template <int Cosize> struct select_packing<cutlass::float_e5m2_t, cutlass::bfloat16_t, Cosize> {
static constexpr auto value() { return Int<cute::gcd(Cosize, 2)>{}; }
};
template <int Cosize> struct select_packing<cutlass::float_e4m3_t, cutlass::half_t, Cosize> {
static constexpr auto value() { return Int<cute::gcd(Cosize, 2)>{}; }
};
template <int Cosize> struct select_packing<cutlass::float_e5m2_t, cutlass::half_t, Cosize> {
static constexpr auto value() { return Int<cute::gcd(Cosize, 2)>{}; }
};
template <int Cosize> struct select_packing<cutlass::int4b_t, cutlass::bfloat16_t, Cosize> {
static constexpr auto value() { return Int<cute::gcd(Cosize, 4)>{}; }
};
template <int Cosize> struct select_packing<cutlass::int4b_t, cutlass::half_t, Cosize> {
static constexpr auto value() { return Int<cute::gcd(Cosize, 4)>{}; }
};
CUTLASS_DEVICE
static uint32_t to_reg(Array<cutlass::int4b_t, 4> const& source) {