Parameters object constructable on the host.
#include <gemm_traits.h>
|
template<typename GemmDesc_ > |
CUTLASS_HOST_DEVICE int | initialize (GemmDesc_ const &desc) |
| Initialize the parameters. More...
|
|
CUTLASS_HOST_DEVICE int | initialize (Index m, Index n, Index k, typename Epilogue::Scalar alpha, ScalarA const *d_a, Index lda, ScalarB const *d_b, Index ldb, typename Epilogue::Scalar beta, ScalarC const *d_c, Index ldc, ScalarD *d_d, Index ldd) |
| Helper to construct GEMM params using a BLAS-like API. More...
|
|
CUTLASS_HOST_DEVICE int | initialize (Index m, Index n, Index k, typename Epilogue::Scalar alpha, ScalarA const *d_a, Index lda, long long int batch_stride_A, ScalarB const *d_b, Index ldb, long long int batch_stride_B, typename Epilogue::Scalar beta, ScalarC const *d_c, Index ldc, long long int batch_stride_C, ScalarD *d_d, Index ldd, long long int batch_stride_D, Index batch_count) |
| Helper to construct batched GEMM params. More...
|
|
CUTLASS_HOST_DEVICE | KernelLaunchConfiguration (dim3 _grid=dim3(1, 1, 1), dim3 _block=dim3(1, 1, 1), size_t _dynamic_smem=0) |
| Constructs a KernelLaunchConfiguration object. More...
|
|
◆ initialize() [1/3]
template<typename GemmConfig_, typename GlobalLoadStreamA_, typename GlobalLoadStreamB_, typename SharedLoadStreamA_, typename SharedLoadStreamB_, typename Epilogue_, typename BlockSwizzle_ = IdentityBlockSwizzle, typename Index_ = int, typename ClearAccumulators_ = ClearAccumulators<typename GemmConfig_::Accumulators::Element>>
template<typename GemmDesc_ >
CUTLASS_HOST_DEVICE int cutlass::gemm::GemmTraits< GemmConfig_, GlobalLoadStreamA_, GlobalLoadStreamB_, SharedLoadStreamA_, SharedLoadStreamB_, Epilogue_, BlockSwizzle_, Index_, ClearAccumulators_ >::Params::initialize |
( |
GemmDesc_ const & |
desc | ) |
|
|
inline |
◆ initialize() [2/3]
template<typename GemmConfig_, typename GlobalLoadStreamA_, typename GlobalLoadStreamB_, typename SharedLoadStreamA_, typename SharedLoadStreamB_, typename Epilogue_, typename BlockSwizzle_ = IdentityBlockSwizzle, typename Index_ = int, typename ClearAccumulators_ = ClearAccumulators<typename GemmConfig_::Accumulators::Element>>
CUTLASS_HOST_DEVICE int cutlass::gemm::GemmTraits< GemmConfig_, GlobalLoadStreamA_, GlobalLoadStreamB_, SharedLoadStreamA_, SharedLoadStreamB_, Epilogue_, BlockSwizzle_, Index_, ClearAccumulators_ >::Params::initialize |
( |
Index |
m, |
|
|
Index |
n, |
|
|
Index |
k, |
|
|
typename Epilogue::Scalar |
alpha, |
|
|
ScalarA const * |
d_a, |
|
|
Index |
lda, |
|
|
ScalarB const * |
d_b, |
|
|
Index |
ldb, |
|
|
typename Epilogue::Scalar |
beta, |
|
|
ScalarC const * |
d_c, |
|
|
Index |
ldc, |
|
|
ScalarD * |
d_d, |
|
|
Index |
ldd |
|
) |
| |
|
inline |
◆ initialize() [3/3]
template<typename GemmConfig_, typename GlobalLoadStreamA_, typename GlobalLoadStreamB_, typename SharedLoadStreamA_, typename SharedLoadStreamB_, typename Epilogue_, typename BlockSwizzle_ = IdentityBlockSwizzle, typename Index_ = int, typename ClearAccumulators_ = ClearAccumulators<typename GemmConfig_::Accumulators::Element>>
CUTLASS_HOST_DEVICE int cutlass::gemm::GemmTraits< GemmConfig_, GlobalLoadStreamA_, GlobalLoadStreamB_, SharedLoadStreamA_, SharedLoadStreamB_, Epilogue_, BlockSwizzle_, Index_, ClearAccumulators_ >::Params::initialize |
( |
Index |
m, |
|
|
Index |
n, |
|
|
Index |
k, |
|
|
typename Epilogue::Scalar |
alpha, |
|
|
ScalarA const * |
d_a, |
|
|
Index |
lda, |
|
|
long long int |
batch_stride_A, |
|
|
ScalarB const * |
d_b, |
|
|
Index |
ldb, |
|
|
long long int |
batch_stride_B, |
|
|
typename Epilogue::Scalar |
beta, |
|
|
ScalarC const * |
d_c, |
|
|
Index |
ldc, |
|
|
long long int |
batch_stride_C, |
|
|
ScalarD * |
d_d, |
|
|
Index |
ldd, |
|
|
long long int |
batch_stride_D, |
|
|
Index |
batch_count |
|
) |
| |
|
inline |
◆ epilogue
template<typename GemmConfig_, typename GlobalLoadStreamA_, typename GlobalLoadStreamB_, typename SharedLoadStreamA_, typename SharedLoadStreamB_, typename Epilogue_, typename BlockSwizzle_ = IdentityBlockSwizzle, typename Index_ = int, typename ClearAccumulators_ = ClearAccumulators<typename GemmConfig_::Accumulators::Element>>
Epilogue::Params cutlass::gemm::GemmTraits< GemmConfig_, GlobalLoadStreamA_, GlobalLoadStreamB_, SharedLoadStreamA_, SharedLoadStreamB_, Epilogue_, BlockSwizzle_, Index_, ClearAccumulators_ >::Params::epilogue |
◆ global_to_shared_stream
template<typename GemmConfig_, typename GlobalLoadStreamA_, typename GlobalLoadStreamB_, typename SharedLoadStreamA_, typename SharedLoadStreamB_, typename Epilogue_, typename BlockSwizzle_ = IdentityBlockSwizzle, typename Index_ = int, typename ClearAccumulators_ = ClearAccumulators<typename GemmConfig_::Accumulators::Element>>
◆ problem_size
template<typename GemmConfig_, typename GlobalLoadStreamA_, typename GlobalLoadStreamB_, typename SharedLoadStreamA_, typename SharedLoadStreamB_, typename Epilogue_, typename BlockSwizzle_ = IdentityBlockSwizzle, typename Index_ = int, typename ClearAccumulators_ = ClearAccumulators<typename GemmConfig_::Accumulators::Element>>
GemmCoord cutlass::gemm::GemmTraits< GemmConfig_, GlobalLoadStreamA_, GlobalLoadStreamB_, SharedLoadStreamA_, SharedLoadStreamB_, Epilogue_, BlockSwizzle_, Index_, ClearAccumulators_ >::Params::problem_size |
◆ shared_stream
template<typename GemmConfig_, typename GlobalLoadStreamA_, typename GlobalLoadStreamB_, typename SharedLoadStreamA_, typename SharedLoadStreamB_, typename Epilogue_, typename BlockSwizzle_ = IdentityBlockSwizzle, typename Index_ = int, typename ClearAccumulators_ = ClearAccumulators<typename GemmConfig_::Accumulators::Element>>
The documentation for this struct was generated from the following file: