cutlass/docs/search/variables_b.js
Andrew Kerr fb335f6a5f
CUTLASS 2.0 (#62)
CUTLASS 2.0

Substantially refactored for

- Better performance, particularly for native Turing Tensor Cores
- Robust and durable templates spanning the design space
- Encapsulated functionality embodying modern C++11 programming techniques
- Optimized containers and data types for efficient, generic, portable device code

Updates to:
- Quick start guide
- Documentation
- Utilities
- CUTLASS Profiler

Native Turing Tensor Cores
- Efficient GEMM kernels targeting Turing Tensor Cores
- Mixed-precision floating point, 8-bit integer, 4-bit integer, and binarized operands

Coverage of existing CUTLASS functionality:
- GEMM kernels targeting CUDA and Tensor Cores in NVIDIA GPUs
- Volta Tensor Cores through native mma.sync and through WMMA API
- Optimizations such as parallel reductions, threadblock rasterization, and intra-threadblock reductions
- Batched GEMM operations
- Complex-valued GEMMs

Note: this commit and all that follow require a host compiler supporting C++11 or greater.
2019-11-19 16:55:34 -08:00

15 lines
3.5 KiB
JavaScript

/*
 * Search index table for identifiers starting with "m".
 *
 * NOTE(review): this looks like generated documentation-search output
 * (Doxygen-style); prefer regenerating the docs over hand-editing.
 *
 * Each entry has the shape:
 *   [ searchKey, [ displayName, [url, flag, scope], ... ] ]
 *
 *   searchKey   - lower-cased identifier with "_" written as "_5f"
 *                 (e.g. 'main_5floop' for 'main_loop').
 *   displayName - the identifier as spelled in the C++ sources.
 *   url         - relative link to the documentation page and anchor.
 *   flag        - always 1 in this table; its meaning is defined by the
 *                 consuming search script, not visible here.
 *   scope       - fully qualified owner of the member.
 *
 * Kept as `var` on purpose: the table is presumably read as a global by the
 * search script that loads this file (TODO confirm against the consumer).
 */
var searchData = [
  [
    'main_5floop',
    [
      'main_loop',
      ['../unioncutlass_1_1gemm_1_1kernel_1_1Gemm_1_1SharedStorage.html#a25ca6f379b42d97b73de07473e2fdf02', 1, 'cutlass::gemm::kernel::Gemm::SharedStorage::main_loop()'],
      ['../unioncutlass_1_1gemm_1_1kernel_1_1GemmBatched_1_1SharedStorage.html#ae9f9d72c08cbf031961d95dca828d573', 1, 'cutlass::gemm::kernel::GemmBatched::SharedStorage::main_loop()'],
      ['../unioncutlass_1_1gemm_1_1kernel_1_1GemmSplitKParallel_1_1SharedStorage.html#a9a4c11bb49a8cadae9cb2c17c92bf6db', 1, 'cutlass::gemm::kernel::GemmSplitKParallel::SharedStorage::main_loop()']
    ]
  ],
  [
    'math_5finstruction',
    [
      'math_instruction',
      ['../structcutlass_1_1library_1_1TileDescription.html#aad96c46afa29cb6c02f8e0737eeaf963', 1, 'cutlass::library::TileDescription']
    ]
  ],
  [
    'max',
    [
      'max',
      ['../structcutlass_1_1Distribution.html#a824641fd3addfa360999614970adfac0', 1, 'cutlass::Distribution']
    ]
  ],
  [
    'maximum_5fcompute_5fcapability',
    [
      'maximum_compute_capability',
      ['../structcutlass_1_1library_1_1TileDescription.html#a37f5925a2f04995091c56c034f4f2572', 1, 'cutlass::library::TileDescription']
    ]
  ],
  [
    'maxinreg',
    [
      'maxInReg',
      ['../structcutlass_1_1reduction_1_1BatchedReductionTraits.html#af11a3284195a24e580d2f379f179f05a', 1, 'cutlass::reduction::BatchedReductionTraits']
    ]
  ],
  [
    'maxoutreg',
    [
      'maxOutReg',
      ['../structcutlass_1_1reduction_1_1BatchedReductionTraits.html#ac28e31791c5888bbe7b04abe6376a422', 1, 'cutlass::reduction::BatchedReductionTraits']
    ]
  ],
  [
    'mean',
    [
      'mean',
      ['../structcutlass_1_1Distribution.html#a776df53c7ad1b7de983c9f9d17d7438c', 1, 'cutlass::Distribution::mean()'],
      ['../structcutlass_1_1reference_1_1device_1_1detail_1_1RandomGaussianFunc_1_1Params.html#a07d12eba25e8e2e9da03ce735b1b8113', 1, 'cutlass::reference::device::detail::RandomGaussianFunc::Params::mean()'],
      ['../structcutlass_1_1reference_1_1host_1_1detail_1_1RandomGaussianFunc.html#a5da7c7b953aa178bb356ba8578245d89', 1, 'cutlass::reference::host::detail::RandomGaussianFunc::mean()'],
      ['../structcutlass_1_1reference_1_1host_1_1detail_1_1RandomGaussianFunc_3_01complex_3_01Element_01_4_01_4.html#ad8c60b0630a2867fd80a0d09a3cf63cd', 1, 'cutlass::reference::host::detail::RandomGaussianFunc< complex< Element > >::mean()']
    ]
  ],
  [
    'min',
    [
      'min',
      ['../structcutlass_1_1Distribution.html#a846430e3a21ed25c779fc6e714bc1bcc', 1, 'cutlass::Distribution::min()'],
      ['../structcutlass_1_1reference_1_1device_1_1detail_1_1RandomUniformFunc_1_1Params.html#a5f49e5175fa2fc3c3c7fb495fe6958db', 1, 'cutlass::reference::device::detail::RandomUniformFunc::Params::min()'],
      ['../structcutlass_1_1reference_1_1host_1_1detail_1_1RandomUniformFunc.html#ab3de08baeb9246f5472a1c8ec19c68fa', 1, 'cutlass::reference::host::detail::RandomUniformFunc::min()'],
      ['../structcutlass_1_1reference_1_1host_1_1detail_1_1RandomUniformFunc_3_01complex_3_01Element_01_4_01_4.html#a005299ae9f0e4533f6847a7f6ff9e6ad', 1, 'cutlass::reference::host::detail::RandomUniformFunc< complex< Element > >::min()']
    ]
  ],
  [
    'minimum_5fcompute_5fcapability',
    [
      'minimum_compute_capability',
      ['../structcutlass_1_1library_1_1TileDescription.html#a25557ce7220e284c095ef7f691b16fa0', 1, 'cutlass::library::TileDescription']
    ]
  ],
  [
    'mma',
    [
      'mma',
      ['../classcutlass_1_1gemm_1_1warp_1_1MmaTensorOp.html#a2eddba2b1644d2df5ade4de535b95ed7', 1, 'cutlass::gemm::warp::MmaTensorOp::mma()'],
      ['../classcutlass_1_1gemm_1_1warp_1_1MmaVoltaTensorOp.html#aa4837cb1fd3eac3713e99d0625f14842', 1, 'cutlass::gemm::warp::MmaVoltaTensorOp::mma()']
    ]
  ],
  [
    'msg',
    [
      'msg',
      ['../classcutlass_1_1cuda__exception.html#af748a69a87ad9863985f6a77260ba77a', 1, 'cutlass::cuda_exception']
    ]
  ]
];