cutlass/docs/search/variables_4.js
Andrew Kerr fb335f6a5f
CUTLASS 2.0 (#62)
CUTLASS 2.0

Substantially refactored for

- Better performance, particularly for native Turing Tensor Cores
- Robust and durable templates spanning the design space
- Encapsulated functionality embodying modern C++11 programming techniques
- Optimized containers and data types for efficient, generic, portable device code

Updates to:
- Quick start guide
- Documentation
- Utilities
- CUTLASS Profiler

Native Turing Tensor Cores
- Efficient GEMM kernels targeting Turing Tensor Cores
- Mixed-precision floating point, 8-bit integer, 4-bit integer, and binarized operands

Coverage of existing CUTLASS functionality:
- GEMM kernels targeting CUDA and Tensor Cores in NVIDIA GPUs
- Volta Tensor Cores through native mma.sync and through WMMA API
- Optimizations such as parallel reductions, threadblock rasterization, and intra-threadblock reductions
- Batched GEMM operations
- Complex-valued GEMMs

Note: this commit and all that follow require a host compiler supporting C++11 or greater.
2019-11-19 16:55:34 -08:00

9 lines
4.0 KiB
JavaScript

var searchData=
[
['element',['element',['../structcutlass_1_1library_1_1TensorDescription.html#a79ef2d43932a8d540dfffab9de8336fa',1,'cutlass::library::TensorDescription']]],
['element_5faccumulator',['element_accumulator',['../structcutlass_1_1library_1_1MathInstructionDescription.html#ac2fa166c39589c08d76c06ee191eb86f',1,'cutlass::library::MathInstructionDescription']]],
['element_5fepilogue',['element_epilogue',['../structcutlass_1_1library_1_1GemmDescription.html#ac7315202cc067ec32d678f6606f11e23',1,'cutlass::library::GemmDescription']]],
['epilogue',['epilogue',['../structcutlass_1_1gemm_1_1device_1_1Gemm_1_1Arguments.html#a98c7946bf72f054b026bb6fd49175e90',1,'cutlass::gemm::device::Gemm::Arguments::epilogue()'],['../structcutlass_1_1gemm_1_1device_1_1Gemm_3_01ElementA___00_01LayoutA___00_01ElementB___00_01Layou1b211cc9c97c022d8fe10f2dd32c8709.html#a426f402c08be99849a4477a07f010a5e',1,'cutlass::gemm::device::Gemm< ElementA_, LayoutA_, ElementB_, LayoutB_, ElementC_, layout::ColumnMajor, ElementAccumulator_, OperatorClass_, ArchTag_, ThreadblockShape_, WarpShape_, InstructionShape_, EpilogueOutputOp_, ThreadblockSwizzle_, Stages, AlignmentA, AlignmentB, SplitKSerial, Operator_, IsBetaZero >::Arguments::epilogue()'],['../structcutlass_1_1gemm_1_1device_1_1GemmBatched_1_1Arguments.html#aea0c4cd59daee8d3b497be411beb9b3a',1,'cutlass::gemm::device::GemmBatched::Arguments::epilogue()'],['../structcutlass_1_1gemm_1_1device_1_1GemmBatched_3_01ElementA___00_01LayoutA___00_01ElementB___00_213d78696663f4231cd52c6a277c60e5.html#af9c2fa1e0cc0456197c2cc0840c89982',1,'cutlass::gemm::device::GemmBatched< ElementA_, LayoutA_, ElementB_, LayoutB_, ElementC_, layout::ColumnMajor, ElementAccumulator_, OperatorClass_, ArchTag_, ThreadblockShape_, WarpShape_, InstructionShape_, EpilogueOutputOp_, ThreadblockSwizzle_, Stages, AlignmentA, AlignmentB, Operator_ >::Arguments::epilogue()'],['../structcutlass_1_1gemm_1_1device_1_1GemmComplex_1_1Arguments.html#a42ba311ce71d63f836eecc05b3da754f',1,'cutlass::gemm::device::GemmComplex::Arguments::epilogue()'],['../structcutlass_1_1gemm_1_1device_1_1GemmComplex_3_01ElementA___00_01LayoutA___00_01ElementB___00_a3923967cafb5cb9774c320dc24baa77.html#ad1f435bf8b7003afad9b803adf9fcb89',1,'cutlass::gemm::device::GemmComplex< ElementA_, LayoutA_, ElementB_, LayoutB_, ElementC_, layout::ColumnMajor, ElementAccumulator_, OperatorClass_, ArchTag_, ThreadblockShape_, WarpShape_, InstructionShape_, EpilogueOutputOp_, ThreadblockSwizzle_, Stages, TransformA, TransformB, SplitKSerial >::Arguments::epilogue()'],['../structcutlass_1_1gemm_1_1device_1_1GemmSplitKParallel_1_1Arguments.html#a92fb61dbfc8ca622f852cc1673fa1066',1,'cutlass::gemm::device::GemmSplitKParallel::Arguments::epilogue()'],['../structcutlass_1_1gemm_1_1device_1_1GemmSplitKParallel_3_01ElementA___00_01LayoutA___00_01Elementafcb1aeaf2035a7ac769d7acc233423b.html#a04818e67f94c5440ac6c367798e17fc2',1,'cutlass::gemm::device::GemmSplitKParallel< ElementA_, LayoutA_, ElementB_, LayoutB_, ElementC_, layout::ColumnMajor, ElementAccumulator_, OperatorClass_, ArchTag_, ThreadblockShape_, WarpShape_, InstructionShape_, EpilogueOutputOp_, ConvertScaledOp_, ReductionOp_, ThreadblockSwizzle_, Stages, kAlignmentA, kAlignmentB, Operator_ >::Arguments::epilogue()'],['../unioncutlass_1_1gemm_1_1kernel_1_1Gemm_1_1SharedStorage.html#aeed9542ff5c448269160ceb51fe2cf2b',1,'cutlass::gemm::kernel::Gemm::SharedStorage::epilogue()'],['../structcutlass_1_1gemm_1_1kernel_1_1GemmBatched_1_1Params.html#aa9de86f045ae89ecf844c4397e9e202c',1,'cutlass::gemm::kernel::GemmBatched::Params::epilogue()'],['../unioncutlass_1_1gemm_1_1kernel_1_1GemmBatched_1_1SharedStorage.html#a12326ac5fd0a306b62aa74ab4e10fd0d',1,'cutlass::gemm::kernel::GemmBatched::SharedStorage::epilogue()'],['../unioncutlass_1_1gemm_1_1kernel_1_1GemmSplitKParallel_1_1SharedStorage.html#a36820192d060123d2dd6b1475a6fd8dc',1,'cutlass::gemm::kernel::GemmSplitKParallel::SharedStorage::epilogue()']]],
['err',['err',['../classcutlass_1_1cuda__exception.html#a1166c2a5331dbf394abd5309b4d1377a',1,'cutlass::cuda_exception']]]
];