cutlass/docs/search/functions_d.js
Andrew Kerr fb335f6a5f
CUTLASS 2.0 (#62)
CUTLASS 2.0

Substantially refactored for

- Better performance, particularly for native Turing Tensor Cores
- Robust and durable templates spanning the design space
- Encapsulated functionality embodying modern C++11 programming techniques
- Optimized containers and data types for efficient, generic, portable device code

Updates to:
- Quick start guide
- Documentation
- Utilities
- CUTLASS Profiler

Native Turing Tensor Cores
- Efficient GEMM kernels targeting Turing Tensor Cores
- Mixed-precision floating point, 8-bit integer, 4-bit integer, and binarized operands

Coverage of existing CUTLASS functionality:
- GEMM kernels targeting CUDA and Tensor Cores in NVIDIA GPUs
- Volta Tensor Cores through native mma.sync and through WMMA API
- Optimizations such as parallel reductions, threadblock rasterization, and intra-threadblock reductions
- Batched GEMM operations
- Complex-valued GEMMs

Note: this commit and all that follow require a host compiler supporting C++11 or greater.
2019-11-19 16:55:34 -08:00

12 lines
2.0 KiB
JavaScript

// Search index table for symbols whose names begin with "n".
//
// Layout of each entry, as visible in the literal below:
//   [ key, [ displayName, [url, 1, qualifier], ... ] ]
//   - key:         lookup key; underscores appear encoded as "_5f"
//                  (e.g. 'non_5fconst_5fref' for 'non_const_ref').
//   - displayName: the plain symbol name.
//   - url:         relative link to an HTML page plus a "#anchor".
//   - qualifier:   the enclosing scope; when a name has several overloads,
//                  each overload gets its own triple and the qualifier
//                  carries the full signature instead.
//
// NOTE(review): the second element of every triple is the constant 1; its
// meaning is not determinable from this file -- confirm against the consumer.
// NOTE(review): this looks like generated documentation-tool output (Doxygen
// style file and anchor names) -- presumably it should be regenerated rather
// than edited by hand; confirm before changing.
var searchData=
[
['n',['n',['../structcutlass_1_1gemm_1_1GemmCoord.html#a1b29d2cb15360ad5499216859ad5436a',1,'cutlass::gemm::GemmCoord::n() const '],['../structcutlass_1_1gemm_1_1GemmCoord.html#a1327b9b4b9379df24df3d4b716952d11',1,'cutlass::gemm::GemmCoord::n()'],['../structcutlass_1_1gemm_1_1BatchedGemmCoord.html#a67c16efaba4f8e87fb226bac4ccb0ad8',1,'cutlass::gemm::BatchedGemmCoord::n() const '],['../structcutlass_1_1gemm_1_1BatchedGemmCoord.html#adff635f9c102e2648736dcd019c050b9',1,'cutlass::gemm::BatchedGemmCoord::n()'],['../structcutlass_1_1Tensor4DCoord.html#a2fa718218c21df006b71d9325f1ddb5a',1,'cutlass::Tensor4DCoord::n() const '],['../structcutlass_1_1Tensor4DCoord.html#a8f3d209442262c674f0bde0257ef1792',1,'cutlass::Tensor4DCoord::n()']]],
['nanh',['nanh',['../namespacecutlass.html#a6ded5de9d10cc550e9f39e6c5f6c971c',1,'cutlass']]],
['nk',['nk',['../structcutlass_1_1gemm_1_1GemmCoord.html#aa5e22c102d48dfd91c28e1c08ba687ea',1,'cutlass::gemm::GemmCoord']]],
['nm',['nm',['../structcutlass_1_1gemm_1_1GemmCoord.html#a1fc9861bfa5074513ab8f1cae7adab0d',1,'cutlass::gemm::GemmCoord']]],
['non_5fconst_5fref',['non_const_ref',['../classcutlass_1_1TensorRef.html#a66a9bab939e2d57c130bb76a5527f482',1,'cutlass::TensorRef']]],
['norm',['norm',['../namespacecutlass.html#a8d529517dadbc9ff697183cfb3e9a21f',1,'cutlass::norm(T const &z)'],['../namespacecutlass.html#ac6da2f4c8e675ef7c53cffeb04ccaff1',1,'cutlass::norm(int8_t const &z)'],['../namespacecutlass.html#a462c9f7d686d23a0a764a773c9af2f47',1,'cutlass::norm(complex< T > const &z)']]],
['norm_5faccumulate',['norm_accumulate',['../namespacecutlass.html#a326d3123e33cfd02c4e7ad519c56561f',1,'cutlass::norm_accumulate(T const &x, R const &accumulator)'],['../namespacecutlass.html#a47fce4c8a33798ec16ad04e8c8bc651d',1,'cutlass::norm_accumulate(complex< T > const &z, R const &accumulator)']]],
['num_5fnaked_5fargs',['num_naked_args',['../structcutlass_1_1CommandLine.html#a0bee40a3cc6078a08eec5d4ca4711f61',1,'cutlass::CommandLine']]]
];