
CUTLASS 2.0 Substantially refactored for - Better performance, particularly for native Turing Tensor Cores - Robust and durable templates spanning the design space - Encapsulated functionality embodying modern C++11 programming techniques - Optimized containers and data types for efficient, generic, portable device code Updates to: - Quick start guide - Documentation - Utilities - CUTLASS Profiler Native Turing Tensor Cores - Efficient GEMM kernels targeting Turing Tensor Cores - Mixed-precision floating point, 8-bit integer, 4-bit integer, and binarized operands Coverage of existing CUTLASS functionality: - GEMM kernels targeting CUDA and Tensor Cores in NVIDIA GPUs - Volta Tensor Cores through native mma.sync and through WMMA API - Optimizations such as parallel reductions, threadblock rasterization, and intra-threadblock reductions - Batched GEMM operations - Complex-valued GEMMs Note: this commit and all that follow require a host compiler supporting C++11 or greater.
67 lines
35 KiB
JavaScript
67 lines
35 KiB
JavaScript
var searchData=
|
|
[
|
|
['c',['c',['../structcutlass_1_1Tensor4DCoord.html#ab0f58e5f54b42534fca77a662c78c7ad',1,'cutlass::Tensor4DCoord::c() const '],['../structcutlass_1_1Tensor4DCoord.html#a494c8f38161b2d767f9497e751467699',1,'cutlass::Tensor4DCoord::c()']]],
|
|
['can_5fimplement',['can_implement',['../classcutlass_1_1gemm_1_1device_1_1Gemm.html#a40ad889da7ff420fd9f9000cd9f98e32',1,'cutlass::gemm::device::Gemm::can_implement()'],['../classcutlass_1_1gemm_1_1device_1_1Gemm_3_01ElementA___00_01LayoutA___00_01ElementB___00_01Layout4d0960ae6b1d1bf19e6239dbd002249c.html#a662bcbcb6164c803ab490c86e69b9ee1',1,'cutlass::gemm::device::Gemm< ElementA_, LayoutA_, ElementB_, LayoutB_, ElementC_, layout::ColumnMajor, ElementAccumulator_, OperatorClass_, ArchTag_, ThreadblockShape_, WarpShape_, InstructionShape_, EpilogueOutputOp_, ThreadblockSwizzle_, Stages, AlignmentA, AlignmentB, SplitKSerial, Operator_, IsBetaZero >::can_implement()'],['../classcutlass_1_1gemm_1_1device_1_1GemmBatched.html#acb4d53fbea4366349574091d68594558',1,'cutlass::gemm::device::GemmBatched::can_implement()'],['../classcutlass_1_1gemm_1_1device_1_1GemmBatched_3_01ElementA___00_01LayoutA___00_01ElementB___00_0c9bb6f4463ab6085e6008b5d5ad6abfd.html#abbd82c0f989a9d07e5e222db96386701',1,'cutlass::gemm::device::GemmBatched< ElementA_, LayoutA_, ElementB_, LayoutB_, ElementC_, layout::ColumnMajor, ElementAccumulator_, OperatorClass_, ArchTag_, ThreadblockShape_, WarpShape_, InstructionShape_, EpilogueOutputOp_, ThreadblockSwizzle_, Stages, AlignmentA, AlignmentB, Operator_ >::can_implement()'],['../classcutlass_1_1gemm_1_1device_1_1GemmComplex.html#aa94353c3aa13b38f0e859070edf61c6e',1,'cutlass::gemm::device::GemmComplex::can_implement()'],['../classcutlass_1_1gemm_1_1device_1_1GemmComplex_3_01ElementA___00_01LayoutA___00_01ElementB___00_07c56401b4df75709ae636675d9980a9a.html#adb94d2e6dd70b46bea6b5b433e14fea9',1,'cutlass::gemm::device::GemmComplex< ElementA_, LayoutA_, ElementB_, LayoutB_, ElementC_, layout::ColumnMajor, ElementAccumulator_, OperatorClass_, ArchTag_, ThreadblockShape_, WarpShape_, InstructionShape_, EpilogueOutputOp_, ThreadblockSwizzle_, Stages, TransformA, TransformB, SplitKSerial >::can_implement()'],['../classcutlass_1_1gemm_1_1device_1_1GemmSplitKParallel.html#a114b122602b425909f9be0df461353a4',1,'cutlass::gemm::device::GemmSplitKParallel::can_implement()'],['../classcutlass_1_1gemm_1_1device_1_1GemmSplitKParallel_3_01ElementA___00_01LayoutA___00_01ElementBbe7c1f7154ad5b5bf9d4d28301e2b457.html#a465591fbfde2a9aa6330d9adcbf82bd6',1,'cutlass::gemm::device::GemmSplitKParallel< ElementA_, LayoutA_, ElementB_, LayoutB_, ElementC_, layout::ColumnMajor, ElementAccumulator_, OperatorClass_, ArchTag_, ThreadblockShape_, WarpShape_, InstructionShape_, EpilogueOutputOp_, ConvertScaledOp_, ReductionOp_, ThreadblockSwizzle_, Stages, kAlignmentA, kAlignmentB, Operator_ >::can_implement()'],['../structcutlass_1_1gemm_1_1kernel_1_1Gemm.html#afa50b807bd445330e9f3a55d664008c9',1,'cutlass::gemm::kernel::Gemm::can_implement()'],['../classcutlass_1_1library_1_1Operation.html#a36bef483ad4a6c1d5bd426e134f16538',1,'cutlass::library::Operation::can_implement()']]],
|
|
['capacity',['capacity',['../classcutlass_1_1layout_1_1RowMajor.html#a89225f007689acef0e17f6990e32c56e',1,'cutlass::layout::RowMajor::capacity()'],['../classcutlass_1_1layout_1_1ColumnMajor.html#ae0ede39a3011be136c9033327935170d',1,'cutlass::layout::ColumnMajor::capacity()'],['../structcutlass_1_1layout_1_1RowMajorInterleaved.html#a37d81b341052fb816b7a5373efd76c52',1,'cutlass::layout::RowMajorInterleaved::capacity()'],['../structcutlass_1_1layout_1_1ColumnMajorInterleaved.html#a8233dbf6ef04491c79780bf27893f3e1',1,'cutlass::layout::ColumnMajorInterleaved::capacity()'],['../structcutlass_1_1layout_1_1ContiguousMatrix.html#af7266ef6f5ba58567103e8792cb0484b',1,'cutlass::layout::ContiguousMatrix::capacity()'],['../structcutlass_1_1layout_1_1ColumnMajorBlockLinear.html#afa68813c9946c24aa27eae56848a52e6',1,'cutlass::layout::ColumnMajorBlockLinear::capacity()'],['../structcutlass_1_1layout_1_1RowMajorBlockLinear.html#a4e39977f24228d8a2776ca1652336c3b',1,'cutlass::layout::RowMajorBlockLinear::capacity()'],['../structcutlass_1_1layout_1_1GeneralMatrix.html#a435e6e78b25296cd7ccaada3dcd4e16b',1,'cutlass::layout::GeneralMatrix::capacity()'],['../classcutlass_1_1layout_1_1PitchLinear.html#a3fb2016836e011e8c77a4b3fbb3e51d5',1,'cutlass::layout::PitchLinear::capacity()'],['../classcutlass_1_1layout_1_1TensorNHWC.html#a3bb3250d891e752789fa02d5c0cc0ede',1,'cutlass::layout::TensorNHWC::capacity()'],['../classcutlass_1_1layout_1_1TensorNCHW.html#a20dd56dacab1558db7253fb737704c51',1,'cutlass::layout::TensorNCHW::capacity()'],['../classcutlass_1_1layout_1_1TensorNCxHWx.html#a915e1193d4f9c1feb973ae1331687bf9',1,'cutlass::layout::TensorNCxHWx::capacity()'],['../classcutlass_1_1layout_1_1TensorCxRSKx.html#a27c2569d09991401630d7842c0c1ba67',1,'cutlass::layout::TensorCxRSKx::capacity()'],['../structcutlass_1_1layout_1_1VoltaTensorOpMultiplicandCongruous.html#af9149c2f7914f62232dcb3bd8f46384d',1,'cutlass::layout::VoltaTensorOpMultiplicandCongruous::capacity()'],['../structcutlass_1_1layout_1_1ColumnMajorVoltaTensorOpMultiplicandCongruous.html#ae616638f7e2dc315865b3693f71f52cd',1,'cutlass::layout::ColumnMajorVoltaTensorOpMultiplicandCongruous::capacity()'],['../structcutlass_1_1layout_1_1RowMajorVoltaTensorOpMultiplicandCongruous.html#a38fc7f3ffab51a56a76d297ecdc7edf7',1,'cutlass::layout::RowMajorVoltaTensorOpMultiplicandCongruous::capacity()'],['../structcutlass_1_1layout_1_1VoltaTensorOpMultiplicandBCongruous.html#aaafaf46f0d3bb10de607e999e28ca87a',1,'cutlass::layout::VoltaTensorOpMultiplicandBCongruous::capacity()'],['../structcutlass_1_1layout_1_1ColumnMajorVoltaTensorOpMultiplicandBCongruous.html#a9ac9d347fb65719c8a05295816120fec',1,'cutlass::layout::ColumnMajorVoltaTensorOpMultiplicandBCongruous::capacity()'],['../structcutlass_1_1layout_1_1RowMajorVoltaTensorOpMultiplicandBCongruous.html#a2a556452484f1d6958ec57d0a5b68dea',1,'cutlass::layout::RowMajorVoltaTensorOpMultiplicandBCongruous::capacity()'],['../structcutlass_1_1layout_1_1VoltaTensorOpMultiplicandCrosswise.html#a0c2e65352446d60ea1a917ff840245e8',1,'cutlass::layout::VoltaTensorOpMultiplicandCrosswise::capacity()'],['../structcutlass_1_1layout_1_1ColumnMajorVoltaTensorOpMultiplicandCrosswise.html#a1c709df04e3d4693707dc30b6c1f08f5',1,'cutlass::layout::ColumnMajorVoltaTensorOpMultiplicandCrosswise::capacity()'],['../structcutlass_1_1layout_1_1RowMajorVoltaTensorOpMultiplicandCrosswise.html#a0a6c5b20d5c84ace7d2440c03b42f29e',1,'cutlass::layout::RowMajorVoltaTensorOpMultiplicandCrosswise::capacity()'],['../structcutlass_1_1layout_1_1TensorOpMultiplicand.html#a9ef7a95265d1602eb5d050eb89ad8b6b',1,'cutlass::layout::TensorOpMultiplicand::capacity()'],['../structcutlass_1_1layout_1_1TensorOpMultiplicandCongruous.html#a016ea88480ec49f60b311b00e06dba54',1,'cutlass::layout::TensorOpMultiplicandCongruous::capacity()'],['../structcutlass_1_1layout_1_1TensorOpMultiplicandCongruous_3_0132_00_01Crosswise_01_4.html#a8580ab6b5c31b815c9ff4d146cbec442',1,'cutlass::layout::TensorOpMultiplicandCongruous< 32, Crosswise >::capacity()'],['../structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCongruous.html#a789b0744a97926b5447be3861f184122',1,'cutlass::layout::ColumnMajorTensorOpMultiplicandCongruous::capacity()'],['../structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCongruous.html#aa5e728fbc807f398363a43dafd0118f5',1,'cutlass::layout::RowMajorTensorOpMultiplicandCongruous::capacity()'],['../structcutlass_1_1layout_1_1TensorOpMultiplicandCrosswise.html#abf4bd0dac231dfa83fc109420371fe8e',1,'cutlass::layout::TensorOpMultiplicandCrosswise::capacity()'],['../structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCrosswise.html#afeba15c02217a7e06c3cb96c7bef2bd0',1,'cutlass::layout::ColumnMajorTensorOpMultiplicandCrosswise::capacity()'],['../structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCrosswise.html#a04e4211bb2e725d434371b2cf1de696e',1,'cutlass::layout::RowMajorTensorOpMultiplicandCrosswise::capacity()'],['../structcutlass_1_1layout_1_1TensorOpMultiplicandColumnMajorInterleaved.html#a68ec1121f75551e44ef28edc17763179',1,'cutlass::layout::TensorOpMultiplicandColumnMajorInterleaved::capacity()'],['../structcutlass_1_1layout_1_1TensorOpMultiplicandRowMajorInterleaved.html#a0df7088ef67f17f69fd72fb5d238fc3e',1,'cutlass::layout::TensorOpMultiplicandRowMajorInterleaved::capacity()'],['../classcutlass_1_1layout_1_1PackedVectorLayout.html#a20b384f56d697894a75c8f4693155320',1,'cutlass::layout::PackedVectorLayout::capacity()'],['../classcutlass_1_1IdentityTensorLayout.html#a3dc530520b5eb35bc57c75de7954b59f',1,'cutlass::IdentityTensorLayout::capacity()'],['../classcutlass_1_1TensorView.html#ad7c287afe582ff3681a8cd6e53d6a4f5',1,'cutlass::TensorView::capacity()'],['../classcutlass_1_1thread_1_1Matrix.html#a6c737c01701bb00f0d47ffdf847fcb6d',1,'cutlass::thread::Matrix::capacity()'],['../classcutlass_1_1HostTensor.html#aa6ea111e8fcba15c07f0cf679e1eec7f',1,'cutlass::HostTensor::capacity()']]],
|
|
['cast_5ffrom_5fdouble',['cast_from_double',['../namespacecutlass_1_1library.html#a5f25bb70b92aa865148c22d4cffcaa37',1,'cutlass::library']]],
|
|
['cast_5ffrom_5fint64',['cast_from_int64',['../namespacecutlass_1_1library.html#a0b8493aa442c2c23aa57234c4e928660',1,'cutlass::library']]],
|
|
['cast_5ffrom_5fuint64',['cast_from_uint64',['../namespacecutlass_1_1library.html#aa997284cf98e50d99e48516f91a96c08',1,'cutlass::library']]],
|
|
['cbegin',['cbegin',['../classcutlass_1_1Array_3_01T_00_01N_00_01true_01_4.html#a815d434e9da9715a115896b3f6e64608',1,'cutlass::Array< T, N, true >::cbegin()'],['../classcutlass_1_1Array_3_01T_00_01N_00_01false_01_4.html#a86a56cc907c8566068034ef8294cf7c2',1,'cutlass::Array< T, N, false >::cbegin()']]],
|
|
['cend',['cend',['../classcutlass_1_1Array_3_01T_00_01N_00_01true_01_4.html#a27e663ee5e22d4af436588a500a6cc0c',1,'cutlass::Array< T, N, true >::cend()'],['../classcutlass_1_1Array_3_01T_00_01N_00_01false_01_4.html#ae6106b72ee9035389afb313801561b16',1,'cutlass::Array< T, N, false >::cend()']]],
|
|
['check',['check',['../structcutlass_1_1platform_1_1is__base__of__helper.html#a5bf08859497e304ca353699ad6ac332b',1,'cutlass::platform::is_base_of_helper::check(DerivedT *, T)'],['../structcutlass_1_1platform_1_1is__base__of__helper.html#ae8896817cabf297437b3a073e693ffd2',1,'cutlass::platform::is_base_of_helper::check(BaseT *, int)']]],
|
|
['check_5fcmd_5fline_5fflag',['check_cmd_line_flag',['../structcutlass_1_1CommandLine.html#a5a20785501f9ed3d4a57241b08399552',1,'cutlass::CommandLine']]],
|
|
['clamp',['clamp',['../structcutlass_1_1Coord.html#a40e145063833155c800b38f82cee7461',1,'cutlass::Coord']]],
|
|
['clear',['clear',['../classcutlass_1_1Array_3_01T_00_01N_00_01true_01_4.html#ae67b1d98a446384fc75a1c92474e719d',1,'cutlass::Array< T, N, true >::clear()'],['../classcutlass_1_1Array_3_01T_00_01N_00_01false_01_4.html#a5b84c4dc5257f31108a0598915f03f94',1,'cutlass::Array< T, N, false >::clear()'],['../structcutlass_1_1epilogue_1_1threadblock_1_1PredicatedTileIterator_1_1Mask.html#a0fcbcea35583d096e4154209237ba217',1,'cutlass::epilogue::threadblock::PredicatedTileIterator::Mask::clear()'],['../structcutlass_1_1epilogue_1_1threadblock_1_1InterleavedPredicatedTileIterator_1_1Mask.html#aed4717037e76148efbb7bb68d6c4e509',1,'cutlass::epilogue::threadblock::InterleavedPredicatedTileIterator::Mask::clear()'],['../structcutlass_1_1PredicateVector.html#a51d9239e76ec040819333022fcecdb55',1,'cutlass::PredicateVector::clear()']]],
|
|
['clear_5fmask',['clear_mask',['../classcutlass_1_1epilogue_1_1threadblock_1_1PredicatedTileIterator.html#a17a6ccbe829782c27e49f47922fce84a',1,'cutlass::epilogue::threadblock::PredicatedTileIterator::clear_mask()'],['../classcutlass_1_1epilogue_1_1threadblock_1_1InterleavedPredicatedTileIterator.html#ab478d83e7b15b9eca8f3f281072cba38',1,'cutlass::epilogue::threadblock::InterleavedPredicatedTileIterator::clear_mask()'],['../classcutlass_1_1transform_1_1threadblock_1_1PredicatedTileAccessIterator_3_01Shape___00_01Elemen784a0e9da3f55064c47e5613791f51f7.html#ac0b90ae65b6bd987bfb0a0fca4912533',1,'cutlass::transform::threadblock::PredicatedTileAccessIterator< Shape_, Element_, layout::PitchLinear, AdvanceRank, ThreadMap_, AccessType_ >::clear_mask()'],['../classcutlass_1_1transform_1_1threadblock_1_1PredicatedTileAccessIterator_3_01Shape___00_01Elemen89c687c583745a73cb485041911a4c4e.html#ae78b23bb3d11b1ad5fe615a4bcb2d15d',1,'cutlass::transform::threadblock::PredicatedTileAccessIterator< Shape_, Element_, layout::ColumnMajor, AdvanceRank, ThreadMap_, AccessType_ >::clear_mask()'],['../classcutlass_1_1transform_1_1threadblock_1_1PredicatedTileAccessIterator_3_01Shape___00_01Elemen9838736ad62fae54213fbaf722a989ab.html#ad52c785f2d0e7bfc86633571f5e4a926',1,'cutlass::transform::threadblock::PredicatedTileAccessIterator< Shape_, Element_, layout::RowMajor, AdvanceRank, ThreadMap_, AccessType_ >::clear_mask()'],['../classcutlass_1_1transform_1_1threadblock_1_1PredicatedTileAccessIterator_3_01Shape___00_01Elemenab63a1e105bf37f6371516cb9e2c5a7a.html#a2fd2b595bf69e2f4d1c9af852acdd018',1,'cutlass::transform::threadblock::PredicatedTileAccessIterator< Shape_, Element_, layout::ColumnMajorInterleaved< InterleavedK >, AdvanceRank, ThreadMap_, AccessType_ >::clear_mask()'],['../classcutlass_1_1transform_1_1threadblock_1_1PredicatedTileAccessIterator_3_01Shape___00_01Elemen809793e785fb4211888c6b4e5dcfcb39.html#acd9df23ddc440195ba7a648db3c55f3e',1,'cutlass::transform::threadblock::PredicatedTileAccessIterator< Shape_, Element_, layout::RowMajorInterleaved< InterleavedK >, AdvanceRank, ThreadMap_, AccessType_ >::clear_mask()'],['../classcutlass_1_1transform_1_1threadblock_1_1PredicatedTileAccessIterator2dThreadTile_3_01Shape__1790abaa54a01f277d75766d5882fec8.html#a5ad8047c30a84a55fa1c21c911d148d8',1,'cutlass::transform::threadblock::PredicatedTileAccessIterator2dThreadTile< Shape_, Element_, layout::PitchLinear, AdvanceRank, ThreadMap_, AccessType_ >::clear_mask()'],['../classcutlass_1_1transform_1_1threadblock_1_1PredicatedTileAccessIterator2dThreadTile_3_01Shape__da632779aba661c0f4cfaaa78126b771.html#a887454d8c430984ceffd4859903b4898',1,'cutlass::transform::threadblock::PredicatedTileAccessIterator2dThreadTile< Shape_, Element_, layout::ColumnMajor, AdvanceRank, ThreadMap_, AccessType_ >::clear_mask()'],['../classcutlass_1_1transform_1_1threadblock_1_1PredicatedTileAccessIterator2dThreadTile_3_01Shape__7327fa15996bcb8502cdfcc192350fe1.html#abc85cc801d0e933dfb026a9c266674e2',1,'cutlass::transform::threadblock::PredicatedTileAccessIterator2dThreadTile< Shape_, Element_, layout::RowMajor, AdvanceRank, ThreadMap_, AccessType_ >::clear_mask()'],['../classcutlass_1_1transform_1_1threadblock_1_1PredicatedTileIterator_3_01Shape___00_01Element___00e7c2c404e7aedfe60ad56bb5571306a1.html#afd3e189a510aef0ddceb6f0ceb519d88',1,'cutlass::transform::threadblock::PredicatedTileIterator< Shape_, Element_, layout::PitchLinear, AdvanceRank, ThreadMap_, AccessSize >::clear_mask()'],['../classcutlass_1_1transform_1_1threadblock_1_1PredicatedTileIterator_3_01Shape___00_01Element___0068b3e874b5d93d11f0fa902c7f1d11d9.html#ac31418e71cb8ed71b7ebf51ab7028713',1,'cutlass::transform::threadblock::PredicatedTileIterator< Shape_, Element_, layout::ColumnMajor, AdvanceRank, ThreadMap_, AccessSize >::clear_mask()'],['../classcutlass_1_1transform_1_1threadblock_1_1PredicatedTileIterator_3_01Shape___00_01Element___0041ea81994f8af0d4d071fdb9e66b5ff0.html#a38b1509afcb20c5474ea5998f85c6507',1,'cutlass::transform::threadblock::PredicatedTileIterator< Shape_, Element_, layout::RowMajor, AdvanceRank, ThreadMap_, AccessSize >::clear_mask()'],['../classcutlass_1_1transform_1_1threadblock_1_1PredicatedTileIterator_3_01Shape___00_01Element___00f6b3a9dfab5e7c72d5233f7e5e6e3b9b.html#a73c78020399019ab244400b48f43d7cc',1,'cutlass::transform::threadblock::PredicatedTileIterator< Shape_, Element_, layout::ColumnMajorInterleaved< InterleavedK >, AdvanceRank, ThreadMap_, AccessSize >::clear_mask()'],['../classcutlass_1_1transform_1_1threadblock_1_1PredicatedTileIterator_3_01Shape___00_01Element___00d670f969180a8d182dffb356ebcc957e.html#a40cdf0a9b56d2571c87f50d1abcfae73',1,'cutlass::transform::threadblock::PredicatedTileIterator< Shape_, Element_, layout::RowMajorInterleaved< InterleavedK >, AdvanceRank, ThreadMap_, AccessSize >::clear_mask()'],['../classcutlass_1_1transform_1_1threadblock_1_1PredicatedTileIterator2dThreadTile_3_01Shape___00_017a517f3c73efd795ab05059cc9b111e1.html#a24d17e4be377b870202dd8524047af8d',1,'cutlass::transform::threadblock::PredicatedTileIterator2dThreadTile< Shape_, Element_, layout::PitchLinear, AdvanceRank, ThreadMap_, Transpose_ >::clear_mask()'],['../classcutlass_1_1transform_1_1threadblock_1_1PredicatedTileIterator2dThreadTile_3_01Shape___00_0165b39a630d10785a3558406f9adb99b9.html#a16eb418826fc3bead16d7f15dccae29f',1,'cutlass::transform::threadblock::PredicatedTileIterator2dThreadTile< Shape_, Element_, layout::ColumnMajor, AdvanceRank, ThreadMap_, Transpose_ >::clear_mask()'],['../classcutlass_1_1transform_1_1threadblock_1_1PredicatedTileIterator2dThreadTile_3_01Shape___00_013671177d6219bfeb0e1b4dc4c1b5bf11.html#a2778dc7d89b47e3fe9b1d3f9e67c9601',1,'cutlass::transform::threadblock::PredicatedTileIterator2dThreadTile< Shape_, Element_, layout::RowMajor, AdvanceRank, ThreadMap_, Transpose_ >::clear_mask()']]],
|
|
['clz',['clz',['../namespacecutlass.html#a6bc666acc9f0d7278a788975e226e005',1,'cutlass']]],
|
|
['column',['column',['../structcutlass_1_1MatrixCoord.html#afbdcc5ca5b91f11f29046667b0bfde7b',1,'cutlass::MatrixCoord::column() const '],['../structcutlass_1_1MatrixCoord.html#a093f5e568a81c6464dbf4aef996c32ba',1,'cutlass::MatrixCoord::column()']]],
|
|
['columnmajor',['ColumnMajor',['../classcutlass_1_1layout_1_1ColumnMajor.html#adc69d6cd2cf938d1ab41c4f2ba0589a4',1,'cutlass::layout::ColumnMajor::ColumnMajor(Index ldm=0)'],['../classcutlass_1_1layout_1_1ColumnMajor.html#a0a9383ad9de01697e2df975c3a3e6ab8',1,'cutlass::layout::ColumnMajor::ColumnMajor(Stride stride)']]],
|
|
['columnmajorblocklinear',['ColumnMajorBlockLinear',['../structcutlass_1_1layout_1_1ColumnMajorBlockLinear.html#a740b33237fd49dee4692946811e203ba',1,'cutlass::layout::ColumnMajorBlockLinear']]],
|
|
['columnmajorinterleaved',['ColumnMajorInterleaved',['../structcutlass_1_1layout_1_1ColumnMajorInterleaved.html#acd4d70f17b74ebe3e55ea0027bac5899',1,'cutlass::layout::ColumnMajorInterleaved::ColumnMajorInterleaved(Index ldm=0)'],['../structcutlass_1_1layout_1_1ColumnMajorInterleaved.html#a2d4a85bbfbb919349e6fd2b859a0a461',1,'cutlass::layout::ColumnMajorInterleaved::ColumnMajorInterleaved(Stride stride)']]],
|
|
['columnmajortensoropmultiplicandcongruous',['ColumnMajorTensorOpMultiplicandCongruous',['../structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCongruous.html#a910ff464fc55a153bf3e54cb7b816ccb',1,'cutlass::layout::ColumnMajorTensorOpMultiplicandCongruous::ColumnMajorTensorOpMultiplicandCongruous(Index ldm=0)'],['../structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCongruous.html#a588582ed7496bb9f6cfbb7f79873affa',1,'cutlass::layout::ColumnMajorTensorOpMultiplicandCongruous::ColumnMajorTensorOpMultiplicandCongruous(Stride stride)']]],
|
|
['columnmajortensoropmultiplicandcrosswise',['ColumnMajorTensorOpMultiplicandCrosswise',['../structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCrosswise.html#ae9010e219ceb098de21d2673a9112b50',1,'cutlass::layout::ColumnMajorTensorOpMultiplicandCrosswise::ColumnMajorTensorOpMultiplicandCrosswise(Index ldm=0)'],['../structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCrosswise.html#a77befaca4f7609243842a4e54d50d010',1,'cutlass::layout::ColumnMajorTensorOpMultiplicandCrosswise::ColumnMajorTensorOpMultiplicandCrosswise(Stride stride)']]],
|
|
['columnmajorvoltatensoropmultiplicandbcongruous',['ColumnMajorVoltaTensorOpMultiplicandBCongruous',['../structcutlass_1_1layout_1_1ColumnMajorVoltaTensorOpMultiplicandBCongruous.html#ab42f59c4fb58814ce2b5617b12e3faf0',1,'cutlass::layout::ColumnMajorVoltaTensorOpMultiplicandBCongruous::ColumnMajorVoltaTensorOpMultiplicandBCongruous(Index ldm=0)'],['../structcutlass_1_1layout_1_1ColumnMajorVoltaTensorOpMultiplicandBCongruous.html#a80099cf16729a8b553677fc70bea81bc',1,'cutlass::layout::ColumnMajorVoltaTensorOpMultiplicandBCongruous::ColumnMajorVoltaTensorOpMultiplicandBCongruous(Stride stride)']]],
|
|
['columnmajorvoltatensoropmultiplicandcongruous',['ColumnMajorVoltaTensorOpMultiplicandCongruous',['../structcutlass_1_1layout_1_1ColumnMajorVoltaTensorOpMultiplicandCongruous.html#a9019c397159688cd2bafe55967ee7f36',1,'cutlass::layout::ColumnMajorVoltaTensorOpMultiplicandCongruous::ColumnMajorVoltaTensorOpMultiplicandCongruous(Index ldm=0)'],['../structcutlass_1_1layout_1_1ColumnMajorVoltaTensorOpMultiplicandCongruous.html#a963c8058ab8ef1a5d21403bd1dc27277',1,'cutlass::layout::ColumnMajorVoltaTensorOpMultiplicandCongruous::ColumnMajorVoltaTensorOpMultiplicandCongruous(Stride stride)']]],
|
|
['columnmajorvoltatensoropmultiplicandcrosswise',['ColumnMajorVoltaTensorOpMultiplicandCrosswise',['../structcutlass_1_1layout_1_1ColumnMajorVoltaTensorOpMultiplicandCrosswise.html#af2456911e4cfca021d50ec16ca1d7505',1,'cutlass::layout::ColumnMajorVoltaTensorOpMultiplicandCrosswise::ColumnMajorVoltaTensorOpMultiplicandCrosswise(Index ldm=0)'],['../structcutlass_1_1layout_1_1ColumnMajorVoltaTensorOpMultiplicandCrosswise.html#a7c839af8ec4dda7a6114d49daec52728',1,'cutlass::layout::ColumnMajorVoltaTensorOpMultiplicandCrosswise::ColumnMajorVoltaTensorOpMultiplicandCrosswise(Stride stride)']]],
|
|
['commandline',['CommandLine',['../structcutlass_1_1CommandLine.html#a7156975dc884e8b58b91c710495fc79d',1,'cutlass::CommandLine']]],
|
|
['complex',['complex',['../classcutlass_1_1complex.html#a9050cd0f48c7a7b718ea9223299b3a82',1,'cutlass::complex::complex(T r=T(0))'],['../classcutlass_1_1complex.html#a0eae629b6e4bf0be4a8d259fcc59c842',1,'cutlass::complex::complex(T r, T i)'],['../classcutlass_1_1complex.html#a2a853405a46cc6ed36185a80bd2aae98',1,'cutlass::complex::complex(complex< A > const &z)'],['../classcutlass_1_1complex.html#a8681bee9979b43f21d154e17725cb630',1,'cutlass::complex::complex(cuFloatComplex const &z)'],['../classcutlass_1_1complex.html#ada1e58813aa2d901d44237f5f9fb37db',1,'cutlass::complex::complex(cuDoubleComplex const &z)']]],
|
|
['compute_5fgemm',['compute_gemm',['../namespacecutlass_1_1reference_1_1device.html#a4b872e5b16985b2cf31530a9090a8423',1,'cutlass::reference::device::compute_gemm(gemm::GemmCoord problem_size, ScalarType alpha, TensorRef< ElementA, LayoutA > tensor_a, TensorRef< ElementB, LayoutB > tensor_b, ScalarType beta, TensorRef< ElementC, LayoutC > tensor_c, TensorRef< ElementC, LayoutC > tensor_d, AccumulatorType initial_accum)'],['../namespacecutlass_1_1reference_1_1device.html#aa1b04f721cb13fb3f110acf6b29dc53b',1,'cutlass::reference::device::compute_gemm(gemm::GemmCoord problem_size, ScalarType alpha, TensorRef< ElementA, LayoutA > tensor_a, TensorRef< ElementB, LayoutB > tensor_b, ScalarType beta, TensorRef< ElementC, LayoutC > tensor_c, AccumulatorType initial_accum)'],['../namespacecutlass_1_1reference_1_1host.html#a300d68abd082150020768c0a94044a34',1,'cutlass::reference::host::compute_gemm(gemm::GemmCoord problem_size, ScalarType alpha, TensorRef< ElementA, LayoutA > tensor_a, TensorRef< ElementB, LayoutB > tensor_b, ScalarType beta, TensorRef< ElementC, LayoutC > tensor_c, TensorRef< ElementC, LayoutC > tensor_d, ComputeType initial_accum)'],['../namespacecutlass_1_1reference_1_1host.html#aa75c5933390f3960666e97b37c854877',1,'cutlass::reference::host::compute_gemm(gemm::GemmCoord problem_size, ScalarType alpha, TensorRef< ElementA, LayoutA > tensor_a, TensorRef< ElementB, LayoutB > tensor_b, ScalarType beta, TensorRef< ElementC, LayoutC > tensor_c, ComputeType initial_accum)']]],
|
|
['conj',['conj',['../namespacecutlass.html#adba9348e32642fa40c186b5ca6e5ba4e',1,'cutlass']]],
|
|
['const_5fbegin',['const_begin',['../structcutlass_1_1PredicateVector.html#a505db4b5fba1671ee8362c18e2ccce1b',1,'cutlass::PredicateVector']]],
|
|
['const_5fend',['const_end',['../structcutlass_1_1PredicateVector.html#a8017a90ffe8a8039fff56b6956739045',1,'cutlass::PredicateVector']]],
|
|
['const_5fiterator',['const_iterator',['../classcutlass_1_1Array_3_01T_00_01N_00_01true_01_4_1_1const__iterator.html#a40f18ab5962efa95ac4ae4f5140c5d7b',1,'cutlass::Array< T, N, true >::const_iterator::const_iterator()'],['../classcutlass_1_1Array_3_01T_00_01N_00_01true_01_4_1_1const__iterator.html#a56cb84bfcb97eeeae472f03fc203d759',1,'cutlass::Array< T, N, true >::const_iterator::const_iterator(T const *_ptr)'],['../classcutlass_1_1Array_3_01T_00_01N_00_01false_01_4_1_1const__iterator.html#a2baacc6de7180213621a2d6b2328ca7d',1,'cutlass::Array< T, N, false >::const_iterator::const_iterator()'],['../classcutlass_1_1Array_3_01T_00_01N_00_01false_01_4_1_1const__iterator.html#a273a0ea9cf66fac0787e90339fd49371',1,'cutlass::Array< T, N, false >::const_iterator::const_iterator(Storage const *ptr, int idx=0)']]],
|
|
['const_5fmax',['const_max',['../namespacecutlass.html#a072919006084ca52479a69cd10694448',1,'cutlass']]],
|
|
['const_5fmin',['const_min',['../namespacecutlass.html#a1676e17a7fea0ac40d9d239cbd3ce872',1,'cutlass']]],
|
|
['const_5fref',['const_ref',['../classcutlass_1_1TensorRef.html#a5c5c66a59e9759f11f832fb71f4234c2',1,'cutlass::TensorRef::const_ref()'],['../classcutlass_1_1TensorView.html#aef27ab5348a53539286057a0da8720fc',1,'cutlass::TensorView::const_ref()'],['../classcutlass_1_1thread_1_1Matrix.html#a850e9e43797c386ffbdec398d1c1b559',1,'cutlass::thread::Matrix::const_ref()']]],
|
|
['const_5freference',['const_reference',['../classcutlass_1_1Array_3_01T_00_01N_00_01false_01_4_1_1const__reference.html#abf1841f0ac863891efcf23bd5ac57847',1,'cutlass::Array< T, N, false >::const_reference::const_reference()'],['../classcutlass_1_1Array_3_01T_00_01N_00_01false_01_4_1_1const__reference.html#ac9e3b9e2f5797efbc47e3415aa204079',1,'cutlass::Array< T, N, false >::const_reference::const_reference(Storage const *ptr, int idx=0)']]],
|
|
['const_5freverse_5fiterator',['const_reverse_iterator',['../classcutlass_1_1Array_3_01T_00_01N_00_01true_01_4_1_1const__reverse__iterator.html#aa839335a821fad9841eb31560d7520a2',1,'cutlass::Array< T, N, true >::const_reverse_iterator::const_reverse_iterator()'],['../classcutlass_1_1Array_3_01T_00_01N_00_01true_01_4_1_1const__reverse__iterator.html#a6e2a9b7f836704d9d39ad42c74502a07',1,'cutlass::Array< T, N, true >::const_reverse_iterator::const_reverse_iterator(T const *_ptr)'],['../classcutlass_1_1Array_3_01T_00_01N_00_01false_01_4_1_1const__reverse__iterator.html#aae7705a26ea52ebd18d5f5809d816ee2',1,'cutlass::Array< T, N, false >::const_reverse_iterator::const_reverse_iterator()'],['../classcutlass_1_1Array_3_01T_00_01N_00_01false_01_4_1_1const__reverse__iterator.html#a4bef88847b70f6bca81dd46bd883373b',1,'cutlass::Array< T, N, false >::const_reverse_iterator::const_reverse_iterator(Storage const *ptr, int idx=0)']]],
|
|
['const_5fview',['const_view',['../classcutlass_1_1TensorView.html#ab7794e21b87340f8b73aeb4dca2cb80c',1,'cutlass::TensorView::const_view()'],['../classcutlass_1_1thread_1_1Matrix.html#a65a4c5ff99fd0a7dbee722c9e04fac35',1,'cutlass::thread::Matrix::const_view()']]],
|
|
['constiterator',['ConstIterator',['../classcutlass_1_1PredicateVector_1_1ConstIterator.html#a1216aab9c567ec0d4232019008ef3ea7',1,'cutlass::PredicateVector::ConstIterator::ConstIterator(ConstIterator const &it)'],['../classcutlass_1_1PredicateVector_1_1ConstIterator.html#abb6749fd0f66f9442fa18fabbb3588e4',1,'cutlass::PredicateVector::ConstIterator::ConstIterator(PredicateVector const &vec, int _start=0)']]],
|
|
['constsubbytereference',['ConstSubbyteReference',['../classcutlass_1_1ConstSubbyteReference.html#aa00016fe6dafa323e9875be4287fbfe5',1,'cutlass::ConstSubbyteReference::ConstSubbyteReference()'],['../classcutlass_1_1ConstSubbyteReference.html#a158ae5a484751f274c083807b4a37868',1,'cutlass::ConstSubbyteReference::ConstSubbyteReference(Element const *ptr, int64_t offset)'],['../classcutlass_1_1ConstSubbyteReference.html#adfefff5e63632fcdc4f59e21dccea16d',1,'cutlass::ConstSubbyteReference::ConstSubbyteReference(Element *ptr=nullptr)']]],
|
|
['contains',['contains',['../classcutlass_1_1TensorView.html#a6a6a1f99d06abd8fb3f5a8e4e0fea25e',1,'cutlass::TensorView']]],
|
|
['contiguous',['contiguous',['../structcutlass_1_1layout_1_1PitchLinearCoord.html#adb31bc9b8cf49dfff64245b70a850834',1,'cutlass::layout::PitchLinearCoord::contiguous() const '],['../structcutlass_1_1layout_1_1PitchLinearCoord.html#a3d3c19009c7cf8991cb33f1ff8c8d494',1,'cutlass::layout::PitchLinearCoord::contiguous()']]],
|
|
['contiguousmatrix',['ContiguousMatrix',['../structcutlass_1_1layout_1_1ContiguousMatrix.html#a4515c6a78dadf99bf491137e6bb52451',1,'cutlass::layout::ContiguousMatrix']]],
|
|
['convert',['Convert',['../classcutlass_1_1epilogue_1_1thread_1_1Convert.html#ac7ec0a00e5863dc06f4d99477fd5c056',1,'cutlass::epilogue::thread::Convert::Convert()'],['../structcutlass_1_1half__t.html#a4c472ad52970df8b6f5c05beff66ff9f',1,'cutlass::half_t::convert(float const &flt)'],['../structcutlass_1_1half__t.html#a1cddd98cc0650a0fcc5ff1ea0cb08fcf',1,'cutlass::half_t::convert(int const &n)'],['../structcutlass_1_1half__t.html#a6af4af16ddbbfcefde206c29cac5c1ec',1,'cutlass::half_t::convert(unsigned const &n)'],['../structcutlass_1_1half__t.html#a5ef78c3a7ccd316fc4fe52b7c230f87b',1,'cutlass::half_t::convert(half_t const &x)'],['../structcutlass_1_1NumericConverter.html#a4d1a347bd8c92f3dc5b6e919005d34d2',1,'cutlass::NumericConverter::convert()'],['../structcutlass_1_1NumericConverter_3_01int8__t_00_01float_00_01Round_01_4.html#ab90d4ee00677c3129962501a148cdaf7',1,'cutlass::NumericConverter< int8_t, float, Round >::convert()'],['../structcutlass_1_1NumericConverter_3_01T_00_01T_00_01Round_01_4.html#aa61325e20130b528104b990fc8ec3bb8',1,'cutlass::NumericConverter< T, T, Round >::convert()'],['../structcutlass_1_1NumericConverter_3_01float_00_01half__t_00_01Round_01_4.html#af7d7dec76e968b489efa25be32a4cf04',1,'cutlass::NumericConverter< float, half_t, Round >::convert()'],['../structcutlass_1_1NumericConverter_3_01half__t_00_01float_00_01FloatRoundStyle_1_1round__to__nearest_01_4.html#aaf16c1dd3bb1fc0566c819146dfd5ab8',1,'cutlass::NumericConverter< half_t, float, FloatRoundStyle::round_to_nearest >::convert()'],['../structcutlass_1_1NumericConverter_3_01half__t_00_01float_00_01FloatRoundStyle_1_1round__toward__zero_01_4.html#a43ab30e5283f39b1defe46b13da9ac1b',1,'cutlass::NumericConverter< half_t, float, FloatRoundStyle::round_toward_zero >::convert()'],['../structcutlass_1_1NumericConverterClamp.html#aefadbac80ed0f5be1abc6f6704631fe2',1,'cutlass::NumericConverterClamp::convert()'],['../structcutlass_1_1NumericArrayConverter.html#a157bacb3ab7d03032c83ff75d0a0d090',1,'cutlass::NumericArrayConverter::convert()'],['../structcutlass_1_1NumericArrayConverter_3_01half__t_00_01float_00_012_00_01FloatRoundStyle_1_1round__to__nearest_01_4.html#a3cc4d59f083555f24288e15490eeb41d',1,'cutlass::NumericArrayConverter< half_t, float, 2, FloatRoundStyle::round_to_nearest >::convert()'],['../structcutlass_1_1NumericArrayConverter_3_01float_00_01half__t_00_012_00_01Round_01_4.html#a16ac842664840d5db0ba823303c9ec4e',1,'cutlass::NumericArrayConverter< float, half_t, 2, Round >::convert()'],['../structcutlass_1_1NumericArrayConverter_3_01half__t_00_01float_00_01N_00_01Round_01_4.html#af8e268c03414c218485ed80e158725e8',1,'cutlass::NumericArrayConverter< half_t, float, N, Round >::convert()'],['../structcutlass_1_1NumericArrayConverter_3_01float_00_01half__t_00_01N_00_01Round_01_4.html#a4602966344dcf217c4dbd97deb358c6f',1,'cutlass::NumericArrayConverter< float, half_t, N, Round >::convert()']]],
|
|
['coord',['Coord',['../structcutlass_1_1Coord.html#a5281db2419b5567db4265dead7ac02cc',1,'cutlass::Coord::Coord(Index value=Index(0))'],['../structcutlass_1_1Coord.html#ab7094975a4b7471315ca083ae575030a',1,'cutlass::Coord::Coord(Index const (&_idx)[kRank])'],['../structcutlass_1_1Coord.html#a42aefbb547e39b8cc7267c58a610c147',1,'cutlass::Coord::Coord(Coord< kRank, Index, LongIndex > const &coord)']]],
|
|
['copy',['copy',['../namespacecutlass_1_1device__memory.html#a117e201964852b2b3e228d81eaf73f93',1,'cutlass::device_memory']]],
|
|
['copy_5fdevice_5fto_5fdevice',['copy_device_to_device',['../namespacecutlass_1_1device__memory.html#a8ff6151b081442db9af7421110c0242b',1,'cutlass::device_memory']]],
|
|
['copy_5fhost_5fto_5fhost',['copy_host_to_host',['../namespacecutlass_1_1device__memory.html#a0a3ab26e6c9a8aae6b09bfb3e4eb24e8',1,'cutlass::device_memory']]],
|
|
['copy_5fin_5fdevice_5fto_5fdevice',['copy_in_device_to_device',['../classcutlass_1_1HostTensor.html#a5686ea068c8f3e820ccff015e95bc474',1,'cutlass::HostTensor']]],
|
|
['copy_5fin_5fdevice_5fto_5fhost',['copy_in_device_to_host',['../classcutlass_1_1HostTensor.html#a2b4858efb0356a6fc01bb9f55f0ad3b2',1,'cutlass::HostTensor']]],
|
|
['copy_5fin_5fhost_5fto_5fdevice',['copy_in_host_to_device',['../classcutlass_1_1HostTensor.html#ad385330c69ecd7bd0b6c3660815253fa',1,'cutlass::HostTensor']]],
|
|
['copy_5fin_5fhost_5fto_5fhost',['copy_in_host_to_host',['../classcutlass_1_1HostTensor.html#ae11229ea69460ca174c5e6f9815eb97f',1,'cutlass::HostTensor']]],
|
|
['copy_5fout_5fdevice_5fto_5fdevice',['copy_out_device_to_device',['../classcutlass_1_1HostTensor.html#ab7179440d39b0445113b30b7a460a1ec',1,'cutlass::HostTensor']]],
|
|
['copy_5fout_5fdevice_5fto_5fhost',['copy_out_device_to_host',['../classcutlass_1_1HostTensor.html#ab3051d2842b3aa3815e2ea5f53abfc2a',1,'cutlass::HostTensor']]],
|
|
['copy_5fout_5fhost_5fto_5fdevice',['copy_out_host_to_device',['../classcutlass_1_1HostTensor.html#abeefdb8bccb2d8d751fdb22fa7e8ef0c',1,'cutlass::HostTensor']]],
|
|
['copy_5fout_5fhost_5fto_5fhost',['copy_out_host_to_host',['../classcutlass_1_1HostTensor.html#a40da221db96cfda76ba5623856c66bf1',1,'cutlass::HostTensor']]],
|
|
['copy_5fto_5fdevice',['copy_to_device',['../namespacecutlass_1_1device__memory.html#adce1a75429c0eae9d34dc18944777325',1,'cutlass::device_memory']]],
|
|
['copy_5fto_5fhost',['copy_to_host',['../namespacecutlass_1_1device__memory.html#a5333f291105136d2e8e4c31329d93c31',1,'cutlass::device_memory']]],
|
|
['copysign',['copysign',['../namespacecutlass.html#ac42c217e2600fb741312b535c633bb76',1,'cutlass']]],
|
|
['cos',['cos',['../namespacecutlass.html#a2337866060023f87d4d821850738541f',1,'cutlass']]],
|
|
['crbegin',['crbegin',['../classcutlass_1_1Array_3_01T_00_01N_00_01true_01_4.html#ab1813941489bef9563cc0bc3f647b2ca',1,'cutlass::Array< T, N, true >::crbegin()'],['../classcutlass_1_1Array_3_01T_00_01N_00_01false_01_4.html#a01b9f76c6052dc2467095b91c1ebe34e',1,'cutlass::Array< T, N, false >::crbegin()']]],
|
|
['crend',['crend',['../classcutlass_1_1Array_3_01T_00_01N_00_01true_01_4.html#a76e1b5d728b155f9d967a43c0cc3b0dd',1,'cutlass::Array< T, N, true >::crend()'],['../classcutlass_1_1Array_3_01T_00_01N_00_01false_01_4.html#abbc436f18649c1578ef95eb501872094',1,'cutlass::Array< T, N, false >::crend()']]],
|
|
['cuda_5fexception',['cuda_exception',['../classcutlass_1_1cuda__exception.html#acbfb99c9979ce7d24fe774459c66cfa5',1,'cutlass::cuda_exception']]],
|
|
['cuda_5fperror_5fimpl',['cuda_perror_impl',['../namespacecutlass.html#a6d3dfeb642a2ce3d5f52243fe48f89cc',1,'cutlass::cuda_perror_impl()'],['../tools_2util_2include_2cutlass_2util_2debug_8h.html#aed67644b6ffaa6d88a2efa09fcaafdce',1,'cuda_perror_impl(): debug.h']]],
|
|
['cudaerror',['cudaError',['../classcutlass_1_1cuda__exception.html#a5e2363c04ed0a43e244b274cb21aebf1',1,'cutlass::cuda_exception']]]
|
|
];
|