402 lines
29 KiB
HTML
402 lines
29 KiB
HTML
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
|
|
<html xmlns="http://www.w3.org/1999/xhtml">
|
|
<head>
|
|
<meta http-equiv="Content-Type" content="text/xhtml;charset=UTF-8"/>
|
|
<meta http-equiv="X-UA-Compatible" content="IE=9"/>
|
|
<meta name="generator" content="Doxygen 1.8.14"/>
|
|
<meta name="viewport" content="width=device-width, initial-scale=1"/>
|
|
<title>Cutlass: cutlass::gemm::ThreadMultiplyAdd< ThreadGemmShape_, ThreadsPerWarp_, ScalarA_, ScalarB_, ScalarC_, kLayout_ > Struct Template Reference</title>
|
|
<link href="tabs.css" rel="stylesheet" type="text/css"/>
|
|
<script type="text/javascript" src="jquery.js"></script>
|
|
<script type="text/javascript" src="dynsections.js"></script>
|
|
<link href="search/search.css" rel="stylesheet" type="text/css"/>
|
|
<script type="text/javascript" src="search/searchdata.js"></script>
|
|
<script type="text/javascript" src="search/search.js"></script>
|
|
<script type="text/x-mathjax-config">
|
|
MathJax.Hub.Config({
|
|
extensions: ["tex2jax.js"],
|
|
jax: ["input/TeX","output/HTML-CSS"],
|
|
});
|
|
</script><script type="text/javascript" async src="http://cdn.mathjax.org/mathjax/latest/MathJax.js"></script>
|
|
<link href="doxygen.css" rel="stylesheet" type="text/css" />
|
|
</head>
|
|
<body>
|
|
<div id="top"><!-- do not remove this div, it is closed by doxygen! -->
|
|
<div id="titlearea">
|
|
<table cellspacing="0" cellpadding="0">
|
|
<tbody>
|
|
<tr style="height: 56px;">
|
|
<td id="projectalign" style="padding-left: 0.5em;">
|
|
<div id="projectname">Cutlass
|
|
</div>
|
|
<div id="projectbrief">CUDA Templates for Linear Algebra Subroutines and Solvers</div>
|
|
</td>
|
|
</tr>
|
|
</tbody>
|
|
</table>
|
|
</div>
|
|
<!-- end header part -->
|
|
<!-- Generated by Doxygen 1.8.14 -->
|
|
<script type="text/javascript">
|
|
/* @license magnet:?xt=urn:btih:cf05388f2679ee054f2beb29a391d25f4e673ac3&dn=gpl-2.0.txt GPL-v2 */
|
|
var searchBox = new SearchBox("searchBox", "search",false,'Search');
|
|
/* @license-end */
|
|
</script>
|
|
<script type="text/javascript" src="menudata.js"></script>
|
|
<script type="text/javascript" src="menu.js"></script>
|
|
<script type="text/javascript">
|
|
/* @license magnet:?xt=urn:btih:cf05388f2679ee054f2beb29a391d25f4e673ac3&dn=gpl-2.0.txt GPL-v2 */
|
|
$(function() {
|
|
initMenu('',true,false,'search.php','Search');
|
|
$(document).ready(function() { init_search(); });
|
|
});
|
|
/* @license-end */</script>
|
|
<div id="main-nav"></div>
|
|
<!-- window showing the filter options -->
|
|
<div id="MSearchSelectWindow"
|
|
onmouseover="return searchBox.OnSearchSelectShow()"
|
|
onmouseout="return searchBox.OnSearchSelectHide()"
|
|
onkeydown="return searchBox.OnSearchSelectKey(event)">
|
|
</div>
|
|
|
|
<!-- iframe showing the search results (closed by default) -->
|
|
<div id="MSearchResultsWindow">
|
|
<iframe src="javascript:void(0)" frameborder="0"
|
|
name="MSearchResults" id="MSearchResults">
|
|
</iframe>
|
|
</div>
|
|
|
|
<div id="nav-path" class="navpath">
|
|
<ul>
|
|
<li class="navelem"><a class="el" href="namespacecutlass.html">cutlass</a></li><li class="navelem"><a class="el" href="namespacecutlass_1_1gemm.html">gemm</a></li><li class="navelem"><a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html">ThreadMultiplyAdd</a></li> </ul>
|
|
</div>
|
|
</div><!-- top -->
|
|
<div class="header">
|
|
<div class="summary">
|
|
<a href="#pub-types">Public Types</a> |
|
|
<a href="#pub-methods">Public Member Functions</a> |
|
|
<a href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd-members.html">List of all members</a> </div>
|
|
<div class="headertitle">
|
|
<div class="title">cutlass::gemm::ThreadMultiplyAdd< ThreadGemmShape_, ThreadsPerWarp_, ScalarA_, ScalarB_, ScalarC_, kLayout_ > Struct Template Reference</div> </div>
|
|
</div><!--header-->
|
|
<div class="contents">
|
|
|
|
<p>Template performing matrix multiply-add operation within a thread.
|
|
</p>
|
|
|
|
<p><code>#include <<a class="el" href="thread__multiply__add_8h_source.html">thread_multiply_add.h</a>></code></p>
|
|
<table class="memberdecls">
|
|
<tr class="heading"><td colspan="2"><h2 class="groupheader"><a name="pub-types"></a>
|
|
Public Types</h2></td></tr>
|
|
<tr class="memitem:a56d687b878397c694e7338fa750995af"><td class="memItemLeft" align="right" valign="top">typedef <a class="el" href="structcutlass_1_1Shape.html">Shape</a>< 1, 1, 1, 1 > </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a56d687b878397c694e7338fa750995af">InstructionShape</a></td></tr>
|
|
<tr class="memdesc:a56d687b878397c694e7338fa750995af"><td class="mdescLeft"> </td><td class="mdescRight">The shape of the instruction. <a href="#a56d687b878397c694e7338fa750995af">More...</a><br /></td></tr>
|
|
<tr class="separator:a56d687b878397c694e7338fa750995af"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a33a68b52cca697bd505bfd982938143e"><td class="memItemLeft" align="right" valign="top">typedef ThreadGemmShape_ </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a33a68b52cca697bd505bfd982938143e">ThreadGemmShape</a></td></tr>
|
|
<tr class="memdesc:a33a68b52cca697bd505bfd982938143e"><td class="mdescLeft"> </td><td class="mdescRight">The shape of a thread-leveel matrix multiply accumulate. <a href="#a33a68b52cca697bd505bfd982938143e">More...</a><br /></td></tr>
|
|
<tr class="separator:a33a68b52cca697bd505bfd982938143e"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:ad8ea3777c307bf3f8c58a8df3966715d"><td class="memItemLeft" align="right" valign="top">typedef <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a33a68b52cca697bd505bfd982938143e">ThreadGemmShape</a> </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#ad8ea3777c307bf3f8c58a8df3966715d">AccumulatorsPerThread</a></td></tr>
|
|
<tr class="memdesc:ad8ea3777c307bf3f8c58a8df3966715d"><td class="mdescLeft"> </td><td class="mdescRight">Aliased to "AccumulatorsPerThread" for compatibility. Expect to be renamed in CUTLASS v2.0. <a href="#ad8ea3777c307bf3f8c58a8df3966715d">More...</a><br /></td></tr>
|
|
<tr class="separator:ad8ea3777c307bf3f8c58a8df3966715d"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a19bd7eb621b08f192bc01a4634853a9b"><td class="memItemLeft" align="right" valign="top">typedef ThreadsPerWarp_ </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a19bd7eb621b08f192bc01a4634853a9b">ThreadsPerWarp</a></td></tr>
|
|
<tr class="memdesc:a19bd7eb621b08f192bc01a4634853a9b"><td class="mdescLeft"> </td><td class="mdescRight">The number of threads per warp. <a href="#a19bd7eb621b08f192bc01a4634853a9b">More...</a><br /></td></tr>
|
|
<tr class="separator:a19bd7eb621b08f192bc01a4634853a9b"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a9f706e141ec3bc880fa17a5731d8370e"><td class="memItemLeft" align="right" valign="top">typedef <a class="el" href="structcutlass_1_1ShapeMul.html">ShapeMul</a>< <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a33a68b52cca697bd505bfd982938143e">ThreadGemmShape</a>, <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a19bd7eb621b08f192bc01a4634853a9b">ThreadsPerWarp</a> >::<a class="el" href="structcutlass_1_1Shape.html">Shape</a> </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a9f706e141ec3bc880fa17a5731d8370e">AccumulatorsPerWarp</a></td></tr>
|
|
<tr class="memdesc:a9f706e141ec3bc880fa17a5731d8370e"><td class="mdescLeft"> </td><td class="mdescRight">The number of accumulators per warp. <a href="#a9f706e141ec3bc880fa17a5731d8370e">More...</a><br /></td></tr>
|
|
<tr class="separator:a9f706e141ec3bc880fa17a5731d8370e"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a6bb4f6a102edc2c8fba5b67abf05c363"><td class="memItemLeft" align="right" valign="top">typedef ScalarA_ </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a6bb4f6a102edc2c8fba5b67abf05c363">ScalarA</a></td></tr>
|
|
<tr class="memdesc:a6bb4f6a102edc2c8fba5b67abf05c363"><td class="mdescLeft"> </td><td class="mdescRight">The type for A. <a href="#a6bb4f6a102edc2c8fba5b67abf05c363">More...</a><br /></td></tr>
|
|
<tr class="separator:a6bb4f6a102edc2c8fba5b67abf05c363"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a7c1cc536ac6ad12800f9e2b5ec682649"><td class="memItemLeft" align="right" valign="top">typedef <a class="el" href="structcutlass_1_1Fragment.html">Fragment</a>< <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a6bb4f6a102edc2c8fba5b67abf05c363">ScalarA</a>, AccumulatorsPerThread::kW > </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a7c1cc536ac6ad12800f9e2b5ec682649">FragmentA</a></td></tr>
|
|
<tr class="memdesc:a7c1cc536ac6ad12800f9e2b5ec682649"><td class="mdescLeft"> </td><td class="mdescRight">The fragment for A. <a href="#a7c1cc536ac6ad12800f9e2b5ec682649">More...</a><br /></td></tr>
|
|
<tr class="separator:a7c1cc536ac6ad12800f9e2b5ec682649"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a6c9a73da33b5ba70307a719db988b56c"><td class="memItemLeft" align="right" valign="top">typedef ScalarB_ </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a6c9a73da33b5ba70307a719db988b56c">ScalarB</a></td></tr>
|
|
<tr class="memdesc:a6c9a73da33b5ba70307a719db988b56c"><td class="mdescLeft"> </td><td class="mdescRight">The type for B. <a href="#a6c9a73da33b5ba70307a719db988b56c">More...</a><br /></td></tr>
|
|
<tr class="separator:a6c9a73da33b5ba70307a719db988b56c"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a1401162276ea0858ea85a8e4785adbad"><td class="memItemLeft" align="right" valign="top">typedef <a class="el" href="structcutlass_1_1Fragment.html">Fragment</a>< <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a6c9a73da33b5ba70307a719db988b56c">ScalarB</a>, AccumulatorsPerThread::kH > </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a1401162276ea0858ea85a8e4785adbad">FragmentB</a></td></tr>
|
|
<tr class="memdesc:a1401162276ea0858ea85a8e4785adbad"><td class="mdescLeft"> </td><td class="mdescRight">The fragment for B. <a href="#a1401162276ea0858ea85a8e4785adbad">More...</a><br /></td></tr>
|
|
<tr class="separator:a1401162276ea0858ea85a8e4785adbad"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:af41778b170d940d10bd53f13d34912b1"><td class="memItemLeft" align="right" valign="top">typedef ScalarC_ </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#af41778b170d940d10bd53f13d34912b1">ScalarC</a></td></tr>
|
|
<tr class="memdesc:af41778b170d940d10bd53f13d34912b1"><td class="mdescLeft"> </td><td class="mdescRight">The type for C and D. <a href="#af41778b170d940d10bd53f13d34912b1">More...</a><br /></td></tr>
|
|
<tr class="separator:af41778b170d940d10bd53f13d34912b1"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a72d1ac143dab68b6cdd73d057315fcb6"><td class="memItemLeft" align="right" valign="top">typedef <a class="el" href="structcutlass_1_1Fragment.html">Fragment</a>< <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#af41778b170d940d10bd53f13d34912b1">ScalarC</a>, AccumulatorsPerThread::kH *AccumulatorsPerThread::kW, 16 > </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a72d1ac143dab68b6cdd73d057315fcb6">Accumulators</a></td></tr>
|
|
<tr class="memdesc:a72d1ac143dab68b6cdd73d057315fcb6"><td class="mdescLeft"> </td><td class="mdescRight">The accumulators. <a href="#a72d1ac143dab68b6cdd73d057315fcb6">More...</a><br /></td></tr>
|
|
<tr class="separator:a72d1ac143dab68b6cdd73d057315fcb6"><td class="memSeparator" colspan="2"> </td></tr>
|
|
</table><table class="memberdecls">
|
|
<tr class="heading"><td colspan="2"><h2 class="groupheader"><a name="pub-methods"></a>
|
|
Public Member Functions</h2></td></tr>
|
|
<tr class="memitem:ac087f0b397599221b74d220fcb1c7121"><td class="memItemLeft" align="right" valign="top">CUTLASS_DEVICE </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#ac087f0b397599221b74d220fcb1c7121">ThreadMultiplyAdd</a> ()</td></tr>
|
|
<tr class="memdesc:ac087f0b397599221b74d220fcb1c7121"><td class="mdescLeft"> </td><td class="mdescRight">Ctor. <a href="#ac087f0b397599221b74d220fcb1c7121">More...</a><br /></td></tr>
|
|
<tr class="separator:ac087f0b397599221b74d220fcb1c7121"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a7989d48e4c2e16b7804b813630f347cb"><td class="memItemLeft" align="right" valign="top">CUTLASS_DEVICE void </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a7989d48e4c2e16b7804b813630f347cb">multiply_add</a> (<a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a7c1cc536ac6ad12800f9e2b5ec682649">FragmentA</a> const &a, <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a1401162276ea0858ea85a8e4785adbad">FragmentB</a> const &b, <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a72d1ac143dab68b6cdd73d057315fcb6">Accumulators</a> const &c, <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a72d1ac143dab68b6cdd73d057315fcb6">Accumulators</a> &d)</td></tr>
|
|
<tr class="memdesc:a7989d48e4c2e16b7804b813630f347cb"><td class="mdescLeft"> </td><td class="mdescRight">Multiply : d = a*b + c. <a href="#a7989d48e4c2e16b7804b813630f347cb">More...</a><br /></td></tr>
|
|
<tr class="separator:a7989d48e4c2e16b7804b813630f347cb"><td class="memSeparator" colspan="2"> </td></tr>
|
|
</table>
|
|
<h2 class="groupheader">Member Typedef Documentation</h2>
|
|
<a id="a72d1ac143dab68b6cdd73d057315fcb6"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a72d1ac143dab68b6cdd73d057315fcb6">◆ </a></span>Accumulators</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor> </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef <a class="el" href="structcutlass_1_1Fragment.html">Fragment</a><<a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#af41778b170d940d10bd53f13d34912b1">ScalarC</a>, AccumulatorsPerThread::kH * AccumulatorsPerThread::kW, 16> <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html">cutlass::gemm::ThreadMultiplyAdd</a>< ThreadGemmShape_, ThreadsPerWarp_, ScalarA_, ScalarB_, ScalarC_, kLayout_ >::<a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a72d1ac143dab68b6cdd73d057315fcb6">Accumulators</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="ad8ea3777c307bf3f8c58a8df3966715d"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#ad8ea3777c307bf3f8c58a8df3966715d">◆ </a></span>AccumulatorsPerThread</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor> </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a33a68b52cca697bd505bfd982938143e">ThreadGemmShape</a> <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html">cutlass::gemm::ThreadMultiplyAdd</a>< ThreadGemmShape_, ThreadsPerWarp_, ScalarA_, ScalarB_, ScalarC_, kLayout_ >::<a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#ad8ea3777c307bf3f8c58a8df3966715d">AccumulatorsPerThread</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a9f706e141ec3bc880fa17a5731d8370e"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a9f706e141ec3bc880fa17a5731d8370e">◆ </a></span>AccumulatorsPerWarp</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor> </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef <a class="el" href="structcutlass_1_1ShapeMul.html">ShapeMul</a><<a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a33a68b52cca697bd505bfd982938143e">ThreadGemmShape</a>, <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a19bd7eb621b08f192bc01a4634853a9b">ThreadsPerWarp</a>>::<a class="el" href="structcutlass_1_1Shape.html">Shape</a> <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html">cutlass::gemm::ThreadMultiplyAdd</a>< ThreadGemmShape_, ThreadsPerWarp_, ScalarA_, ScalarB_, ScalarC_, kLayout_ >::<a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a9f706e141ec3bc880fa17a5731d8370e">AccumulatorsPerWarp</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a7c1cc536ac6ad12800f9e2b5ec682649"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a7c1cc536ac6ad12800f9e2b5ec682649">◆ </a></span>FragmentA</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor> </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef <a class="el" href="structcutlass_1_1Fragment.html">Fragment</a><<a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a6bb4f6a102edc2c8fba5b67abf05c363">ScalarA</a>, AccumulatorsPerThread::kW> <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html">cutlass::gemm::ThreadMultiplyAdd</a>< ThreadGemmShape_, ThreadsPerWarp_, ScalarA_, ScalarB_, ScalarC_, kLayout_ >::<a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a7c1cc536ac6ad12800f9e2b5ec682649">FragmentA</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a1401162276ea0858ea85a8e4785adbad"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a1401162276ea0858ea85a8e4785adbad">◆ </a></span>FragmentB</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor> </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef <a class="el" href="structcutlass_1_1Fragment.html">Fragment</a><<a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a6c9a73da33b5ba70307a719db988b56c">ScalarB</a>, AccumulatorsPerThread::kH> <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html">cutlass::gemm::ThreadMultiplyAdd</a>< ThreadGemmShape_, ThreadsPerWarp_, ScalarA_, ScalarB_, ScalarC_, kLayout_ >::<a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a1401162276ea0858ea85a8e4785adbad">FragmentB</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a56d687b878397c694e7338fa750995af"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a56d687b878397c694e7338fa750995af">◆ </a></span>InstructionShape</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor> </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef <a class="el" href="structcutlass_1_1Shape.html">Shape</a><1, 1, 1, 1> <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html">cutlass::gemm::ThreadMultiplyAdd</a>< ThreadGemmShape_, ThreadsPerWarp_, ScalarA_, ScalarB_, ScalarC_, kLayout_ >::<a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a56d687b878397c694e7338fa750995af">InstructionShape</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a6bb4f6a102edc2c8fba5b67abf05c363"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a6bb4f6a102edc2c8fba5b67abf05c363">◆ </a></span>ScalarA</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor> </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef ScalarA_ <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html">cutlass::gemm::ThreadMultiplyAdd</a>< ThreadGemmShape_, ThreadsPerWarp_, ScalarA_, ScalarB_, ScalarC_, kLayout_ >::<a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a6bb4f6a102edc2c8fba5b67abf05c363">ScalarA</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a6c9a73da33b5ba70307a719db988b56c"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a6c9a73da33b5ba70307a719db988b56c">◆ </a></span>ScalarB</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor> </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef ScalarB_ <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html">cutlass::gemm::ThreadMultiplyAdd</a>< ThreadGemmShape_, ThreadsPerWarp_, ScalarA_, ScalarB_, ScalarC_, kLayout_ >::<a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a6c9a73da33b5ba70307a719db988b56c">ScalarB</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="af41778b170d940d10bd53f13d34912b1"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#af41778b170d940d10bd53f13d34912b1">◆ </a></span>ScalarC</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor> </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef ScalarC_ <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html">cutlass::gemm::ThreadMultiplyAdd</a>< ThreadGemmShape_, ThreadsPerWarp_, ScalarA_, ScalarB_, ScalarC_, kLayout_ >::<a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#af41778b170d940d10bd53f13d34912b1">ScalarC</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a33a68b52cca697bd505bfd982938143e"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a33a68b52cca697bd505bfd982938143e">◆ </a></span>ThreadGemmShape</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor> </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef ThreadGemmShape_ <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html">cutlass::gemm::ThreadMultiplyAdd</a>< ThreadGemmShape_, ThreadsPerWarp_, ScalarA_, ScalarB_, ScalarC_, kLayout_ >::<a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a33a68b52cca697bd505bfd982938143e">ThreadGemmShape</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a19bd7eb621b08f192bc01a4634853a9b"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a19bd7eb621b08f192bc01a4634853a9b">◆ </a></span>ThreadsPerWarp</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor> </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef ThreadsPerWarp_ <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html">cutlass::gemm::ThreadMultiplyAdd</a>< ThreadGemmShape_, ThreadsPerWarp_, ScalarA_, ScalarB_, ScalarC_, kLayout_ >::<a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a19bd7eb621b08f192bc01a4634853a9b">ThreadsPerWarp</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<h2 class="groupheader">Constructor & Destructor Documentation</h2>
|
|
<a id="ac087f0b397599221b74d220fcb1c7121"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#ac087f0b397599221b74d220fcb1c7121">◆ </a></span>ThreadMultiplyAdd()</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor> </div>
|
|
<table class="mlabels">
|
|
<tr>
|
|
<td class="mlabels-left">
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">CUTLASS_DEVICE <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html">cutlass::gemm::ThreadMultiplyAdd</a>< ThreadGemmShape_, ThreadsPerWarp_, ScalarA_, ScalarB_, ScalarC_, kLayout_ >::<a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html">ThreadMultiplyAdd</a> </td>
|
|
<td>(</td>
|
|
<td class="paramname"></td><td>)</td>
|
|
<td></td>
|
|
</tr>
|
|
</table>
|
|
</td>
|
|
<td class="mlabels-right">
|
|
<span class="mlabels"><span class="mlabel">inline</span></span> </td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<h2 class="groupheader">Member Function Documentation</h2>
|
|
<a id="a7989d48e4c2e16b7804b813630f347cb"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a7989d48e4c2e16b7804b813630f347cb">◆ </a></span>multiply_add()</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template<typename ThreadGemmShape_ , typename ThreadsPerWarp_ , typename ScalarA_ , typename ScalarB_ , typename ScalarC_ , MatrixLayout::Kind kLayout_ = MatrixLayout::kColumnMajor> </div>
|
|
<table class="mlabels">
|
|
<tr>
|
|
<td class="mlabels-left">
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">CUTLASS_DEVICE void <a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html">cutlass::gemm::ThreadMultiplyAdd</a>< ThreadGemmShape_, ThreadsPerWarp_, ScalarA_, ScalarB_, ScalarC_, kLayout_ >::multiply_add </td>
|
|
<td>(</td>
|
|
<td class="paramtype"><a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a7c1cc536ac6ad12800f9e2b5ec682649">FragmentA</a> const & </td>
|
|
<td class="paramname"><em>a</em>, </td>
|
|
</tr>
|
|
<tr>
|
|
<td class="paramkey"></td>
|
|
<td></td>
|
|
<td class="paramtype"><a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a1401162276ea0858ea85a8e4785adbad">FragmentB</a> const & </td>
|
|
<td class="paramname"><em>b</em>, </td>
|
|
</tr>
|
|
<tr>
|
|
<td class="paramkey"></td>
|
|
<td></td>
|
|
<td class="paramtype"><a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a72d1ac143dab68b6cdd73d057315fcb6">Accumulators</a> const & </td>
|
|
<td class="paramname"><em>c</em>, </td>
|
|
</tr>
|
|
<tr>
|
|
<td class="paramkey"></td>
|
|
<td></td>
|
|
<td class="paramtype"><a class="el" href="structcutlass_1_1gemm_1_1ThreadMultiplyAdd.html#a72d1ac143dab68b6cdd73d057315fcb6">Accumulators</a> & </td>
|
|
<td class="paramname"><em>d</em> </td>
|
|
</tr>
|
|
<tr>
|
|
<td></td>
|
|
<td>)</td>
|
|
<td></td><td></td>
|
|
</tr>
|
|
</table>
|
|
</td>
|
|
<td class="mlabels-right">
|
|
<span class="mlabels"><span class="mlabel">inline</span></span> </td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<hr/>The documentation for this struct was generated from the following file:<ul>
|
|
<li><a class="el" href="thread__multiply__add_8h_source.html">thread_multiply_add.h</a></li>
|
|
</ul>
|
|
</div><!-- contents -->
|
|
<!-- start footer part -->
|
|
<hr class="footer"/><address class="footer"><small>
|
|
Generated on Fri Oct 26 2018 14:53:40 for Cutlass by  <a href="http://www.doxygen.org/index.html">
|
|
<img class="footer" src="doxygen.png" alt="doxygen"/>
|
|
</a> 1.8.14
|
|
</small></address>
|
|
</body>
|
|
</html>
|