550 lines
41 KiB
HTML
550 lines
41 KiB
HTML
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
|
|
<html xmlns="http://www.w3.org/1999/xhtml">
|
|
<head>
|
|
<meta http-equiv="Content-Type" content="text/xhtml;charset=UTF-8"/>
|
|
<meta http-equiv="X-UA-Compatible" content="IE=9"/>
|
|
<meta name="generator" content="Doxygen 1.8.14"/>
|
|
<meta name="viewport" content="width=device-width, initial-scale=1"/>
|
|
<title>Cutlass: cutlass::gemm::GemmSharedLoadTileDTraits&lt; Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ &gt; Struct Template Reference</title>
|
|
<link href="tabs.css" rel="stylesheet" type="text/css"/>
|
|
<script type="text/javascript" src="jquery.js"></script>
|
|
<script type="text/javascript" src="dynsections.js"></script>
|
|
<link href="search/search.css" rel="stylesheet" type="text/css"/>
|
|
<script type="text/javascript" src="search/searchdata.js"></script>
|
|
<script type="text/javascript" src="search/search.js"></script>
|
|
<!-- MathJax v2 configuration: enables the tex2jax preprocessor with TeX input and HTML-CSS output. -->
<script type="text/x-mathjax-config">
  MathJax.Hub.Config({
    extensions: ["tex2jax.js"],
    jax: ["input/TeX","output/HTML-CSS"],
  });
</script>
<!-- cdn.mathjax.org has been retired and plain http is blocked as mixed content on https pages; load a pinned MathJax 2.x release over https from cdnjs instead. -->
<script type="text/javascript" async src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.7/MathJax.js"></script>
|
|
<link href="doxygen.css" rel="stylesheet" type="text/css" />
|
|
</head>
|
|
<body>
|
|
<div id="top"><!-- do not remove this div, it is closed by doxygen! -->
|
|
<div id="titlearea">
|
|
<table cellspacing="0" cellpadding="0">
|
|
<tbody>
|
|
<tr style="height: 56px;">
|
|
<td id="projectalign" style="padding-left: 0.5em;">
|
|
<div id="projectname">Cutlass
|
|
</div>
|
|
<div id="projectbrief">CUDA Templates for Linear Algebra Subroutines and Solvers</div>
|
|
</td>
|
|
</tr>
|
|
</tbody>
|
|
</table>
|
|
</div>
|
|
<!-- end header part -->
|
|
<!-- Generated by Doxygen 1.8.14 -->
|
|
<!-- Creates the global searchBox object that the inline onmouseover/onmouseout/onkeydown handlers of #MSearchSelectWindow call into. NOTE(review): SearchBox is presumably defined by search/search.js, which is loaded in the head; confirm. -->
<script type="text/javascript">
|
|
/* @license magnet:?xt=urn:btih:cf05388f2679ee054f2beb29a391d25f4e673ac3&dn=gpl-2.0.txt GPL-v2 */
|
|
var searchBox = new SearchBox("searchBox", "search",false,'Search');
|
|
/* @license-end */
|
|
</script>
|
|
<script type="text/javascript" src="menudata.js"></script>
|
|
<script type="text/javascript" src="menu.js"></script>
|
|
<!-- Registers a jQuery ready callback that calls initMenu and then registers a second ready callback that calls init_search. NOTE(review): initMenu is presumably provided by menu.js and init_search by search/search.js; confirm. -->
<script type="text/javascript">
|
|
/* @license magnet:?xt=urn:btih:cf05388f2679ee054f2beb29a391d25f4e673ac3&dn=gpl-2.0.txt GPL-v2 */
|
|
$(function() {
|
|
initMenu('',true,false,'search.php','Search');
|
|
$(document).ready(function() { init_search(); });
|
|
});
|
|
/* @license-end */</script>
|
|
<div id="main-nav"></div>
|
|
<!-- window showing the filter options -->
|
|
<div id="MSearchSelectWindow"
|
|
onmouseover="return searchBox.OnSearchSelectShow()"
|
|
onmouseout="return searchBox.OnSearchSelectHide()"
|
|
onkeydown="return searchBox.OnSearchSelectKey(event)">
|
|
</div>
|
|
|
|
<!-- iframe showing the search results (closed by default) -->
|
|
<div id="MSearchResultsWindow">
<!-- The title gives the results frame an accessible name for assistive technology; name and id are unchanged so existing script lookups keep working. -->
<iframe src="javascript:void(0)" frameborder="0"
        name="MSearchResults" id="MSearchResults" title="Search results">
</iframe>
</div>
|
|
|
|
<div id="nav-path" class="navpath">
|
|
<ul>
|
|
<li class="navelem"><a class="el" href="namespacecutlass.html">cutlass</a></li><li class="navelem"><a class="el" href="namespacecutlass_1_1gemm.html">gemm</a></li><li class="navelem"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">GemmSharedLoadTileDTraits</a></li> </ul>
|
|
</div>
|
|
</div><!-- top -->
|
|
<div class="header">
|
|
<div class="summary">
|
|
<a href="#nested-classes">Classes</a> |
|
|
<a href="#pub-types">Public Types</a> |
|
|
<a href="#pub-static-attribs">Static Public Attributes</a> |
|
|
<a href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits-members.html">List of all members</a> </div>
|
|
<div class="headertitle">
|
|
<div class="title">cutlass::gemm::GemmSharedLoadTileDTraits&lt; Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ &gt; Struct Template Reference</div> </div>
|
|
</div><!--header-->
|
|
<div class="contents">
|
|
|
|
<p><code>#include &lt;<a class="el" href="gemm__shared__tile_8h_source.html">gemm_shared_tile.h</a>&gt;</code></p>
|
|
<table class="memberdecls">
|
|
<tr class="heading"><td colspan="2"><h2 class="groupheader"><a name="nested-classes"></a>
|
|
Classes</h2></td></tr>
|
|
<tr class="memitem:"><td class="memItemLeft" align="right" valign="top">struct  </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits_1_1ThreadOffset.html">ThreadOffset</a></td></tr>
|
|
<tr class="memdesc:"><td class="mdescLeft"> </td><td class="mdescRight">Computes the thread offset in (H, W) based on thread ID. <a href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits_1_1ThreadOffset.html#details">More...</a><br /></td></tr>
|
|
<tr class="separator:"><td class="memSeparator" colspan="2"> </td></tr>
|
|
</table><table class="memberdecls">
|
|
<tr class="heading"><td colspan="2"><h2 class="groupheader"><a name="pub-types"></a>
|
|
Public Types</h2></td></tr>
|
|
<tr class="memitem:a1b025cb056729706f36469e74a9799dc"><td class="memItemLeft" align="right" valign="top">typedef <a class="el" href="structcutlass_1_1platform_1_1remove__const.html">platform::remove_const</a>< Scalar_ >::type </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a1b025cb056729706f36469e74a9799dc">Scalar</a></td></tr>
|
|
<tr class="memdesc:a1b025cb056729706f36469e74a9799dc"><td class="mdescLeft"> </td><td class="mdescRight">The scalar. <a href="#a1b025cb056729706f36469e74a9799dc">More...</a><br /></td></tr>
|
|
<tr class="separator:a1b025cb056729706f36469e74a9799dc"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a1e72b69cf2147e4d194893a64417b920"><td class="memItemLeft" align="right" valign="top">typedef Scalar_ * </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a1e72b69cf2147e4d194893a64417b920">Pointer</a></td></tr>
|
|
<tr class="memdesc:a1e72b69cf2147e4d194893a64417b920"><td class="mdescLeft"> </td><td class="mdescRight">The pointer. <a href="#a1e72b69cf2147e4d194893a64417b920">More...</a><br /></td></tr>
|
|
<tr class="separator:a1e72b69cf2147e4d194893a64417b920"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:acb16feebdcad5bbebe9d4d3383c37899"><td class="memItemLeft" align="right" valign="top">typedef OutputTile_ </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#acb16feebdcad5bbebe9d4d3383c37899">OutputTile</a></td></tr>
|
|
<tr class="memdesc:acb16feebdcad5bbebe9d4d3383c37899"><td class="mdescLeft"> </td><td class="mdescRight">The dimension of the output tile. <a href="#acb16feebdcad5bbebe9d4d3383c37899">More...</a><br /></td></tr>
|
|
<tr class="separator:acb16feebdcad5bbebe9d4d3383c37899"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a4764f70691cb3fee91ce47653363aa4f"><td class="memItemLeft" align="right" valign="top">typedef Warps_ </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a4764f70691cb3fee91ce47653363aa4f">Warps</a></td></tr>
|
|
<tr class="memdesc:a4764f70691cb3fee91ce47653363aa4f"><td class="mdescLeft"> </td><td class="mdescRight">The warps in the tile. <a href="#a4764f70691cb3fee91ce47653363aa4f">More...</a><br /></td></tr>
|
|
<tr class="separator:a4764f70691cb3fee91ce47653363aa4f"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a9022ffc49b32503fd3639341e7e291a3"><td class="memItemLeft" align="right" valign="top">typedef ThreadsPerWarp_ </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a9022ffc49b32503fd3639341e7e291a3">ThreadsPerWarp</a></td></tr>
|
|
<tr class="memdesc:a9022ffc49b32503fd3639341e7e291a3"><td class="mdescLeft"> </td><td class="mdescRight">The threads in the warps. <a href="#a9022ffc49b32503fd3639341e7e291a3">More...</a><br /></td></tr>
|
|
<tr class="separator:a9022ffc49b32503fd3639341e7e291a3"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a63f980fea1ff3dd83ac276cfd83a4ce5"><td class="memItemLeft" align="right" valign="top">typedef <a class="el" href="structcutlass_1_1Shape.html">Shape</a>< 1, 2, <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#aa3e378cabce9ed7f199c179c15a12ca4">kScalarsPerRow</a>/<a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a8d308d593b59624abe3e228d588be61d">kAccessSize</a>, <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a8d308d593b59624abe3e228d588be61d">kAccessSize</a> > </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a63f980fea1ff3dd83ac276cfd83a4ce5">Tile</a></td></tr>
|
|
<tr class="separator:a63f980fea1ff3dd83ac276cfd83a4ce5"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a1b33700f904dd15e3533fec15d9d71bd"><td class="memItemLeft" align="right" valign="top">typedef <a class="el" href="structcutlass_1_1Shape.html">Shape</a>< <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a8663311646210b690bb0c2a1012e82f0">kIterationsD</a>, <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a3b1a461c1dfbcd3817ab2d57bd0da9f1">kIterationsH</a>, OutputTile::kW/kWarpSize/<a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a8d308d593b59624abe3e228d588be61d">kAccessSize</a>, Warps::kD > </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a1b33700f904dd15e3533fec15d9d71bd">Iterations</a></td></tr>
|
|
<tr class="memdesc:a1b33700f904dd15e3533fec15d9d71bd"><td class="mdescLeft"> </td><td class="mdescRight">The number of iterations needed to store the tile. <a href="#a1b33700f904dd15e3533fec15d9d71bd">More...</a><br /></td></tr>
|
|
<tr class="separator:a1b33700f904dd15e3533fec15d9d71bd"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a57b065abb737bee1c17398c90b5bc39b"><td class="memItemLeft" align="right" valign="top">typedef <a class="el" href="structcutlass_1_1Shape.html">Shape</a>< OutputTile::kW, <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#aa3e378cabce9ed7f199c179c15a12ca4">kScalarsPerRow</a>, kWarpSize *<a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a8d308d593b59624abe3e228d588be61d">kAccessSize</a>, <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a15438a44b588dc4cfd4b47c18af79cd2">kSplitK</a> > </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a57b065abb737bee1c17398c90b5bc39b">ImmediateOffsetStrides</a></td></tr>
|
|
<tr class="memdesc:a57b065abb737bee1c17398c90b5bc39b"><td class="mdescLeft"> </td><td class="mdescRight">The strides in each dimension between different loads/stores. <a href="#a57b065abb737bee1c17398c90b5bc39b">More...</a><br /></td></tr>
|
|
<tr class="separator:a57b065abb737bee1c17398c90b5bc39b"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a2cd23d3b5e2cb64c6d5e9b1d6a78fbce"><td class="memItemLeft" align="right" valign="top">typedef <a class="el" href="structcutlass_1_1Shape.html">Shape</a>< OutputTile::kW, <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#aa3e378cabce9ed7f199c179c15a12ca4">kScalarsPerRow</a>, kWarpSize *<a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a8d308d593b59624abe3e228d588be61d">kAccessSize</a>, <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a15438a44b588dc4cfd4b47c18af79cd2">kSplitK</a> > </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a2cd23d3b5e2cb64c6d5e9b1d6a78fbce">Delta</a></td></tr>
|
|
<tr class="memdesc:a2cd23d3b5e2cb64c6d5e9b1d6a78fbce"><td class="mdescLeft"> </td><td class="mdescRight">The strides in each dimension between different loads/stores. <a href="#a2cd23d3b5e2cb64c6d5e9b1d6a78fbce">More...</a><br /></td></tr>
|
|
<tr class="separator:a2cd23d3b5e2cb64c6d5e9b1d6a78fbce"><td class="memSeparator" colspan="2"> </td></tr>
|
|
</table><table class="memberdecls">
|
|
<tr class="heading"><td colspan="2"><h2 class="groupheader"><a name="pub-static-attribs"></a>
|
|
Static Public Attributes</h2></td></tr>
|
|
<tr class="memitem:a8d308d593b59624abe3e228d588be61d"><td class="memItemLeft" align="right" valign="top">static int const </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a8d308d593b59624abe3e228d588be61d">kAccessSize</a> = kScalarsPerLds_</td></tr>
|
|
<tr class="memdesc:a8d308d593b59624abe3e228d588be61d"><td class="mdescLeft"> </td><td class="mdescRight">The number of scalars per LDG/STG. <a href="#a8d308d593b59624abe3e228d588be61d">More...</a><br /></td></tr>
|
|
<tr class="separator:a8d308d593b59624abe3e228d588be61d"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a7e9ce187e12575f0ecd39b2bfe13dddf"><td class="memItemLeft" align="right" valign="top">static int const </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a7e9ce187e12575f0ecd39b2bfe13dddf">kSkew</a> = kSkew_</td></tr>
|
|
<tr class="memdesc:a7e9ce187e12575f0ecd39b2bfe13dddf"><td class="mdescLeft"> </td><td class="mdescRight">The skew. <a href="#a7e9ce187e12575f0ecd39b2bfe13dddf">More...</a><br /></td></tr>
|
|
<tr class="separator:a7e9ce187e12575f0ecd39b2bfe13dddf"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:afb4687520eff9c6a21c35a5e04f69de8"><td class="memItemLeft" align="right" valign="top">static <a class="el" href="structcutlass_1_1MemorySpace.html#a1e031ec41668015a8fe4ba2c1145d03c">MemorySpace::Kind</a> const </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#afb4687520eff9c6a21c35a5e04f69de8">kMemorySpace</a> = <a class="el" href="structcutlass_1_1MemorySpace.html#a1e031ec41668015a8fe4ba2c1145d03ca2804339b2be64ff68ae3042073aaa7cc">MemorySpace::kShared</a></td></tr>
|
|
<tr class="memdesc:afb4687520eff9c6a21c35a5e04f69de8"><td class="mdescLeft"> </td><td class="mdescRight">The memory space. <a href="#afb4687520eff9c6a21c35a5e04f69de8">More...</a><br /></td></tr>
|
|
<tr class="separator:afb4687520eff9c6a21c35a5e04f69de8"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:abb5fdb164b09c8f74f92278f3d68b95f"><td class="memItemLeft" align="right" valign="top">static int const </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#abb5fdb164b09c8f74f92278f3d68b95f">kScalarsPerThread</a> = OutputTile_::kW / Warps::kW / ThreadsPerWarp::kW</td></tr>
|
|
<tr class="memdesc:abb5fdb164b09c8f74f92278f3d68b95f"><td class="mdescLeft"> </td><td class="mdescRight">The number of scalars per thread. <a href="#abb5fdb164b09c8f74f92278f3d68b95f">More...</a><br /></td></tr>
|
|
<tr class="separator:abb5fdb164b09c8f74f92278f3d68b95f"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a8325bc9d56155ecb6f2ddbd56f4ed23d"><td class="memItemLeft" align="right" valign="top">static int const </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a8325bc9d56155ecb6f2ddbd56f4ed23d">kThreads</a> = <a class="el" href="structcutlass_1_1ShapeCount.html">ShapeCount</a><<a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a4764f70691cb3fee91ce47653363aa4f">Warps</a>>::kCount * kWarpSize</td></tr>
|
|
<tr class="memdesc:a8325bc9d56155ecb6f2ddbd56f4ed23d"><td class="mdescLeft"> </td><td class="mdescRight">The number of threads. <a href="#a8325bc9d56155ecb6f2ddbd56f4ed23d">More...</a><br /></td></tr>
|
|
<tr class="separator:a8325bc9d56155ecb6f2ddbd56f4ed23d"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:aa3e378cabce9ed7f199c179c15a12ca4"><td class="memItemLeft" align="right" valign="top">static int const </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#aa3e378cabce9ed7f199c179c15a12ca4">kScalarsPerRow</a> = <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a8325bc9d56155ecb6f2ddbd56f4ed23d">kThreads</a> / 2 * <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#abb5fdb164b09c8f74f92278f3d68b95f">kScalarsPerThread</a> + <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a7e9ce187e12575f0ecd39b2bfe13dddf">kSkew</a></td></tr>
|
|
<tr class="memdesc:aa3e378cabce9ed7f199c179c15a12ca4"><td class="mdescLeft"> </td><td class="mdescRight">The number of scalars per row. We build a tile with 2 rows (to avoid bank conflicts). <a href="#aa3e378cabce9ed7f199c179c15a12ca4">More...</a><br /></td></tr>
|
|
<tr class="separator:aa3e378cabce9ed7f199c179c15a12ca4"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a4b8d66df02ba1653aa6d1f23b967f237"><td class="memItemLeft" align="right" valign="top">static int const </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a4b8d66df02ba1653aa6d1f23b967f237">kIterationsInHPerWarp</a> = kTileH_ / <a class="el" href="structcutlass_1_1ShapeCount.html">ShapeCount</a><<a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a4764f70691cb3fee91ce47653363aa4f">Warps</a>>::kCount</td></tr>
|
|
<tr class="separator:a4b8d66df02ba1653aa6d1f23b967f237"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a3b1a461c1dfbcd3817ab2d57bd0da9f1"><td class="memItemLeft" align="right" valign="top">static int const </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a3b1a461c1dfbcd3817ab2d57bd0da9f1">kIterationsH</a> = <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a4b8d66df02ba1653aa6d1f23b967f237">kIterationsInHPerWarp</a> == 1 ? 1 : 2</td></tr>
|
|
<tr class="separator:a3b1a461c1dfbcd3817ab2d57bd0da9f1"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a8663311646210b690bb0c2a1012e82f0"><td class="memItemLeft" align="right" valign="top">static int const </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a8663311646210b690bb0c2a1012e82f0">kIterationsD</a> = <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a4b8d66df02ba1653aa6d1f23b967f237">kIterationsInHPerWarp</a> / <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a3b1a461c1dfbcd3817ab2d57bd0da9f1">kIterationsH</a></td></tr>
|
|
<tr class="separator:a8663311646210b690bb0c2a1012e82f0"><td class="memSeparator" colspan="2"> </td></tr>
|
|
<tr class="memitem:a15438a44b588dc4cfd4b47c18af79cd2"><td class="memItemLeft" align="right" valign="top">static int const </td><td class="memItemRight" valign="bottom"><a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a15438a44b588dc4cfd4b47c18af79cd2">kSplitK</a> = OutputTile::kW * ThreadsPerWarp::kH / 2 * Warps::kH</td></tr>
|
|
<tr class="separator:a15438a44b588dc4cfd4b47c18af79cd2"><td class="memSeparator" colspan="2"> </td></tr>
|
|
</table>
|
|
<h2 class="groupheader">Member Typedef Documentation</h2>
|
|
<a id="a2cd23d3b5e2cb64c6d5e9b1d6a78fbce"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a2cd23d3b5e2cb64c6d5e9b1d6a78fbce">◆ </a></span>Delta</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template&lt;typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0&gt; </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef <a class="el" href="structcutlass_1_1Shape.html">Shape</a>&lt;OutputTile::kW, <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#aa3e378cabce9ed7f199c179c15a12ca4">kScalarsPerRow</a>, kWarpSize * <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a8d308d593b59624abe3e228d588be61d">kAccessSize</a>, <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a15438a44b588dc4cfd4b47c18af79cd2">kSplitK</a>&gt; <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">cutlass::gemm::GemmSharedLoadTileDTraits</a>&lt; Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ &gt;::<a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a2cd23d3b5e2cb64c6d5e9b1d6a78fbce">Delta</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a57b065abb737bee1c17398c90b5bc39b"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a57b065abb737bee1c17398c90b5bc39b">◆ </a></span>ImmediateOffsetStrides</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template&lt;typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0&gt; </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef <a class="el" href="structcutlass_1_1Shape.html">Shape</a>&lt;OutputTile::kW, <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#aa3e378cabce9ed7f199c179c15a12ca4">kScalarsPerRow</a>, kWarpSize * <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a8d308d593b59624abe3e228d588be61d">kAccessSize</a>, <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a15438a44b588dc4cfd4b47c18af79cd2">kSplitK</a>&gt; <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">cutlass::gemm::GemmSharedLoadTileDTraits</a>&lt; Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ &gt;::<a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a57b065abb737bee1c17398c90b5bc39b">ImmediateOffsetStrides</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a1b33700f904dd15e3533fec15d9d71bd"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a1b33700f904dd15e3533fec15d9d71bd">◆ </a></span>Iterations</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template&lt;typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0&gt; </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef <a class="el" href="structcutlass_1_1Shape.html">Shape</a><<a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a8663311646210b690bb0c2a1012e82f0">kIterationsD</a>, <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a3b1a461c1dfbcd3817ab2d57bd0da9f1">kIterationsH</a>, OutputTile::kW / kWarpSize / <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a8d308d593b59624abe3e228d588be61d">kAccessSize</a>, Warps::kD> <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">cutlass::gemm::GemmSharedLoadTileDTraits</a>< Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ >::<a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a1b33700f904dd15e3533fec15d9d71bd">Iterations</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="acb16feebdcad5bbebe9d4d3383c37899"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#acb16feebdcad5bbebe9d4d3383c37899">◆ </a></span>OutputTile</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template&lt;typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0&gt; </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef OutputTile_ <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">cutlass::gemm::GemmSharedLoadTileDTraits</a>< Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ >::<a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#acb16feebdcad5bbebe9d4d3383c37899">OutputTile</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a1e72b69cf2147e4d194893a64417b920"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a1e72b69cf2147e4d194893a64417b920">◆ </a></span>Pointer</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template&lt;typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0&gt; </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef Scalar_* <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">cutlass::gemm::GemmSharedLoadTileDTraits</a>< Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ >::<a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a1e72b69cf2147e4d194893a64417b920">Pointer</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a1b025cb056729706f36469e74a9799dc"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a1b025cb056729706f36469e74a9799dc">◆ </a></span>Scalar</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template&lt;typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0&gt; </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef <a class="el" href="structcutlass_1_1platform_1_1remove__const.html">platform::remove_const</a>&lt;Scalar_&gt;::type <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">cutlass::gemm::GemmSharedLoadTileDTraits</a>&lt; Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ &gt;::<a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a1b025cb056729706f36469e74a9799dc">Scalar</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a9022ffc49b32503fd3639341e7e291a3"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a9022ffc49b32503fd3639341e7e291a3">◆ </a></span>ThreadsPerWarp</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template&lt;typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0&gt; </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef ThreadsPerWarp_ <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">cutlass::gemm::GemmSharedLoadTileDTraits</a>< Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ >::<a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a9022ffc49b32503fd3639341e7e291a3">ThreadsPerWarp</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a63f980fea1ff3dd83ac276cfd83a4ce5"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a63f980fea1ff3dd83ac276cfd83a4ce5">◆ </a></span>Tile</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template&lt;typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0&gt; </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef <a class="el" href="structcutlass_1_1Shape.html">Shape</a><1, 2, <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#aa3e378cabce9ed7f199c179c15a12ca4">kScalarsPerRow</a> / <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a8d308d593b59624abe3e228d588be61d">kAccessSize</a>, <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a8d308d593b59624abe3e228d588be61d">kAccessSize</a>> <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">cutlass::gemm::GemmSharedLoadTileDTraits</a>< Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ >::<a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a63f980fea1ff3dd83ac276cfd83a4ce5">Tile</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
<p>The tile. We have 2 rows of scalars. We use those two rows to make sure we do not have bank conflicts in the epilogue. </p>
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a4764f70691cb3fee91ce47653363aa4f"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a4764f70691cb3fee91ce47653363aa4f">◆ </a></span>Warps</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template&lt;typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0&gt; </div>
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">typedef Warps_ <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">cutlass::gemm::GemmSharedLoadTileDTraits</a>< Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ >::<a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a4764f70691cb3fee91ce47653363aa4f">Warps</a></td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<h2 class="groupheader">Member Data Documentation</h2>
|
|
<a id="a8d308d593b59624abe3e228d588be61d"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a8d308d593b59624abe3e228d588be61d">◆ </a></span>kAccessSize</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template&lt;typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0&gt; </div>
|
|
<table class="mlabels">
|
|
<tr>
|
|
<td class="mlabels-left">
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">int const <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">cutlass::gemm::GemmSharedLoadTileDTraits</a>< Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ >::kAccessSize = kScalarsPerLds_</td>
|
|
</tr>
|
|
</table>
|
|
</td>
|
|
<td class="mlabels-right">
|
|
<span class="mlabels"><span class="mlabel">static</span></span> </td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a8663311646210b690bb0c2a1012e82f0"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a8663311646210b690bb0c2a1012e82f0">◆ </a></span>kIterationsD</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template&lt;typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0&gt; </div>
|
|
<table class="mlabels">
|
|
<tr>
|
|
<td class="mlabels-left">
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">int const <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">cutlass::gemm::GemmSharedLoadTileDTraits</a>&lt; Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ &gt;::kIterationsD = <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a4b8d66df02ba1653aa6d1f23b967f237">kIterationsInHPerWarp</a> / <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a3b1a461c1dfbcd3817ab2d57bd0da9f1">kIterationsH</a></td>
|
|
</tr>
|
|
</table>
|
|
</td>
|
|
<td class="mlabels-right">
|
|
<span class="mlabels"><span class="mlabel">static</span></span> </td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a3b1a461c1dfbcd3817ab2d57bd0da9f1"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a3b1a461c1dfbcd3817ab2d57bd0da9f1">◆ </a></span>kIterationsH</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template&lt;typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0&gt; </div>
|
|
<table class="mlabels">
|
|
<tr>
|
|
<td class="mlabels-left">
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">int const <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">cutlass::gemm::GemmSharedLoadTileDTraits</a>&lt; Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ &gt;::kIterationsH = <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a4b8d66df02ba1653aa6d1f23b967f237">kIterationsInHPerWarp</a> == 1 ? 1 : 2</td>
|
|
</tr>
|
|
</table>
|
|
</td>
|
|
<td class="mlabels-right">
|
|
<span class="mlabels"><span class="mlabel">static</span></span> </td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a4b8d66df02ba1653aa6d1f23b967f237"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a4b8d66df02ba1653aa6d1f23b967f237">◆ </a></span>kIterationsInHPerWarp</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template&lt;typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0&gt; </div>
|
|
<table class="mlabels">
|
|
<tr>
|
|
<td class="mlabels-left">
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">int const <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">cutlass::gemm::GemmSharedLoadTileDTraits</a>&lt; Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ &gt;::kIterationsInHPerWarp = kTileH_ / <a class="el" href="structcutlass_1_1ShapeCount.html">ShapeCount</a>&lt;<a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a4764f70691cb3fee91ce47653363aa4f">Warps</a>&gt;::kCount</td>
|
|
</tr>
|
|
</table>
|
|
</td>
|
|
<td class="mlabels-right">
|
|
<span class="mlabels"><span class="mlabel">static</span></span> </td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="afb4687520eff9c6a21c35a5e04f69de8"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#afb4687520eff9c6a21c35a5e04f69de8">◆ </a></span>kMemorySpace</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template&lt;typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0&gt; </div>
|
|
<table class="mlabels">
|
|
<tr>
|
|
<td class="mlabels-left">
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname"><a class="el" href="structcutlass_1_1MemorySpace.html#a1e031ec41668015a8fe4ba2c1145d03c">MemorySpace::Kind</a> const <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">cutlass::gemm::GemmSharedLoadTileDTraits</a>&lt; Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ &gt;::kMemorySpace = <a class="el" href="structcutlass_1_1MemorySpace.html#a1e031ec41668015a8fe4ba2c1145d03ca2804339b2be64ff68ae3042073aaa7cc">MemorySpace::kShared</a></td>
|
|
</tr>
|
|
</table>
|
|
</td>
|
|
<td class="mlabels-right">
|
|
<span class="mlabels"><span class="mlabel">static</span></span> </td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="aa3e378cabce9ed7f199c179c15a12ca4"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#aa3e378cabce9ed7f199c179c15a12ca4">◆ </a></span>kScalarsPerRow</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template&lt;typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0&gt; </div>
|
|
<table class="mlabels">
|
|
<tr>
|
|
<td class="mlabels-left">
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">int const <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">cutlass::gemm::GemmSharedLoadTileDTraits</a>&lt; Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ &gt;::kScalarsPerRow = <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a8325bc9d56155ecb6f2ddbd56f4ed23d">kThreads</a> / 2 * <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#abb5fdb164b09c8f74f92278f3d68b95f">kScalarsPerThread</a> + <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a7e9ce187e12575f0ecd39b2bfe13dddf">kSkew</a></td>
|
|
</tr>
|
|
</table>
|
|
</td>
|
|
<td class="mlabels-right">
|
|
<span class="mlabels"><span class="mlabel">static</span></span> </td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="abb5fdb164b09c8f74f92278f3d68b95f"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#abb5fdb164b09c8f74f92278f3d68b95f">◆ </a></span>kScalarsPerThread</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template&lt;typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0&gt; </div>
|
|
<table class="mlabels">
|
|
<tr>
|
|
<td class="mlabels-left">
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">int const <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">cutlass::gemm::GemmSharedLoadTileDTraits</a>&lt; Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ &gt;::kScalarsPerThread = OutputTile_::kW / Warps::kW / ThreadsPerWarp::kW</td>
|
|
</tr>
|
|
</table>
|
|
</td>
|
|
<td class="mlabels-right">
|
|
<span class="mlabels"><span class="mlabel">static</span></span> </td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a7e9ce187e12575f0ecd39b2bfe13dddf"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a7e9ce187e12575f0ecd39b2bfe13dddf">◆ </a></span>kSkew</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template&lt;typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0&gt; </div>
|
|
<table class="mlabels">
|
|
<tr>
|
|
<td class="mlabels-left">
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">int const <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">cutlass::gemm::GemmSharedLoadTileDTraits</a>&lt; Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ &gt;::kSkew = kSkew_</td>
|
|
</tr>
|
|
</table>
|
|
</td>
|
|
<td class="mlabels-right">
|
|
<span class="mlabels"><span class="mlabel">static</span></span> </td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a15438a44b588dc4cfd4b47c18af79cd2"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a15438a44b588dc4cfd4b47c18af79cd2">◆ </a></span>kSplitK</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template&lt;typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0&gt; </div>
|
|
<table class="mlabels">
|
|
<tr>
|
|
<td class="mlabels-left">
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">int const <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">cutlass::gemm::GemmSharedLoadTileDTraits</a>&lt; Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ &gt;::kSplitK = OutputTile::kW * ThreadsPerWarp::kH / 2 * Warps::kH</td>
|
|
</tr>
|
|
</table>
|
|
</td>
|
|
<td class="mlabels-right">
|
|
<span class="mlabels"><span class="mlabel">static</span></span> </td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<a id="a8325bc9d56155ecb6f2ddbd56f4ed23d"></a>
|
|
<h2 class="memtitle"><span class="permalink"><a href="#a8325bc9d56155ecb6f2ddbd56f4ed23d">◆ </a></span>kThreads</h2>
|
|
|
|
<div class="memitem">
|
|
<div class="memproto">
|
|
<div class="memtemplate">
|
|
template&lt;typename Scalar_ , typename OutputTile_ , typename Warps_ , typename ThreadsPerWarp_ , int kTileH_, int kScalarsPerLds_, int kSkew_ = 0&gt; </div>
|
|
<table class="mlabels">
|
|
<tr>
|
|
<td class="mlabels-left">
|
|
<table class="memname">
|
|
<tr>
|
|
<td class="memname">int const <a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html">cutlass::gemm::GemmSharedLoadTileDTraits</a>&lt; Scalar_, OutputTile_, Warps_, ThreadsPerWarp_, kTileH_, kScalarsPerLds_, kSkew_ &gt;::kThreads = <a class="el" href="structcutlass_1_1ShapeCount.html">ShapeCount</a>&lt;<a class="el" href="structcutlass_1_1gemm_1_1GemmSharedLoadTileDTraits.html#a4764f70691cb3fee91ce47653363aa4f">Warps</a>&gt;::kCount * kWarpSize</td>
|
|
</tr>
|
|
</table>
|
|
</td>
|
|
<td class="mlabels-right">
|
|
<span class="mlabels"><span class="mlabel">static</span></span> </td>
|
|
</tr>
|
|
</table>
|
|
</div><div class="memdoc">
|
|
|
|
</div>
|
|
</div>
|
|
<hr/>The documentation for this struct was generated from the following file:<ul>
|
|
<li><a class="el" href="gemm__shared__tile_8h_source.html">gemm_shared_tile.h</a></li>
|
|
</ul>
|
|
</div><!-- contents -->
|
|
<!-- start footer part -->
|
|
<hr class="footer"/><address class="footer"><small>
|
|
Generated on Fri Oct 26 2018 14:53:39 for Cutlass by  <a href="http://www.doxygen.org/index.html">
|
|
<img class="footer" src="doxygen.png" alt="doxygen"/>
|
|
</a> 1.8.14
|
|
</small></address>
|
|
</body>
|
|
</html>
|