149 lines
75 KiB
HTML
149 lines
75 KiB
HTML
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
|
|
<html xmlns="http://www.w3.org/1999/xhtml">
|
|
<head>
<!-- Document metadata: character encoding, IE document mode, generator tag and viewport. -->
<meta http-equiv="Content-Type" content="text/xhtml;charset=UTF-8"/>
<meta http-equiv="X-UA-Compatible" content="IE=9"/>
<meta name="generator" content="Doxygen 1.8.14"/>
<meta name="viewport" content="width=device-width, initial-scale=1"/>
<title>Cutlass: gemm_global_stream.h Source File</title>
<!-- Stylesheets and scripts shipped alongside this page (relative paths). -->
<link href="tabs.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="jquery.js"></script>
<script type="text/javascript" src="dynsections.js"></script>
<link href="search/search.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="search/searchdata.js"></script>
<script type="text/javascript" src="search/search.js"></script>
<!-- MathJax configuration: tex2jax extension, TeX input, HTML-CSS output.
     This script body must contain only JavaScript; stray separator characters
     here would make the configuration fail to parse. -->
<script type="text/x-mathjax-config">
  MathJax.Hub.Config({
    extensions: ["tex2jax.js"],
    jax: ["input/TeX","output/HTML-CSS"],
});
</script>
<!-- MathJax is fetched over HTTPS from jsDelivr. The former cdn.mathjax.org host
     has been retired, and a plain-HTTP script is blocked as mixed content when
     this page itself is served over HTTPS. -->
<script type="text/javascript" async src="https://cdn.jsdelivr.net/npm/mathjax@2/MathJax.js"></script>
<link href="doxygen.css" rel="stylesheet" type="text/css" />
</head>
|
|
<body>
|
|
<div id="top"><!-- do not remove this div, it is closed by doxygen! -->
|
|
<div id="titlearea">
<!-- Project banner. The table below exists only for layout, so it is marked
     role="presentation" to stop assistive technology announcing it as a data table. -->
<table cellspacing="0" cellpadding="0" role="presentation">
 <tbody>
 <tr style="height: 56px;">
  <td id="projectalign" style="padding-left: 0.5em;">
   <div id="projectname">Cutlass
   </div>
   <div id="projectbrief">CUDA Templates for Linear Algebra Subroutines and Solvers</div>
  </td>
 </tr>
 </tbody>
</table>
</div>
|
|
<!-- end header part -->
|
|
<!-- Generated by Doxygen 1.8.14 -->
|
|
<script type="text/javascript">
/* @license magnet:?xt=urn:btih:cf05388f2679ee054f2beb29a391d25f4e673ac3&dn=gpl-2.0.txt GPL-v2 */
/* Global search controller. The inline event handlers on #MSearchSelectWindow
   call methods on this object, so it must be defined before they can fire. */
var searchBox = new SearchBox("searchBox", "search",false,'Search');
/* @license-end */
</script>
|
|
<script type="text/javascript" src="menudata.js"></script>
<script type="text/javascript" src="menu.js"></script>
<script type="text/javascript">
/* @license magnet:?xt=urn:btih:cf05388f2679ee054f2beb29a391d25f4e673ac3&dn=gpl-2.0.txt GPL-v2 */
/* Runs once the DOM is ready: builds the menu first, then registers the
   search initialisation as a further ready callback. */
$(function() {
  initMenu('',true,false,'search.php','Search');
  $(document).ready(function() { init_search(); });
});
/* @license-end */</script>
|
|
<!-- Empty container for the main navigation; presumably populated by initMenu() from menu.js (not visible in this file), to be confirmed. -->
<div id="main-nav"></div>
|
|
<!-- window showing the filter options -->
|
|
<!-- Mouse and keyboard events on this element are forwarded to the global searchBox object.
     The start tag must hold only these attributes; stray separator tokens inside it
     would be parsed as junk attribute names. -->
<div id="MSearchSelectWindow"
     onmouseover="return searchBox.OnSearchSelectShow()"
     onmouseout="return searchBox.OnSearchSelectHide()"
     onkeydown="return searchBox.OnSearchSelectKey(event)">
</div>
|
|
|
|
<!-- iframe showing the search results (closed by default) -->
|
|
<div id="MSearchResultsWindow">
<!-- The title attribute gives the frame an accessible name, so screen-reader
     users can tell what it contains when moving between frames. -->
<iframe src="javascript:void(0)" frameborder="0"
        name="MSearchResults" id="MSearchResults" title="Search results">
</iframe>
</div>
|
|
|
|
<div id="nav-path" class="navpath">
  <!-- Breadcrumb links to the directory pages for cutlass and gemm. -->
  <ul>
<li class="navelem"><a class="el" href="dir_1417ee5ebebc309c36b7962f26a92c39.html">cutlass</a></li><li class="navelem"><a class="el" href="dir_18d6a367a3982a494d65599933fc67a3.html">gemm</a></li>  </ul>
</div>
|
|
</div><!-- top -->
|
|
<!-- Page heading: shows the name of the documented file. -->
<div class="header">
  <div class="headertitle">
<div class="title">gemm_global_stream.h</div>  </div>
</div><!--header-->
|
|
<div class="contents">
|
|
<a href="gemm__global__stream_8h.html">Go to the documentation of this file.</a><div class="fragment"><div class="line"><a name="l00001"></a><span class="lineno"> 1</span> <span class="comment">/***************************************************************************************************</span></div><div class="line"><a name="l00002"></a><span class="lineno"> 2</span> <span class="comment"> * Copyright (c) 2017-2018, NVIDIA CORPORATION. All rights reserved.</span></div><div class="line"><a name="l00003"></a><span class="lineno"> 3</span> <span class="comment"> *</span></div><div class="line"><a name="l00004"></a><span class="lineno"> 4</span> <span class="comment"> * Redistribution and use in source and binary forms, with or without modification, are permitted</span></div><div class="line"><a name="l00005"></a><span class="lineno"> 5</span> <span class="comment"> * provided that the following conditions are met:</span></div><div class="line"><a name="l00006"></a><span class="lineno"> 6</span> <span class="comment"> * * Redistributions of source code must retain the above copyright notice, this list of</span></div><div class="line"><a name="l00007"></a><span class="lineno"> 7</span> <span class="comment"> * conditions and the following disclaimer.</span></div><div class="line"><a name="l00008"></a><span class="lineno"> 8</span> <span class="comment"> * * Redistributions in binary form must reproduce the above copyright notice, this list of</span></div><div class="line"><a name="l00009"></a><span class="lineno"> 9</span> <span class="comment"> * conditions and the following disclaimer in the documentation and/or other materials</span></div><div class="line"><a name="l00010"></a><span class="lineno"> 10</span> <span class="comment"> * provided with the distribution.</span></div><div class="line"><a name="l00011"></a><span class="lineno"> 11</span> <span class="comment"> * * Neither the name of the NVIDIA CORPORATION nor the names of its contributors may be 
used</span></div><div class="line"><a name="l00012"></a><span class="lineno"> 12</span> <span class="comment"> * to endorse or promote products derived from this software without specific prior written</span></div><div class="line"><a name="l00013"></a><span class="lineno"> 13</span> <span class="comment"> * permission.</span></div><div class="line"><a name="l00014"></a><span class="lineno"> 14</span> <span class="comment"> *</span></div><div class="line"><a name="l00015"></a><span class="lineno"> 15</span> <span class="comment"> * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR</span></div><div class="line"><a name="l00016"></a><span class="lineno"> 16</span> <span class="comment"> * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND</span></div><div class="line"><a name="l00017"></a><span class="lineno"> 17</span> <span class="comment"> * FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE</span></div><div class="line"><a name="l00018"></a><span class="lineno"> 18</span> <span class="comment"> * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,</span></div><div class="line"><a name="l00019"></a><span class="lineno"> 19</span> <span class="comment"> * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;</span></div><div class="line"><a name="l00020"></a><span class="lineno"> 20</span> <span class="comment"> * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,</span></div><div class="line"><a name="l00021"></a><span class="lineno"> 21</span> <span class="comment"> * STRICT LIABILITY, OR TOR (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE</span></div><div class="line"><a name="l00022"></a><span class="lineno"> 22</span> <span class="comment"> * OF THIS SOFTWARE, EVEN IF ADVISED OF 
THE POSSIBILITY OF SUCH DAMAGE.</span></div><div class="line"><a name="l00023"></a><span class="lineno"> 23</span> <span class="comment"> *</span></div><div class="line"><a name="l00024"></a><span class="lineno"> 24</span> <span class="comment"> **************************************************************************************************/</span></div><div class="line"><a name="l00030"></a><span class="lineno"> 30</span> <span class="preprocessor">#pragma once</span></div><div class="line"><a name="l00031"></a><span class="lineno"> 31</span> </div><div class="line"><a name="l00032"></a><span class="lineno"> 32</span> <span class="preprocessor">#include "<a class="code" href="coord_8h.html">cutlass/coord.h</a>"</span></div><div class="line"><a name="l00033"></a><span class="lineno"> 33</span> <span class="preprocessor">#include "<a class="code" href="convert_8h.html">cutlass/convert.h</a>"</span></div><div class="line"><a name="l00034"></a><span class="lineno"> 34</span> <span class="preprocessor">#include "<a class="code" href="gemm__global__tile_8h.html">cutlass/gemm/gemm_global_tile.h</a>"</span></div><div class="line"><a name="l00035"></a><span class="lineno"> 35</span> <span class="preprocessor">#include "<a class="code" href="tile__allocation_8h.html">cutlass/tile_allocation.h</a>"</span></div><div class="line"><a name="l00036"></a><span class="lineno"> 36</span> </div><div class="line"><a name="l00037"></a><span class="lineno"> 37</span> <span class="keyword">namespace </span><a class="code" href="namespacecutlass.html">cutlass</a> {</div><div class="line"><a name="l00038"></a><span class="lineno"> 38</span> <span class="keyword">namespace </span>gemm {</div><div class="line"><a name="l00039"></a><span class="lineno"> 39</span> </div><div class="line"><a name="l00041"></a><span class="lineno"> 41</span> </div><div class="line"><a name="l00042"></a><span class="lineno"> 42</span> <span class="keyword">template</span> <</div><div class="line"><a 
name="l00044"></a><span class="lineno"> 44</span>  <a class="code" href="structcutlass_1_1GemmOperand.html#ab209ea3de198efabe8e8707dfe8e0a0c">GemmOperand::Kind</a> Operand,</div><div class="line"><a name="l00046"></a><span class="lineno"> 46</span>  <span class="keyword">typename</span> LoadIterator_,</div><div class="line"><a name="l00048"></a><span class="lineno"> 48</span>  <span class="keyword">typename</span> StoreIterator_,</div><div class="line"><a name="l00050"></a><span class="lineno"> 50</span>  <span class="keyword">typename</span> Transformer_></div><div class="line"><a name="l00051"></a><span class="lineno"> 51</span> </div><div class="line"><a name="l00052"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html"> 52</a></span> <span class="keyword">struct </span><a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html">GlobalLoadStream</a> {</div><div class="line"><a name="l00054"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a30113b850dfd3de60f8778bc7a66f700"> 54</a></span>  <span class="keyword">static</span> <a class="code" href="structcutlass_1_1GemmOperand.html#ab209ea3de198efabe8e8707dfe8e0a0c">GemmOperand::Kind</a> <span class="keyword">const</span> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a30113b850dfd3de60f8778bc7a66f700">kOperand</a> = Operand;</div><div class="line"><a name="l00056"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a905c219287a7342b2ddb58b84e413d64"> 56</a></span>  <span class="keyword">typedef</span> LoadIterator_ <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a905c219287a7342b2ddb58b84e413d64">LoadIterator</a>;</div><div class="line"><a name="l00058"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#aa79a27cbe2420882fbaca55e42803f02"> 58</a></span>  <span class="keyword">typedef</span> 
Transformer_ <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#aa79a27cbe2420882fbaca55e42803f02">Transformer</a>;</div><div class="line"><a name="l00060"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac16e31930c346068d7522dd8de9d93d2"> 60</a></span>  <span class="keyword">typedef</span> StoreIterator_ <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac16e31930c346068d7522dd8de9d93d2">StoreIterator</a>;</div><div class="line"><a name="l00061"></a><span class="lineno"> 61</span> </div><div class="line"><a name="l00063"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7d9b4339129c1ab4f21f1df1144faddf"> 63</a></span>  <span class="keyword">typedef</span> <span class="keyword">typename</span> LoadIterator::Fragment <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7d9b4339129c1ab4f21f1df1144faddf">FetchedFragment</a>;</div><div class="line"><a name="l00065"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a9eb2fb49698d0d018c04e7712e239ce9"> 65</a></span>  <span class="keyword">typedef</span> <span class="keyword">typename</span> Transformer::OutputFragment <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a9eb2fb49698d0d018c04e7712e239ce9">TransformedFragment</a>;</div><div class="line"><a name="l00067"></a><span class="lineno"> 67</span>  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>((<a class="code" href="structcutlass_1_1platform_1_1is__same.html">platform::is_same<FetchedFragment, typename Transformer::InputFragment>::value</a>),</div><div class="line"><a name="l00068"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ab7e315253b3301c191581bce05644106"> 68</a></span>  <span class="stringliteral">""</span>);</div><div class="line"><a name="l00070"></a><span 
class="lineno"> 70</span>  <span class="keyword">typedef</span> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a9eb2fb49698d0d018c04e7712e239ce9">TransformedFragment</a> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ab7e315253b3301c191581bce05644106">Fragment</a>;</div><div class="line"><a name="l00072"></a><span class="lineno"> 72</span>  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>((<a class="code" href="structcutlass_1_1platform_1_1is__same.html">platform::is_same<TransformedFragment, typename StoreIterator::Fragment>::value</a>),</div><div class="line"><a name="l00073"></a><span class="lineno"> 73</span>  <span class="stringliteral">""</span>);</div><div class="line"><a name="l00074"></a><span class="lineno"> 74</span> </div><div class="line"><a name="l00076"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac29cd1ba94e802762d665c300e22e7db"> 76</a></span>  <span class="keyword">static</span> <a class="code" href="namespacecutlass_1_1MatrixLayout.html#a97ef07af21b122c1804245b0c7784d2b">MatrixLayout::Kind</a> <span class="keyword">const</span> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac29cd1ba94e802762d665c300e22e7db">kLayout</a> = LoadIterator::kLayout;</div><div class="line"><a name="l00078"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7073b32c2cc62ffcad70a9ca46995c4c"> 78</a></span>  <span class="keyword">typedef</span> <span class="keyword">typename</span> LoadIterator::Scalar <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7073b32c2cc62ffcad70a9ca46995c4c">Scalar</a>;</div><div class="line"><a name="l00080"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac4452df991f57f9bb0b86dfd380179b2"> 80</a></span>  <span class="keyword">typedef</span> <span class="keyword">typename</span> 
LoadIterator::Pointer <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac4452df991f57f9bb0b86dfd380179b2">Pointer</a>;</div><div class="line"><a name="l00082"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7c46d6eb83b43e099d53784bb2a09f02"> 82</a></span>  <span class="keyword">typedef</span> <span class="keyword">typename</span> LoadIterator::Index <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7c46d6eb83b43e099d53784bb2a09f02">Index</a>;</div><div class="line"><a name="l00084"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ae033a49a784964e75a5c1b6135b21e47"> 84</a></span>  <span class="keyword">typedef</span> <span class="keyword">typename</span> LoadIterator::LongIndex <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ae033a49a784964e75a5c1b6135b21e47">LongIndex</a>;</div><div class="line"><a name="l00086"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a260543a618fb187c2da40c9f630925ec"> 86</a></span>  <span class="keyword">typedef</span> <span class="keyword">typename</span> LoadIterator::Tile <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a260543a618fb187c2da40c9f630925ec">Tile</a>;</div><div class="line"><a name="l00087"></a><span class="lineno"> 87</span> </div><div class="line"><a name="l00089"></a><span class="lineno"> 89</span>  <span class="keyword">typedef</span> <a class="code" href="structcutlass_1_1TileAllocation.html">TileAllocation<typename StoreIterator::Scalar, typename StoreIterator::Tile></a></div><div class="line"><a name="l00090"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a17804b01904a9a4ee7a857905833f7a8"> 90</a></span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a17804b01904a9a4ee7a857905833f7a8">ThreadblockTileStorage</a>;</div><div 
class="line"><a name="l00091"></a><span class="lineno"> 91</span> </div><div class="line"><a name="l00093"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a011287c8289b7b026f9993da663abd77"> 93</a></span>  <span class="keyword">typedef</span> <span class="keyword">typename</span> <a class="code" href="structcutlass_1_1TileAllocation.html#aa0bf6caeab13dc004350c6c0cfe0df80">ThreadblockTileStorage::TensorRef</a> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a011287c8289b7b026f9993da663abd77">ThreadblockTileRef</a>;</div><div class="line"><a name="l00094"></a><span class="lineno"> 94</span> </div><div class="line"><a name="l00096"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html"> 96</a></span>  <span class="keyword">struct </span><a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html">Params</a> {</div><div class="line"><a name="l00097"></a><span class="lineno"> 97</span>  <span class="comment">// The load iterator.</span></div><div class="line"><a name="l00098"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a46f2546f9b88f4fc87f1396d0f08b065"> 98</a></span>  <span class="keyword">typename</span> LoadIterator::Params <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a46f2546f9b88f4fc87f1396d0f08b065">load_iterator</a>;</div><div class="line"><a name="l00099"></a><span class="lineno"> 99</span> </div><div class="line"><a name="l00101"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#ab5d9e5de9b1cc3462920ce7a8f52bbec"> 101</a></span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ae033a49a784964e75a5c1b6135b21e47">LongIndex</a> <a class="code" 
href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#ab5d9e5de9b1cc3462920ce7a8f52bbec">batch_stride</a>;</div><div class="line"><a name="l00102"></a><span class="lineno"> 102</span> </div><div class="line"><a name="l00103"></a><span class="lineno"> 103</span>  <span class="comment">// The store iterator.</span></div><div class="line"><a name="l00104"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a289ac736c0c098ae6da6a21c9abfe63f"> 104</a></span>  <span class="keyword">typename</span> StoreIterator::Params <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a289ac736c0c098ae6da6a21c9abfe63f">store_iterator</a>;</div><div class="line"><a name="l00105"></a><span class="lineno"> 105</span> </div><div class="line"><a name="l00106"></a><span class="lineno"> 106</span>  <span class="comment">// Offset to residue.</span></div><div class="line"><a name="l00107"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a73bb518f85aee62310b3c886a1fba3f1"> 107</a></span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7c46d6eb83b43e099d53784bb2a09f02">Index</a> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a73bb518f85aee62310b3c886a1fba3f1">offset_to_residue</a>;</div><div class="line"><a name="l00108"></a><span class="lineno"> 108</span> </div><div class="line"><a name="l00109"></a><span class="lineno"> 109</span>  <span class="comment">// Offset to residue for the last partition</span></div><div class="line"><a name="l00110"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a7cad4eeadacc7efbfe9d2442997eeb82"> 110</a></span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7c46d6eb83b43e099d53784bb2a09f02">Index</a> <a class="code" 
href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a7cad4eeadacc7efbfe9d2442997eeb82">offset_to_residue_last_partition</a>;</div><div class="line"><a name="l00111"></a><span class="lineno"> 111</span> </div><div class="line"><a name="l00113"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#aeb306cd3cb97471774b425fb50a861ae"> 113</a></span>  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a> <span class="keywordtype">int</span> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#aeb306cd3cb97471774b425fb50a861ae">initialize</a>(<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac4452df991f57f9bb0b86dfd380179b2">Pointer</a> pointer,</div><div class="line"><a name="l00114"></a><span class="lineno"> 114</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ae033a49a784964e75a5c1b6135b21e47">LongIndex</a> batch_stride_,</div><div class="line"><a name="l00115"></a><span class="lineno"> 115</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7c46d6eb83b43e099d53784bb2a09f02">Index</a> ldm,</div><div class="line"><a name="l00116"></a><span class="lineno"> 116</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7c46d6eb83b43e099d53784bb2a09f02">Index</a> offset_to_residue_,</div><div class="line"><a name="l00117"></a><span class="lineno"> 117</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7c46d6eb83b43e099d53784bb2a09f02">Index</a> offset_to_residue_last_partition_) {</div><div class="line"><a name="l00118"></a><span class="lineno"> 118</span> </div><div class="line"><a name="l00119"></a><span class="lineno"> 119</span>  <span class="keywordtype">int</span> error_code = <a class="code" 
href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a46f2546f9b88f4fc87f1396d0f08b065">load_iterator</a>.initialize(pointer, ldm, ldm);</div><div class="line"><a name="l00120"></a><span class="lineno"> 120</span>  <span class="keywordflow">if</span> (error_code) {</div><div class="line"><a name="l00121"></a><span class="lineno"> 121</span>  <span class="keywordflow">return</span> error_code;</div><div class="line"><a name="l00122"></a><span class="lineno"> 122</span>  }</div><div class="line"><a name="l00123"></a><span class="lineno"> 123</span> </div><div class="line"><a name="l00124"></a><span class="lineno"> 124</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#ab5d9e5de9b1cc3462920ce7a8f52bbec">batch_stride</a> = batch_stride_;</div><div class="line"><a name="l00125"></a><span class="lineno"> 125</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a73bb518f85aee62310b3c886a1fba3f1">offset_to_residue</a> = offset_to_residue_;</div><div class="line"><a name="l00126"></a><span class="lineno"> 126</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a7cad4eeadacc7efbfe9d2442997eeb82">offset_to_residue_last_partition</a> = offset_to_residue_last_partition_;</div><div class="line"><a name="l00127"></a><span class="lineno"> 127</span> </div><div class="line"><a name="l00128"></a><span class="lineno"> 128</span>  <span class="keywordflow">return</span> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a289ac736c0c098ae6da6a21c9abfe63f">store_iterator</a>.initialize();</div><div class="line"><a name="l00129"></a><span class="lineno"> 129</span>  }</div><div class="line"><a name="l00130"></a><span class="lineno"> 130</span> </div><div class="line"><a name="l00131"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a9c0707b48565a522884cbd077aa299ee"> 131</a></span>  
CUTLASS_DEVICE <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7c46d6eb83b43e099d53784bb2a09f02">Index</a> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a9c0707b48565a522884cbd077aa299ee">get_offset_to_residue</a>() {</div><div class="line"><a name="l00132"></a><span class="lineno"> 132</span>  <span class="keywordflow">if</span> (blockIdx.z == gridDim.z - 1) { <span class="comment">//last partition</span></div><div class="line"><a name="l00133"></a><span class="lineno"> 133</span>  <span class="keywordflow">return</span> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a7cad4eeadacc7efbfe9d2442997eeb82">offset_to_residue_last_partition</a>;</div><div class="line"><a name="l00134"></a><span class="lineno"> 134</span>  }</div><div class="line"><a name="l00135"></a><span class="lineno"> 135</span>  <span class="keywordflow">else</span> {</div><div class="line"><a name="l00136"></a><span class="lineno"> 136</span>  <span class="keywordflow">return</span> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a73bb518f85aee62310b3c886a1fba3f1">offset_to_residue</a>;</div><div class="line"><a name="l00137"></a><span class="lineno"> 137</span>  }</div><div class="line"><a name="l00138"></a><span class="lineno"> 138</span>  }</div><div class="line"><a name="l00139"></a><span class="lineno"> 139</span>  };</div><div class="line"><a name="l00140"></a><span class="lineno"> 140</span> </div><div class="line"><a name="l00144"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1SharedStorage.html"> 144</a></span>  <span class="keyword">struct </span><a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1SharedStorage.html">SharedStorage</a> {};</div><div class="line"><a name="l00145"></a><span class="lineno"> 145</span> </div><div class="line"><a name="l00146"></a><span class="lineno"> 146</span>  <span 
class="comment">//</span></div><div class="line"><a name="l00147"></a><span class="lineno"> 147</span>  <span class="comment">// Static member functions</span></div><div class="line"><a name="l00148"></a><span class="lineno"> 148</span>  <span class="comment">//</span></div><div class="line"><a name="l00149"></a><span class="lineno"> 149</span> </div><div class="line"><a name="l00151"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a16542631e4a4562cc72aa50f146a9724"> 151</a></span>  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a> <span class="keyword">static</span> <a class="code" href="structcutlass_1_1Coord.html">Coord<3></a> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a16542631e4a4562cc72aa50f146a9724">project_coordinate</a>(<a class="code" href="structcutlass_1_1Coord.html">Coord<3></a> <span class="keyword">const</span>& coord, <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7c46d6eb83b43e099d53784bb2a09f02">Index</a> d_offset = 0) {</div><div class="line"><a name="l00152"></a><span class="lineno"> 152</span>  <span class="keywordtype">bool</span> <span class="keyword">const</span> kKstrided =</div><div class="line"><a name="l00153"></a><span class="lineno"> 153</span>  <a class="code" href="structcutlass_1_1gemm_1_1GemmMultiplicandTraits.html">GemmMultiplicandTraits<typename LoadIterator::Tile, kOperand, kLayout>::kKstrided</a>;</div><div class="line"><a name="l00154"></a><span class="lineno"> 154</span>  <a class="code" href="structcutlass_1_1Coord.html">Coord<3></a> tile_coord = <a class="code" href="structcutlass_1_1gemm_1_1ProjectOperand.html">ProjectOperand<kOperand, kKstrided>::project</a>(coord);</div><div class="line"><a name="l00155"></a><span class="lineno"> 155</span>  <span class="keywordflow">return</span> <a class="code" 
href="namespacecutlass.html#a7419519fa453a121dfa5f26bf87318d9">make_Coord</a>(</div><div class="line"><a name="l00156"></a><span class="lineno"> 156</span>  tile_coord[0] + d_offset, tile_coord[1], tile_coord[2] / LoadIterator::Tile::kC);</div><div class="line"><a name="l00157"></a><span class="lineno"> 157</span>  }</div><div class="line"><a name="l00158"></a><span class="lineno"> 158</span> </div><div class="line"><a name="l00160"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#aec86bdf5d7d4ad1f7b6ebebcf2da8395"> 160</a></span>  CUTLASS_DEVICE <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#aec86bdf5d7d4ad1f7b6ebebcf2da8395">GlobalLoadStream</a>(</div><div class="line"><a name="l00161"></a><span class="lineno"> 161</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html">Params</a> <span class="keyword">const</span>& _params,</div><div class="line"><a name="l00162"></a><span class="lineno"> 162</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1SharedStorage.html">SharedStorage</a>& shared_storage,</div><div class="line"><a name="l00163"></a><span class="lineno"> 163</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a011287c8289b7b026f9993da663abd77">ThreadblockTileRef</a> <span class="keyword">const</span>& threadblock_tile_ref,</div><div class="line"><a name="l00164"></a><span class="lineno"> 164</span>  <a class="code" href="structcutlass_1_1Coord.html">Coord<3></a> <span class="keyword">const</span> bounds,</div><div class="line"><a name="l00165"></a><span class="lineno"> 165</span>  <a class="code" href="structcutlass_1_1Coord.html">Coord<3></a> <span class="keyword">const</span>& _threadblock_offset)</div><div class="line"><a name="l00166"></a><span class="lineno"> 166</span>  : <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac8ff1a3e10b25c212cd3cf5ed997fc0e">params</a>(_params),</div><div 
class="line"><a name="l00167"></a><span class="lineno"> 167</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a563961c326d2e55f5b8682a30b64a24a">threadblock_offset</a>(<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a16542631e4a4562cc72aa50f146a9724">project_coordinate</a>(_threadblock_offset)),</div><div class="line"><a name="l00168"></a><span class="lineno"> 168</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a386f2f4d2e239075f0fe1489ed7788c1">multiplicand_bounds</a>(<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a16542631e4a4562cc72aa50f146a9724">project_coordinate</a>(bounds, 1)),</div><div class="line"><a name="l00169"></a><span class="lineno"> 169</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a5ef4cc42c7cec73523550e5ea56df88c">load_iterator</a>(<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac8ff1a3e10b25c212cd3cf5ed997fc0e">params</a>.<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a5ef4cc42c7cec73523550e5ea56df88c">load_iterator</a>, <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a563961c326d2e55f5b8682a30b64a24a">threadblock_offset</a>),</div><div class="line"><a name="l00170"></a><span class="lineno"> 170</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ab68ba57fe69430c557379b3457faebc4">transformer</a>(),</div><div class="line"><a name="l00171"></a><span class="lineno"> 171</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a45a4bceb72fcb856e32eaa20eec11e9d">store_iterator</a>(<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac8ff1a3e10b25c212cd3cf5ed997fc0e">params</a>.<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a45a4bceb72fcb856e32eaa20eec11e9d">store_iterator</a>, threadblock_tile_ref.data()) {</div><div class="line"><a name="l00172"></a><span class="lineno"> 
172</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a5ef4cc42c7cec73523550e5ea56df88c">load_iterator</a>.initialize_predicates(<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a386f2f4d2e239075f0fe1489ed7788c1">multiplicand_bounds</a>, <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a563961c326d2e55f5b8682a30b64a24a">threadblock_offset</a>);</div><div class="line"><a name="l00173"></a><span class="lineno"> 173</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a1c117b87024937f1dc3da128795b6e03">fetched_fragment</a>.clear();</div><div class="line"><a name="l00174"></a><span class="lineno"> 174</span>  }</div><div class="line"><a name="l00175"></a><span class="lineno"> 175</span> </div><div class="line"><a name="l00176"></a><span class="lineno"> 176</span> </div><div class="line"><a name="l00178"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a3784dbb3efe0865ffa946419111c824a"> 178</a></span>  CUTLASS_DEVICE <span class="keywordtype">void</span> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a3784dbb3efe0865ffa946419111c824a">copy</a>() {</div><div class="line"><a name="l00179"></a><span class="lineno"> 179</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a5ef4cc42c7cec73523550e5ea56df88c">load_iterator</a>.load_post_increment(<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a1c117b87024937f1dc3da128795b6e03">fetched_fragment</a>);</div><div class="line"><a name="l00180"></a><span class="lineno"> 180</span>  }</div><div class="line"><a name="l00181"></a><span class="lineno"> 181</span> </div><div class="line"><a name="l00183"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ab39c82ac1a8138c4b6d69dab9d48bdbc"> 183</a></span>  CUTLASS_DEVICE <span class="keywordtype">void</span> <a class="code" 
href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ab39c82ac1a8138c4b6d69dab9d48bdbc">commit</a>() {</div><div class="line"><a name="l00184"></a><span class="lineno"> 184</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ab68ba57fe69430c557379b3457faebc4">transformer</a>.transform(<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a1c117b87024937f1dc3da128795b6e03">fetched_fragment</a>, <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7d7042e60aaab0dd00772b239e1f1db1">transformed_fragment</a>);</div><div class="line"><a name="l00185"></a><span class="lineno"> 185</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a45a4bceb72fcb856e32eaa20eec11e9d">store_iterator</a>.store_post_increment(<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7d7042e60aaab0dd00772b239e1f1db1">transformed_fragment</a>);</div><div class="line"><a name="l00186"></a><span class="lineno"> 186</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a45a4bceb72fcb856e32eaa20eec11e9d">store_iterator</a>.inc_stage();</div><div class="line"><a name="l00187"></a><span class="lineno"> 187</span>  }</div><div class="line"><a name="l00188"></a><span class="lineno"> 188</span> </div><div class="line"><a name="l00190"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a235adaea5d4f01232c79cb6109dc6d17"> 190</a></span>  CUTLASS_DEVICE <span class="keywordtype">void</span> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a235adaea5d4f01232c79cb6109dc6d17">residue</a>(<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7c46d6eb83b43e099d53784bb2a09f02">Index</a> k, <span class="keywordtype">bool</span> skip_clear = <span class="keyword">false</span>) {</div><div class="line"><a name="l00191"></a><span class="lineno"> 191</span>  <a class="code" 
href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a5ef4cc42c7cec73523550e5ea56df88c">load_iterator</a>.residue(k);</div><div class="line"><a name="l00192"></a><span class="lineno"> 192</span>  <span class="keywordflow">if</span> (!skip_clear) {</div><div class="line"><a name="l00193"></a><span class="lineno"> 193</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a1c117b87024937f1dc3da128795b6e03">fetched_fragment</a>.clear();</div><div class="line"><a name="l00194"></a><span class="lineno"> 194</span>  }</div><div class="line"><a name="l00195"></a><span class="lineno"> 195</span>  }</div><div class="line"><a name="l00196"></a><span class="lineno"> 196</span> </div><div class="line"><a name="l00198"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac269a9280a55d3988ca60f571bdf7f29"> 198</a></span>  CUTLASS_DEVICE <span class="keywordtype">void</span> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac269a9280a55d3988ca60f571bdf7f29">move_to_residue</a>(<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7c46d6eb83b43e099d53784bb2a09f02">Index</a> k, <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7c46d6eb83b43e099d53784bb2a09f02">Index</a> kTileK) {</div><div class="line"><a name="l00199"></a><span class="lineno"> 199</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7c46d6eb83b43e099d53784bb2a09f02">Index</a> kResidue = k % kTileK;</div><div class="line"><a name="l00200"></a><span class="lineno"> 200</span>  <span class="keywordflow">if</span> (kResidue) {</div><div class="line"><a name="l00201"></a><span class="lineno"> 201</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a235adaea5d4f01232c79cb6109dc6d17">residue</a>(kResidue);</div><div class="line"><a name="l00202"></a><span class="lineno"> 202</span>  <a class="code" 
href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7c46d6eb83b43e099d53784bb2a09f02">Index</a> this_offset_residue = <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac8ff1a3e10b25c212cd3cf5ed997fc0e">params</a>.<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a9c0707b48565a522884cbd077aa299ee">get_offset_to_residue</a>();</div><div class="line"><a name="l00203"></a><span class="lineno"> 203</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a5ef4cc42c7cec73523550e5ea56df88c">load_iterator</a>.add_pointer_offset(this_offset_residue * <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a5ef4cc42c7cec73523550e5ea56df88c">load_iterator</a>.stride_advance());</div><div class="line"><a name="l00204"></a><span class="lineno"> 204</span>  }</div><div class="line"><a name="l00205"></a><span class="lineno"> 205</span>  }</div><div class="line"><a name="l00206"></a><span class="lineno"> 206</span> </div><div class="line"><a name="l00208"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a1e2eecdba1871fc11aa43a06edf6ed34"> 208</a></span>  CUTLASS_DEVICE <span class="keywordtype">void</span> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a1e2eecdba1871fc11aa43a06edf6ed34">rollback</a>(<span class="keywordtype">void</span>) {</div><div class="line"><a name="l00209"></a><span class="lineno"> 209</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a5ef4cc42c7cec73523550e5ea56df88c">load_iterator</a>.initialize_predicates(<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a386f2f4d2e239075f0fe1489ed7788c1">multiplicand_bounds</a>, <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a563961c326d2e55f5b8682a30b64a24a">threadblock_offset</a>);</div><div class="line"><a name="l00210"></a><span class="lineno"> 210</span> </div><div class="line"><a 
name="l00211"></a><span class="lineno"> 211</span>  <span class="keywordtype">int</span> <span class="keyword">const</span> kBlock = <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a30113b850dfd3de60f8778bc7a66f700">kOperand</a> == <a class="code" href="structcutlass_1_1GemmOperand.html#ab209ea3de198efabe8e8707dfe8e0a0cac2b9fe9e3679a059d1a6c946b2a2c31a">GemmOperand::kA</a></div><div class="line"><a name="l00212"></a><span class="lineno"> 212</span>  ? (<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac29cd1ba94e802762d665c300e22e7db">kLayout</a> == <a class="code" href="namespacecutlass_1_1MatrixLayout.html#a97ef07af21b122c1804245b0c7784d2bac15988acba79c11072d38b295f163a2b">MatrixLayout::kColumnMajor</a> ? Tile::kH : Tile::kW)</div><div class="line"><a name="l00213"></a><span class="lineno"> 213</span>  : (<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac29cd1ba94e802762d665c300e22e7db">kLayout</a> == <a class="code" href="namespacecutlass_1_1MatrixLayout.html#a97ef07af21b122c1804245b0c7784d2ba6a287c17f9f5bf53528ae68296beeedb">MatrixLayout::kRowMajor</a> ? 
Tile::kH : Tile::kW);</div><div class="line"><a name="l00214"></a><span class="lineno"> 214</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7c46d6eb83b43e099d53784bb2a09f02">Index</a> this_offset_residue = <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac8ff1a3e10b25c212cd3cf5ed997fc0e">params</a>.<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a9c0707b48565a522884cbd077aa299ee">get_offset_to_residue</a>();</div><div class="line"><a name="l00215"></a><span class="lineno"> 215</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a5ef4cc42c7cec73523550e5ea56df88c">load_iterator</a>.add_pointer_offset(-(this_offset_residue + kBlock) *</div><div class="line"><a name="l00216"></a><span class="lineno"> 216</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a5ef4cc42c7cec73523550e5ea56df88c">load_iterator</a>.stride_advance());</div><div class="line"><a name="l00217"></a><span class="lineno"> 217</span>  }</div><div class="line"><a name="l00218"></a><span class="lineno"> 218</span> </div><div class="line"><a name="l00220"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a8e79a153de72eef10d90bfd02b5dd27e"> 220</a></span>  CUTLASS_DEVICE <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html">GlobalLoadStream</a> &<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a8e79a153de72eef10d90bfd02b5dd27e">operator+=</a>(<a class="code" href="structcutlass_1_1Coord.html">Coord<3></a> <span class="keyword">const</span> &offset) {</div><div class="line"><a name="l00221"></a><span class="lineno"> 221</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a5ef4cc42c7cec73523550e5ea56df88c">load_iterator</a> += offset;</div><div class="line"><a name="l00222"></a><span class="lineno"> 222</span>  <span class="keywordflow">return</span> *<span 
class="keyword">this</span>;</div><div class="line"><a name="l00223"></a><span class="lineno"> 223</span>  }</div><div class="line"><a name="l00224"></a><span class="lineno"> 224</span> </div><div class="line"><a name="l00226"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#aed33be079f056998624015460b4e3836"> 226</a></span>  CUTLASS_DEVICE <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html">GlobalLoadStream</a> &<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#aed33be079f056998624015460b4e3836">add_batch_offset</a>(<span class="keywordtype">int</span> batch_id) {</div><div class="line"><a name="l00227"></a><span class="lineno"> 227</span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a5ef4cc42c7cec73523550e5ea56df88c">load_iterator</a>.add_pointer_offset(batch_id * <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac8ff1a3e10b25c212cd3cf5ed997fc0e">params</a>.<a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#ab5d9e5de9b1cc3462920ce7a8f52bbec">batch_stride</a>);</div><div class="line"><a name="l00228"></a><span class="lineno"> 228</span>  <span class="keywordflow">return</span> *<span class="keyword">this</span>;</div><div class="line"><a name="l00229"></a><span class="lineno"> 229</span>  }</div><div class="line"><a name="l00230"></a><span class="lineno"> 230</span> </div><div class="line"><a name="l00231"></a><span class="lineno"> 231</span>  <span class="comment">//</span></div><div class="line"><a name="l00232"></a><span class="lineno"> 232</span>  <span class="comment">// Data members</span></div><div class="line"><a name="l00233"></a><span class="lineno"> 233</span>  <span class="comment">//</span></div><div class="line"><a name="l00234"></a><span class="lineno"> 234</span> </div><div class="line"><a name="l00236"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac8ff1a3e10b25c212cd3cf5ed997fc0e"> 236</a></span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html">Params</a> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac8ff1a3e10b25c212cd3cf5ed997fc0e">params</a>;</div><div class="line"><a name="l00238"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a563961c326d2e55f5b8682a30b64a24a"> 238</a></span>  <a class="code" href="structcutlass_1_1Coord.html">Coord<3></a> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a563961c326d2e55f5b8682a30b64a24a">threadblock_offset</a>;</div><div class="line"><a name="l00240"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a386f2f4d2e239075f0fe1489ed7788c1"> 240</a></span>  <a class="code" href="structcutlass_1_1Coord.html">Coord<3></a> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a386f2f4d2e239075f0fe1489ed7788c1">multiplicand_bounds</a>;</div><div class="line"><a name="l00242"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a5ef4cc42c7cec73523550e5ea56df88c"> 242</a></span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a905c219287a7342b2ddb58b84e413d64">LoadIterator</a> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a5ef4cc42c7cec73523550e5ea56df88c">load_iterator</a>;</div><div class="line"><a name="l00244"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a1c117b87024937f1dc3da128795b6e03"> 244</a></span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7d9b4339129c1ab4f21f1df1144faddf">FetchedFragment</a> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a1c117b87024937f1dc3da128795b6e03">fetched_fragment</a>;</div><div class="line"><a name="l00246"></a><span 
class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ab68ba57fe69430c557379b3457faebc4"> 246</a></span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#aa79a27cbe2420882fbaca55e42803f02">Transformer</a> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ab68ba57fe69430c557379b3457faebc4">transformer</a>;</div><div class="line"><a name="l00248"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7d7042e60aaab0dd00772b239e1f1db1"> 248</a></span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a9eb2fb49698d0d018c04e7712e239ce9">TransformedFragment</a> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7d7042e60aaab0dd00772b239e1f1db1">transformed_fragment</a>;</div><div class="line"><a name="l00250"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a45a4bceb72fcb856e32eaa20eec11e9d"> 250</a></span>  <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac16e31930c346068d7522dd8de9d93d2">StoreIterator</a> <a class="code" href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a45a4bceb72fcb856e32eaa20eec11e9d">store_iterator</a>;</div><div class="line"><a name="l00251"></a><span class="lineno"> 251</span> };</div><div class="line"><a name="l00252"></a><span class="lineno"> 252</span> </div><div class="line"><a name="l00254"></a><span class="lineno"> 254</span> } <span class="comment">// namespace gemm</span></div><div class="line"><a name="l00255"></a><span class="lineno"> 255</span> } <span class="comment">// namespace cutlass</span></div><div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a011287c8289b7b026f9993da663abd77"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a011287c8289b7b026f9993da663abd77">cutlass::gemm::GlobalLoadStream::ThreadblockTileRef</a></div><div class="ttdeci">ThreadblockTileStorage::TensorRef 
ThreadblockTileRef</div><div class="ttdoc">Tensor reference to threadblock tile. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:93</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_ac4452df991f57f9bb0b86dfd380179b2"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac4452df991f57f9bb0b86dfd380179b2">cutlass::gemm::GlobalLoadStream::Pointer</a></div><div class="ttdeci">LoadIterator::Pointer Pointer</div><div class="ttdoc">The pointer. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:80</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a5ef4cc42c7cec73523550e5ea56df88c"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a5ef4cc42c7cec73523550e5ea56df88c">cutlass::gemm::GlobalLoadStream::load_iterator</a></div><div class="ttdeci">LoadIterator load_iterator</div><div class="ttdoc">The iterator. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:242</div></div>
|
|
<div class="ttc" id="namespacecutlass_html"><div class="ttname"><a href="namespacecutlass.html">cutlass</a></div><div class="ttdef"><b>Definition:</b> convert.h:33</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a16542631e4a4562cc72aa50f146a9724"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a16542631e4a4562cc72aa50f146a9724">cutlass::gemm::GlobalLoadStream::project_coordinate</a></div><div class="ttdeci">static CUTLASS_HOST_DEVICE Coord&lt; 3 &gt; project_coordinate(Coord&lt; 3 &gt; const &amp;coord, Index d_offset=0)</div><div class="ttdoc">Maps a coordinate in the GEMM&#39;s (K, N, M) coordinate system to global memory. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:151</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a45a4bceb72fcb856e32eaa20eec11e9d"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a45a4bceb72fcb856e32eaa20eec11e9d">cutlass::gemm::GlobalLoadStream::store_iterator</a></div><div class="ttdeci">StoreIterator store_iterator</div><div class="ttdoc">The store iterator. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:250</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_ac8ff1a3e10b25c212cd3cf5ed997fc0e"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac8ff1a3e10b25c212cd3cf5ed997fc0e">cutlass::gemm::GlobalLoadStream::params</a></div><div class="ttdeci">Params params</div><div class="ttdoc">Parameters. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:236</div></div>
|
|
<div class="ttc" id="gemm__global__tile_8h_html"><div class="ttname"><a href="gemm__global__tile_8h.html">gemm_global_tile.h</a></div><div class="ttdoc">Defines iterators for efficiently loading and storing to global memory. </div></div>
|
|
<div class="ttc" id="structcutlass_1_1platform_1_1is__same_html"><div class="ttname"><a href="structcutlass_1_1platform_1_1is__same.html">cutlass::platform::is_same</a></div><div class="ttdoc">std::is_same (false specialization) </div><div class="ttdef"><b>Definition:</b> platform.h:420</div></div>
|
|
<div class="ttc" id="structcutlass_1_1TileAllocation_html_aa0bf6caeab13dc004350c6c0cfe0df80"><div class="ttname"><a href="structcutlass_1_1TileAllocation.html#aa0bf6caeab13dc004350c6c0cfe0df80">cutlass::TileAllocation::TensorRef</a></div><div class="ttdeci">TensorRef< Scalar, 4 > TensorRef</div><div class="ttdoc">Defines the tensor reference for this allocation. </div><div class="ttdef"><b>Definition:</b> tile_allocation.h:63</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a30113b850dfd3de60f8778bc7a66f700"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a30113b850dfd3de60f8778bc7a66f700">cutlass::gemm::GlobalLoadStream::kOperand</a></div><div class="ttdeci">static GemmOperand::Kind const kOperand</div><div class="ttdoc">Indicates the type of GEMM operand. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:54</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a8e79a153de72eef10d90bfd02b5dd27e"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a8e79a153de72eef10d90bfd02b5dd27e">cutlass::gemm::GlobalLoadStream::operator+=</a></div><div class="ttdeci">CUTLASS_DEVICE GlobalLoadStream &amp; operator+=(Coord&lt; 3 &gt; const &amp;offset)</div><div class="ttdoc">Adds a Coord&lt;3&gt; to the underlying global load iterator. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:220</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a3784dbb3efe0865ffa946419111c824a"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a3784dbb3efe0865ffa946419111c824a">cutlass::gemm::GlobalLoadStream::copy</a></div><div class="ttdeci">CUTLASS_DEVICE void copy()</div><div class="ttdoc">Load the data from global memory into the fetched fragment. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:178</div></div>
|
|
<div class="ttc" id="coord_8h_html"><div class="ttname"><a href="coord_8h.html">coord.h</a></div><div class="ttdoc">A Coord is a coordinate of arbitrary rank into a tensor or matrix. </div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a386f2f4d2e239075f0fe1489ed7788c1"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a386f2f4d2e239075f0fe1489ed7788c1">cutlass::gemm::GlobalLoadStream::multiplicand_bounds</a></div><div class="ttdeci">Coord< 3 > multiplicand_bounds</div><div class="ttdoc">Multiplicand bounds. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:240</div></div>
|
|
<div class="ttc" id="namespacecutlass_html_a7419519fa453a121dfa5f26bf87318d9"><div class="ttname"><a href="namespacecutlass.html#a7419519fa453a121dfa5f26bf87318d9">cutlass::make_Coord</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE Coord< 1 > make_Coord(int _0)</div><div class="ttdoc">Helper to make a 1-element coordinate. </div><div class="ttdef"><b>Definition:</b> coord.h:368</div></div>
|
|
<div class="ttc" id="namespacecutlass_1_1MatrixLayout_html_a97ef07af21b122c1804245b0c7784d2b"><div class="ttname"><a href="namespacecutlass_1_1MatrixLayout.html#a97ef07af21b122c1804245b0c7784d2b">cutlass::MatrixLayout::Kind</a></div><div class="ttdeci">Kind</div><div class="ttdoc">Enumeration defining fundamental contiguous layouts. </div><div class="ttdef"><b>Definition:</b> matrix_traits.h:159</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_ac29cd1ba94e802762d665c300e22e7db"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac29cd1ba94e802762d665c300e22e7db">cutlass::gemm::GlobalLoadStream::kLayout</a></div><div class="ttdeci">static MatrixLayout::Kind const kLayout</div><div class="ttdoc">The matrix layout of the operand. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:76</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params_html_a289ac736c0c098ae6da6a21c9abfe63f"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a289ac736c0c098ae6da6a21c9abfe63f">cutlass::gemm::GlobalLoadStream::Params::store_iterator</a></div><div class="ttdeci">StoreIterator::Params store_iterator</div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:104</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_ae033a49a784964e75a5c1b6135b21e47"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ae033a49a784964e75a5c1b6135b21e47">cutlass::gemm::GlobalLoadStream::LongIndex</a></div><div class="ttdeci">LoadIterator::LongIndex LongIndex</div><div class="ttdoc">The index. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:84</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a1c117b87024937f1dc3da128795b6e03"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a1c117b87024937f1dc3da128795b6e03">cutlass::gemm::GlobalLoadStream::fetched_fragment</a></div><div class="ttdeci">FetchedFragment fetched_fragment</div><div class="ttdoc">The fragment fetched from global memory. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:244</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params_html_aeb306cd3cb97471774b425fb50a861ae"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#aeb306cd3cb97471774b425fb50a861ae">cutlass::gemm::GlobalLoadStream::Params::initialize</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE int initialize(Pointer pointer, LongIndex batch_stride_, Index ldm, Index offset_to_residue_, Index offset_to_residue_last_partition_)</div><div class="ttdoc">Setup the params. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:113</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html">cutlass::gemm::GlobalLoadStream</a></div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:52</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1SharedStorage_html"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1SharedStorage.html">cutlass::gemm::GlobalLoadStream::SharedStorage</a></div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:144</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a7073b32c2cc62ffcad70a9ca46995c4c"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7073b32c2cc62ffcad70a9ca46995c4c">cutlass::gemm::GlobalLoadStream::Scalar</a></div><div class="ttdeci">LoadIterator::Scalar Scalar</div><div class="ttdoc">The scalar type of the iterator. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:78</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a235adaea5d4f01232c79cb6109dc6d17"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a235adaea5d4f01232c79cb6109dc6d17">cutlass::gemm::GlobalLoadStream::residue</a></div><div class="ttdeci">CUTLASS_DEVICE void residue(Index k, bool skip_clear=false)</div><div class="ttdoc">Execute the residue code. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:190</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a7d7042e60aaab0dd00772b239e1f1db1"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7d7042e60aaab0dd00772b239e1f1db1">cutlass::gemm::GlobalLoadStream::transformed_fragment</a></div><div class="ttdeci">TransformedFragment transformed_fragment</div><div class="ttdoc">The fragment to convert the data after it has been fetched from global memory. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:248</div></div>
|
|
<div class="ttc" id="tile__allocation_8h_html"><div class="ttname"><a href="tile__allocation_8h.html">tile_allocation.h</a></div><div class="ttdoc">Defines a fragment based on a Shape<> template. </div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params_html_a73bb518f85aee62310b3c886a1fba3f1"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a73bb518f85aee62310b3c886a1fba3f1">cutlass::gemm::GlobalLoadStream::Params::offset_to_residue</a></div><div class="ttdeci">Index offset_to_residue</div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:107</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_ab7e315253b3301c191581bce05644106"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ab7e315253b3301c191581bce05644106">cutlass::gemm::GlobalLoadStream::Fragment</a></div><div class="ttdeci">TransformedFragment Fragment</div><div class="ttdoc">The fragment type of the stream (alias of TransformedFragment). </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:68</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_aed33be079f056998624015460b4e3836"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#aed33be079f056998624015460b4e3836">cutlass::gemm::GlobalLoadStream::add_batch_offset</a></div><div class="ttdeci">CUTLASS_DEVICE GlobalLoadStream & add_batch_offset(int batch_id)</div><div class="ttdoc">Adds an offset based on batch stride. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:226</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a905c219287a7342b2ddb58b84e413d64"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a905c219287a7342b2ddb58b84e413d64">cutlass::gemm::GlobalLoadStream::LoadIterator</a></div><div class="ttdeci">LoadIterator_ LoadIterator</div><div class="ttdoc">The load iterator. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:56</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GemmMultiplicandTraits_html"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GemmMultiplicandTraits.html">cutlass::gemm::GemmMultiplicandTraits</a></div><div class="ttdef"><b>Definition:</b> gemm_operand.h:67</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params_html_a7cad4eeadacc7efbfe9d2442997eeb82"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a7cad4eeadacc7efbfe9d2442997eeb82">cutlass::gemm::GlobalLoadStream::Params::offset_to_residue_last_partition</a></div><div class="ttdeci">Index offset_to_residue_last_partition</div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:110</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_ab39c82ac1a8138c4b6d69dab9d48bdbc"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ab39c82ac1a8138c4b6d69dab9d48bdbc">cutlass::gemm::GlobalLoadStream::commit</a></div><div class="ttdeci">CUTLASS_DEVICE void commit()</div><div class="ttdoc">Commit the data. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:183</div></div>
|
|
<div class="ttc" id="cutlass_8h_html_a28c2443a142676d3d71effdae1a986b1"><div class="ttname"><a href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="ttdeci">#define CUTLASS_HOST_DEVICE</div><div class="ttdef"><b>Definition:</b> cutlass.h:46</div></div>
|
|
<div class="ttc" id="structcutlass_1_1TileAllocation_html"><div class="ttname"><a href="structcutlass_1_1TileAllocation.html">cutlass::TileAllocation</a></div><div class="ttdoc">Class for storing a tile in memory and accessing it through a tensor ref. </div><div class="ttdef"><b>Definition:</b> tile_allocation.h:42</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_ab68ba57fe69430c557379b3457faebc4"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ab68ba57fe69430c557379b3457faebc4">cutlass::gemm::GlobalLoadStream::transformer</a></div><div class="ttdeci">Transformer transformer</div><div class="ttdoc">The transformer. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:246</div></div>
|
|
<div class="ttc" id="platform_8h_html_adde4c9ea91b753491851361a4198c009"><div class="ttname"><a href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a></div><div class="ttdeci">#define static_assert(__e, __m)</div><div class="ttdef"><b>Definition:</b> platform.h:153</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params_html_ab5d9e5de9b1cc3462920ce7a8f52bbec"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#ab5d9e5de9b1cc3462920ce7a8f52bbec">cutlass::gemm::GlobalLoadStream::Params::batch_stride</a></div><div class="ttdeci">LongIndex batch_stride</div><div class="ttdoc">Batch stride in global memory. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:101</div></div>
|
|
<div class="ttc" id="namespacecutlass_1_1MatrixLayout_html_a97ef07af21b122c1804245b0c7784d2bac15988acba79c11072d38b295f163a2b"><div class="ttname"><a href="namespacecutlass_1_1MatrixLayout.html#a97ef07af21b122c1804245b0c7784d2bac15988acba79c11072d38b295f163a2b">cutlass::MatrixLayout::kColumnMajor</a></div><div class="ttdef"><b>Definition:</b> matrix_traits.h:159</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1ProjectOperand_html"><div class="ttname"><a href="structcutlass_1_1gemm_1_1ProjectOperand.html">cutlass::gemm::ProjectOperand</a></div><div class="ttdef"><b>Definition:</b> gemm_operand.h:96</div></div>
|
|
<div class="ttc" id="structcutlass_1_1Coord_html"><div class="ttname"><a href="structcutlass_1_1Coord.html">cutlass::Coord&lt; 3 &gt;</a></div></div>
|
|
<div class="ttc" id="namespacecutlass_1_1MatrixLayout_html_a97ef07af21b122c1804245b0c7784d2ba6a287c17f9f5bf53528ae68296beeedb"><div class="ttname"><a href="namespacecutlass_1_1MatrixLayout.html#a97ef07af21b122c1804245b0c7784d2ba6a287c17f9f5bf53528ae68296beeedb">cutlass::MatrixLayout::kRowMajor</a></div><div class="ttdef"><b>Definition:</b> matrix_traits.h:159</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_ac16e31930c346068d7522dd8de9d93d2"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac16e31930c346068d7522dd8de9d93d2">cutlass::gemm::GlobalLoadStream::StoreIterator</a></div><div class="ttdeci">StoreIterator_ StoreIterator</div><div class="ttdoc">The store iterator to write to shared memory. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:60</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a17804b01904a9a4ee7a857905833f7a8"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a17804b01904a9a4ee7a857905833f7a8">cutlass::gemm::GlobalLoadStream::ThreadblockTileStorage</a></div><div class="ttdeci">TileAllocation&lt; typename StoreIterator::Scalar, typename StoreIterator::Tile &gt; ThreadblockTileStorage</div><div class="ttdoc">Shared memory allocation for the tile. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:90</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params_html_a46f2546f9b88f4fc87f1396d0f08b065"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a46f2546f9b88f4fc87f1396d0f08b065">cutlass::gemm::GlobalLoadStream::Params::load_iterator</a></div><div class="ttdeci">LoadIterator::Params load_iterator</div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:98</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params_html"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html">cutlass::gemm::GlobalLoadStream::Params</a></div><div class="ttdoc">The params. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:96</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_aa79a27cbe2420882fbaca55e42803f02"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#aa79a27cbe2420882fbaca55e42803f02">cutlass::gemm::GlobalLoadStream::Transformer</a></div><div class="ttdeci">Transformer_ Transformer</div><div class="ttdoc">The transformer. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:58</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a563961c326d2e55f5b8682a30b64a24a"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a563961c326d2e55f5b8682a30b64a24a">cutlass::gemm::GlobalLoadStream::threadblock_offset</a></div><div class="ttdeci">Coord&lt; 3 &gt; threadblock_offset</div><div class="ttdoc">Threadblock offset. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:238</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a7c46d6eb83b43e099d53784bb2a09f02"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7c46d6eb83b43e099d53784bb2a09f02">cutlass::gemm::GlobalLoadStream::Index</a></div><div class="ttdeci">LoadIterator::Index Index</div><div class="ttdoc">The index. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:82</div></div>
|
|
<div class="ttc" id="structcutlass_1_1GemmOperand_html_ab209ea3de198efabe8e8707dfe8e0a0c"><div class="ttname"><a href="structcutlass_1_1GemmOperand.html#ab209ea3de198efabe8e8707dfe8e0a0c">cutlass::GemmOperand::Kind</a></div><div class="ttdeci">Kind</div><div class="ttdef"><b>Definition:</b> matrix_traits.h:357</div></div>
|
|
<div class="ttc" id="structcutlass_1_1GemmOperand_html_ab209ea3de198efabe8e8707dfe8e0a0cac2b9fe9e3679a059d1a6c946b2a2c31a"><div class="ttname"><a href="structcutlass_1_1GemmOperand.html#ab209ea3de198efabe8e8707dfe8e0a0cac2b9fe9e3679a059d1a6c946b2a2c31a">cutlass::GemmOperand::kA</a></div><div class="ttdef"><b>Definition:</b> matrix_traits.h:357</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_ac269a9280a55d3988ca60f571bdf7f29"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#ac269a9280a55d3988ca60f571bdf7f29">cutlass::gemm::GlobalLoadStream::move_to_residue</a></div><div class="ttdeci">CUTLASS_DEVICE void move_to_residue(Index k, Index kTileK)</div><div class="ttdoc">Move to the residue portion. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:198</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a7d9b4339129c1ab4f21f1df1144faddf"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a7d9b4339129c1ab4f21f1df1144faddf">cutlass::gemm::GlobalLoadStream::FetchedFragment</a></div><div class="ttdeci">LoadIterator::Fragment FetchedFragment</div><div class="ttdoc">The fragment that is copied from shared memory. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:63</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a9eb2fb49698d0d018c04e7712e239ce9"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a9eb2fb49698d0d018c04e7712e239ce9">cutlass::gemm::GlobalLoadStream::TransformedFragment</a></div><div class="ttdeci">Transformer::OutputFragment TransformedFragment</div><div class="ttdoc">The fragment that is obtained after the transformation by the transformer. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:65</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_aec86bdf5d7d4ad1f7b6ebebcf2da8395"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#aec86bdf5d7d4ad1f7b6ebebcf2da8395">cutlass::gemm::GlobalLoadStream::GlobalLoadStream</a></div><div class="ttdeci">CUTLASS_DEVICE GlobalLoadStream(Params const &amp;_params, SharedStorage &amp;shared_storage, ThreadblockTileRef const &amp;threadblock_tile_ref, Coord&lt; 3 &gt; const bounds, Coord&lt; 3 &gt; const &amp;_threadblock_offset)</div><div class="ttdoc">Ctor. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:160</div></div>
|
|
<div class="ttc" id="convert_8h_html"><div class="ttname"><a href="convert_8h.html">convert.h</a></div><div class="ttdoc">Defines conversion operations among Fragments of different base type. </div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params_html_a9c0707b48565a522884cbd077aa299ee"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream_1_1Params.html#a9c0707b48565a522884cbd077aa299ee">cutlass::gemm::GlobalLoadStream::Params::get_offset_to_residue</a></div><div class="ttdeci">CUTLASS_DEVICE Index get_offset_to_residue()</div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:131</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a260543a618fb187c2da40c9f630925ec"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a260543a618fb187c2da40c9f630925ec">cutlass::gemm::GlobalLoadStream::Tile</a></div><div class="ttdeci">LoadIterator::Tile Tile</div><div class="ttdoc">The tile. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:86</div></div>
|
|
<div class="ttc" id="structcutlass_1_1gemm_1_1GlobalLoadStream_html_a1e2eecdba1871fc11aa43a06edf6ed34"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GlobalLoadStream.html#a1e2eecdba1871fc11aa43a06edf6ed34">cutlass::gemm::GlobalLoadStream::rollback</a></div><div class="ttdeci">CUTLASS_DEVICE void rollback(void)</div><div class="ttdoc">Rollback to the beginning of the first tile. </div><div class="ttdef"><b>Definition:</b> gemm_global_stream.h:208</div></div>
|
|
</div><!-- fragment --></div><!-- contents -->
|
|
<!-- start footer part -->
|
|
<hr class="footer"/><address class="footer"><small>
|
|
Generated on Fri Oct 26 2018 14:53:33 for Cutlass by &#160;<a href="https://www.doxygen.org/index.html">
|
|
<img class="footer" src="doxygen.png" alt="doxygen"/>
|
|
</a> 1.8.14
|
|
</small></address>
|
|
</body>
|
|
</html>
|