<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
<meta http-equiv="Content-Type" content="text/xhtml;charset=UTF-8"/>
<meta http-equiv="X-UA-Compatible" content="IE=9"/>
<meta name="generator" content="Doxygen 1.8.11"/>
<title>CUTLASS: regular_tile_access_iterator_tensor_op.h Source File</title>
<link href="tabs.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="jquery.js"></script>
<script type="text/javascript" src="dynsections.js"></script>
<link href="search/search.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="search/searchdata.js"></script>
<script type="text/javascript" src="search/search.js"></script>
<script type="text/javascript">
  $(document).ready(function() { init_search(); });
</script>
<script type="text/x-mathjax-config">
  MathJax.Hub.Config({
    extensions: ["tex2jax.js"],
    jax: ["input/TeX","output/HTML-CSS"],
});
</script><script type="text/javascript" src="http://cdn.mathjax.org/mathjax/latest/MathJax.js"></script>
<link href="doxygen.css" rel="stylesheet" type="text/css" />
</head>
<body>
<div id="top"><!-- do not remove this div, it is closed by doxygen! -->
<div id="titlearea">
<table cellspacing="0" cellpadding="0">
 <tbody>
 <tr style="height: 56px;">
  <td id="projectlogo"><img alt="Logo" src="cutlass-logo-small.png"/></td>
  <td id="projectalign" style="padding-left: 0.5em;">
   <div id="projectname">CUTLASS
   </div>
   <div id="projectbrief">CUDA Templates for Linear Algebra Subroutines and Solvers</div>
  </td>
 </tr>
 </tbody>
</table>
</div>
<!-- end header part -->
<!-- Generated by Doxygen 1.8.11 -->
<script type="text/javascript">
var searchBox = new SearchBox("searchBox", "search",false,'Search');
</script>
  <div id="navrow1" class="tabs">
    <ul class="tablist">
      <li><a href="index.html"><span>Main&#160;Page</span></a></li>
      <li><a href="modules.html"><span>Modules</span></a></li>
      <li><a href="namespaces.html"><span>Namespaces</span></a></li>
      <li><a href="annotated.html"><span>Classes</span></a></li>
      <li class="current"><a href="files.html"><span>Files</span></a></li>
      <li>
        <div id="MSearchBox" class="MSearchBoxInactive">
        <span class="left">
          <img id="MSearchSelect" src="search/mag_sel.png"
               onmouseover="return searchBox.OnSearchSelectShow()"
               onmouseout="return searchBox.OnSearchSelectHide()"
               alt=""/>
          <input type="text" id="MSearchField" value="Search" accesskey="S"
               onfocus="searchBox.OnSearchFieldFocus(true)" 
               onblur="searchBox.OnSearchFieldFocus(false)" 
               onkeyup="searchBox.OnSearchFieldChange(event)"/>
          </span><span class="right">
            <a id="MSearchClose" href="javascript:searchBox.CloseResultsWindow()"><img id="MSearchCloseImg" border="0" src="search/close.png" alt=""/></a>
          </span>
        </div>
      </li>
    </ul>
  </div>
  <div id="navrow2" class="tabs2">
    <ul class="tablist">
      <li><a href="files.html"><span>File&#160;List</span></a></li>
      <li><a href="globals.html"><span>File&#160;Members</span></a></li>
    </ul>
  </div>
<!-- window showing the filter options -->
<div id="MSearchSelectWindow"
     onmouseover="return searchBox.OnSearchSelectShow()"
     onmouseout="return searchBox.OnSearchSelectHide()"
     onkeydown="return searchBox.OnSearchSelectKey(event)">
</div>

<!-- iframe showing the search results (closed by default) -->
<div id="MSearchResultsWindow">
<iframe src="javascript:void(0)" frameborder="0" 
        name="MSearchResults" id="MSearchResults">
</iframe>
</div>

<div id="nav-path" class="navpath">
  <ul>
<li class="navelem"><a class="el" href="dir_d44c64559bbebec7f509842c48db8b23.html">include</a></li><li class="navelem"><a class="el" href="dir_6baf2bb612a2f0daa69af3101ede80a1.html">cutlass</a></li><li class="navelem"><a class="el" href="dir_568e97a0eb81cc0d3daf98cef30c9135.html">transform</a></li><li class="navelem"><a class="el" href="dir_5a68e39c181f2defa4dd959f7500739b.html">threadblock</a></li>  </ul>
</div>
</div><!-- top -->
<div class="header">
  <div class="headertitle">
<div class="title">regular_tile_access_iterator_tensor_op.h</div>  </div>
</div><!--header-->
<div class="contents">
<a href="regular__tile__access__iterator__tensor__op_8h.html">Go to the documentation of this file.</a><div class="fragment"><div class="line"><a name="l00001"></a><span class="lineno">    1</span>&#160;<span class="comment">/***************************************************************************************************</span></div><div class="line"><a name="l00002"></a><span class="lineno">    2</span>&#160;<span class="comment"> * Copyright (c) 2017-2019, NVIDIA CORPORATION.  All rights reserved.</span></div><div class="line"><a name="l00003"></a><span class="lineno">    3</span>&#160;<span class="comment"> *</span></div><div class="line"><a name="l00004"></a><span class="lineno">    4</span>&#160;<span class="comment"> * Redistribution and use in source and binary forms, with or without modification, are permitted</span></div><div class="line"><a name="l00005"></a><span class="lineno">    5</span>&#160;<span class="comment"> * provided that the following conditions are met:</span></div><div class="line"><a name="l00006"></a><span class="lineno">    6</span>&#160;<span class="comment"> *     * Redistributions of source code must retain the above copyright notice, this list of</span></div><div class="line"><a name="l00007"></a><span class="lineno">    7</span>&#160;<span class="comment"> *       conditions and the following disclaimer.</span></div><div class="line"><a name="l00008"></a><span class="lineno">    8</span>&#160;<span class="comment"> *     * Redistributions in binary form must reproduce the above copyright notice, this list of</span></div><div class="line"><a name="l00009"></a><span class="lineno">    9</span>&#160;<span class="comment"> *       conditions and the following disclaimer in the documentation and/or other materials</span></div><div class="line"><a name="l00010"></a><span class="lineno">   10</span>&#160;<span class="comment"> *       provided with the distribution.</span></div><div class="line"><a name="l00011"></a><span class="lineno">   11</span>&#160;<span class="comment"> *     * Neither the name of the NVIDIA CORPORATION nor the names of its contributors may be used</span></div><div class="line"><a name="l00012"></a><span class="lineno">   12</span>&#160;<span class="comment"> *       to endorse or promote products derived from this software without specific prior written</span></div><div class="line"><a name="l00013"></a><span class="lineno">   13</span>&#160;<span class="comment"> *       permission.</span></div><div class="line"><a name="l00014"></a><span class="lineno">   14</span>&#160;<span class="comment"> *</span></div><div class="line"><a name="l00015"></a><span class="lineno">   15</span>&#160;<span class="comment"> * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS &quot;AS IS&quot; AND ANY EXPRESS OR</span></div><div class="line"><a name="l00016"></a><span class="lineno">   16</span>&#160;<span class="comment"> * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND</span></div><div class="line"><a name="l00017"></a><span class="lineno">   17</span>&#160;<span class="comment"> * FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE</span></div><div class="line"><a name="l00018"></a><span class="lineno">   18</span>&#160;<span class="comment"> * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,</span></div><div class="line"><a name="l00019"></a><span class="lineno">   19</span>&#160;<span class="comment"> * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;</span></div><div class="line"><a name="l00020"></a><span class="lineno">   20</span>&#160;<span class="comment"> * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,</span></div><div class="line"><a name="l00021"></a><span class="lineno">   21</span>&#160;<span class="comment"> * STRICT LIABILITY, OR TOR (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE</span></div><div class="line"><a name="l00022"></a><span class="lineno">   22</span>&#160;<span class="comment"> * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.</span></div><div class="line"><a name="l00023"></a><span class="lineno">   23</span>&#160;<span class="comment"> *</span></div><div class="line"><a name="l00024"></a><span class="lineno">   24</span>&#160;<span class="comment"> **************************************************************************************************/</span></div><div class="line"><a name="l00030"></a><span class="lineno">   30</span>&#160;<span class="preprocessor">#pragma once</span></div><div class="line"><a name="l00031"></a><span class="lineno">   31</span>&#160;</div><div class="line"><a name="l00032"></a><span class="lineno">   32</span>&#160;<span class="preprocessor">#include &quot;<a class="code" href="array_8h.html">cutlass/array.h</a>&quot;</span></div><div class="line"><a name="l00033"></a><span class="lineno">   33</span>&#160;<span class="preprocessor">#include &quot;<a class="code" href="cutlass_8h.html">cutlass/cutlass.h</a>&quot;</span></div><div class="line"><a name="l00034"></a><span class="lineno">   34</span>&#160;<span class="preprocessor">#include &quot;<a class="code" href="pitch__linear_8h.html">cutlass/layout/pitch_linear.h</a>&quot;</span></div><div class="line"><a name="l00035"></a><span class="lineno">   35</span>&#160;<span class="preprocessor">#include &quot;<a class="code" href="tensor__op__multiplicand__sm75_8h.html">cutlass/layout/tensor_op_multiplicand_sm75.h</a>&quot;</span></div><div class="line"><a name="l00036"></a><span class="lineno">   36</span>&#160;<span class="preprocessor">#include &quot;<a class="code" href="matrix__coord_8h.html">cutlass/matrix_coord.h</a>&quot;</span></div><div class="line"><a name="l00037"></a><span class="lineno">   37</span>&#160;<span class="preprocessor">#include &quot;<a class="code" href="matrix__shape_8h.html">cutlass/matrix_shape.h</a>&quot;</span></div><div class="line"><a name="l00038"></a><span class="lineno">   38</span>&#160;<span class="preprocessor">#include &quot;<a class="code" href="tensor__ref_8h.html">cutlass/tensor_ref.h</a>&quot;</span></div><div class="line"><a name="l00039"></a><span class="lineno">   39</span>&#160;<span class="preprocessor">#include &quot;<a class="code" href="regular__tile__access__iterator_8h.html">cutlass/transform/threadblock/regular_tile_access_iterator.h</a>&quot;</span></div><div class="line"><a name="l00040"></a><span class="lineno">   40</span>&#160;</div><div class="line"><a name="l00042"></a><span class="lineno">   42</span>&#160;</div><div class="line"><a name="l00043"></a><span class="lineno">   43</span>&#160;<span class="keyword">namespace </span><a class="code" href="namespacecutlass.html">cutlass</a> {</div><div class="line"><a name="l00044"></a><span class="lineno">   44</span>&#160;<span class="keyword">namespace </span>transform {</div><div class="line"><a name="l00045"></a><span class="lineno">   45</span>&#160;<span class="keyword">namespace </span>threadblock {</div><div class="line"><a name="l00046"></a><span class="lineno">   46</span>&#160;</div><div class="line"><a name="l00048"></a><span class="lineno">   48</span>&#160;</div><div class="line"><a name="l00056"></a><span class="lineno">   56</span>&#160;<span class="keyword">template</span> &lt;<span class="keyword">typename</span> Shape_, <span class="keyword">typename</span> Element_, <span class="keywordtype">int</span> AdvanceRank,</div><div class="line"><a name="l00057"></a><span class="lineno">   57</span>&#160;          <span class="keyword">typename</span> ThreadMap_, <span class="keywordtype">int</span> Alignment&gt;</div><div class="line"><a name="l00058"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html">   58</a></span>&#160;<span class="keyword">class </span><a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a>&lt;</div><div class="line"><a name="l00059"></a><span class="lineno">   59</span>&#160;    Shape_, Element_,</div><div class="line"><a name="l00060"></a><span class="lineno">   60</span>&#160;    layout::TensorOpMultiplicandCongruous&lt;sizeof_bits&lt;Element_&gt;::value,</div><div class="line"><a name="l00061"></a><span class="lineno">   61</span>&#160;                                          int(128 / sizeof(Element_))&gt;,</div><div class="line"><a name="l00062"></a><span class="lineno">   62</span>&#160;    AdvanceRank, ThreadMap_, Alignment&gt; {</div><div class="line"><a name="l00063"></a><span class="lineno">   63</span>&#160; <span class="keyword">public</span>:</div><div class="line"><a name="l00064"></a><span class="lineno">   64</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(</div><div class="line"><a name="l00065"></a><span class="lineno">   65</span>&#160;      AdvanceRank == 0 || AdvanceRank == 1,</div><div class="line"><a name="l00066"></a><span class="lineno">   66</span>&#160;      <span class="stringliteral">&quot;Specialization for pitch-linear iterator may along advance along the &quot;</span></div><div class="line"><a name="l00067"></a><span class="lineno">   67</span>&#160;      <span class="stringliteral">&quot;contiguous(rank=0) or strided(rank=1) dimension.&quot;</span>);</div><div class="line"><a name="l00068"></a><span class="lineno">   68</span>&#160;</div><div class="line"><a name="l00069"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#ad7506791dac3532d745c1d268e7c77f5">   69</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#ad7506791dac3532d745c1d268e7c77f5">Shape</a> = Shape_;</div><div class="line"><a name="l00070"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a6b2bd7c503e292cdcfa6c18c77cd7baa">   70</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a6b2bd7c503e292cdcfa6c18c77cd7baa">Element</a> = Element_;</div><div class="line"><a name="l00071"></a><span class="lineno">   71</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1layout_1_1TensorOpMultiplicandCongruous.html">Layout</a> =</div><div class="line"><a name="l00072"></a><span class="lineno">   72</span>&#160;      <a class="code" href="structcutlass_1_1layout_1_1TensorOpMultiplicandCongruous.html">layout::TensorOpMultiplicandCongruous&lt;sizeof_bits&lt;Element_&gt;::value</a>,</div><div class="line"><a name="l00073"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#ab7cfff85a366f0132c3f242e88a7570a">   73</a></span>&#160;                                            int(128 / <span class="keyword">sizeof</span>(Element_))&gt;;</div><div class="line"><a name="l00074"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a9c2871152eb66979098cff0676b00bbd">   74</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kAdvanceRank = AdvanceRank;</div><div class="line"><a name="l00075"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a87bfae407dbf0fc94e4a846ccebf7073">   75</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kAlignment = Alignment;</div><div class="line"><a name="l00076"></a><span class="lineno">   76</span>&#160;</div><div class="line"><a name="l00077"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a636e7123ac8169f41d47e071e460fb81">   77</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a636e7123ac8169f41d47e071e460fb81">Index</a> = <span class="keyword">typename</span> <a class="code" href="structcutlass_1_1layout_1_1TensorOpMultiplicandCongruous.html#ab498476001a090017735113863e28898">Layout::Index</a>;</div><div class="line"><a name="l00078"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a4051bd65d1bf0b1b127bf46ad2044b83">   78</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a4051bd65d1bf0b1b127bf46ad2044b83">LongIndex</a> = <span class="keyword">typename</span> <a class="code" href="structcutlass_1_1layout_1_1TensorOpMultiplicandCongruous.html#aa04ef0da8d8a859c2b7bb08cb3752d3d">Layout::LongIndex</a>;</div><div class="line"><a name="l00079"></a><span class="lineno">   79</span>&#160;</div><div class="line"><a name="l00080"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a7d991d7915e959c1c887fc5c1c37a93f">   80</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1TensorRef.html">TensorRef</a> = <a class="code" href="classcutlass_1_1TensorRef.html">TensorRef&lt;Element, Layout&gt;</a>;</div><div class="line"><a name="l00081"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a0e1c1e0c2565df3ade843682d8532435">   81</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a0e1c1e0c2565df3ade843682d8532435">TensorCoord</a> = <span class="keyword">typename</span> <a class="code" href="structcutlass_1_1layout_1_1PitchLinearCoord.html">Layout::TensorCoord</a>;</div><div class="line"><a name="l00082"></a><span class="lineno">   82</span>&#160;</div><div class="line"><a name="l00083"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a81cc510ffd092b4b002ef42892ffc0ec">   83</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a81cc510ffd092b4b002ef42892ffc0ec">ThreadMap</a> = ThreadMap_;</div><div class="line"><a name="l00084"></a><span class="lineno">   84</span>&#160;</div><div class="line"><a name="l00086"></a><span class="lineno"><a class="line" href="structcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element_0a9491607d11be8e1780e79ad711aa42.html">   86</a></span>&#160;  <span class="keyword">struct </span>Detail {</div><div class="line"><a name="l00089"></a><span class="lineno"><a class="line" href="structcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element_0a9491607d11be8e1780e79ad711aa42.html#a4491955b1e900aa9cf45e610debc3ee8">   89</a></span>&#160;    <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kAccessSizeInBits = 128;</div><div class="line"><a name="l00090"></a><span class="lineno">   90</span>&#160;</div><div class="line"><a name="l00091"></a><span class="lineno">   91</span>&#160;    <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(<a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;Element_&gt;::value</a> *</div><div class="line"><a name="l00092"></a><span class="lineno">   92</span>&#160;                          ThreadMap::kElementsPerAccess ==</div><div class="line"><a name="l00093"></a><span class="lineno">   93</span>&#160;                      kAccessSizeInBits,</div><div class="line"><a name="l00094"></a><span class="lineno">   94</span>&#160;                  <span class="stringliteral">&quot;This iterator requires a policy whose access size is 128bs&quot;</span>);</div><div class="line"><a name="l00095"></a><span class="lineno">   95</span>&#160;</div><div class="line"><a name="l00097"></a><span class="lineno"><a class="line" href="structcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element_0a9491607d11be8e1780e79ad711aa42.html#a5e3a4764a2603fb56a92b24d23b251fa">   97</a></span>&#160;    <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kPointerCount =</div><div class="line"><a name="l00098"></a><span class="lineno">   98</span>&#160;        (ThreadMap::Iterations::kStrided &gt; 1 ? 2 : 1);</div><div class="line"><a name="l00099"></a><span class="lineno">   99</span>&#160;  };</div><div class="line"><a name="l00100"></a><span class="lineno">  100</span>&#160;</div><div class="line"><a name="l00102"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#ac50ad97c2081de5cdd9600f1721c9037">  102</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#ac50ad97c2081de5cdd9600f1721c9037">AccessType</a> = Array&lt;Element, Layout::kElementsPerAccess&gt;;</div><div class="line"><a name="l00103"></a><span class="lineno">  103</span>&#160;</div><div class="line"><a name="l00104"></a><span class="lineno">  104</span>&#160; <span class="keyword">private</span>:</div><div class="line"><a name="l00105"></a><span class="lineno">  105</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00106"></a><span class="lineno">  106</span>&#160;  <span class="comment">// Data members</span></div><div class="line"><a name="l00107"></a><span class="lineno">  107</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00108"></a><span class="lineno">  108</span>&#160;</div><div class="line"><a name="l00110"></a><span class="lineno">  110</span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a636e7123ac8169f41d47e071e460fb81">Index</a> stride_;</div><div class="line"><a name="l00111"></a><span class="lineno">  111</span>&#160;</div><div class="line"><a name="l00113"></a><span class="lineno">  113</span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#ac50ad97c2081de5cdd9600f1721c9037">AccessType</a> *pointer_[Detail::kPointerCount];</div><div class="line"><a name="l00114"></a><span class="lineno">  114</span>&#160;</div><div class="line"><a name="l00116"></a><span class="lineno">  116</span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a636e7123ac8169f41d47e071e460fb81">Index</a> byte_offset_;</div><div class="line"><a name="l00117"></a><span class="lineno">  117</span>&#160;</div><div class="line"><a name="l00119"></a><span class="lineno">  119</span>&#160;  <span class="keywordtype">int</span> iteration_contiguous_;</div><div class="line"><a name="l00120"></a><span class="lineno">  120</span>&#160;</div><div class="line"><a name="l00122"></a><span class="lineno">  122</span>&#160;  <span class="keywordtype">int</span> iteration_strided_;</div><div class="line"><a name="l00123"></a><span class="lineno">  123</span>&#160;</div><div class="line"><a name="l00124"></a><span class="lineno">  124</span>&#160; <span class="keyword">public</span>:</div><div class="line"><a name="l00126"></a><span class="lineno">  126</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00127"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#ae4927c7f718b52aa80f603d9911b9639">  127</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#ae4927c7f718b52aa80f603d9911b9639">RegularTileAccessIterator</a>(<a class="code" href="classcutlass_1_1TensorRef.html">TensorRef</a> ref,  </div><div class="line"><a name="l00128"></a><span class="lineno">  128</span>&#160;                            <span class="keywordtype">int</span> thread_id   </div><div class="line"><a name="l00129"></a><span class="lineno">  129</span>&#160;                            )</div><div class="line"><a name="l00130"></a><span class="lineno">  130</span>&#160;      : stride_(ref.stride(0) / <a class="code" href="structcutlass_1_1layout_1_1TensorOpMultiplicandCongruous.html">Layout</a>::kElementsPerAccess),</div><div class="line"><a name="l00131"></a><span class="lineno">  131</span>&#160;        byte_offset_(0) {</div><div class="line"><a name="l00132"></a><span class="lineno">  132</span>&#160;    <a class="code" href="structcutlass_1_1layout_1_1PitchLinearCoord.html">layout::PitchLinearCoord</a> thread_offset_base =</div><div class="line"><a name="l00133"></a><span class="lineno">  133</span>&#160;        ThreadMap::initial_offset(thread_id);</div><div class="line"><a name="l00134"></a><span class="lineno">  134</span>&#160;</div><div class="line"><a name="l00135"></a><span class="lineno">  135</span>&#160;    <a class="code" href="cutlass_8h.html#a4b1c9f25ab6eaa25e1f2258dd63e6ce4">CUTLASS_PRAGMA_UNROLL</a></div><div class="line"><a name="l00136"></a><span class="lineno">  136</span>&#160;    <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i &lt; Detail::kPointerCount; ++i) {</div><div class="line"><a name="l00137"></a><span class="lineno">  137</span>&#160;      <span class="comment">// This is the offset of a thread within a threadblock tile for a specific</span></div><div class="line"><a name="l00138"></a><span class="lineno">  138</span>&#160;      <span class="comment">// pointer (units of elements)</span></div><div class="line"><a name="l00139"></a><span class="lineno">  139</span>&#160;      <a class="code" href="structcutlass_1_1layout_1_1PitchLinearCoord.html">layout::PitchLinearCoord</a> thread_offset_in_threadblock_tile =</div><div class="line"><a name="l00140"></a><span class="lineno">  140</span>&#160;          thread_offset_base +</div><div class="line"><a name="l00141"></a><span class="lineno">  141</span>&#160;          <a class="code" href="structcutlass_1_1layout_1_1PitchLinearCoord.html">layout::PitchLinearCoord</a>{</div><div class="line"><a name="l00142"></a><span class="lineno">  142</span>&#160;              0, ThreadMap::Detail::WarpThreadArrangement::kStrided * i};</div><div class="line"><a name="l00143"></a><span class="lineno">  143</span>&#160;</div><div class="line"><a name="l00144"></a><span class="lineno">  144</span>&#160;      <span class="comment">// initialize pointer</span></div><div class="line"><a name="l00145"></a><span class="lineno">  145</span>&#160;      pointer_[i] = <span class="keyword">reinterpret_cast&lt;</span><a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#ac50ad97c2081de5cdd9600f1721c9037">AccessType</a> *<span class="keyword">&gt;</span>(</div><div class="line"><a name="l00146"></a><span class="lineno">  146</span>&#160;          ref.<a class="code" href="classcutlass_1_1TensorRef.html#ac7db3ca62ab1dfe0d3ea08bcadbc9352">data</a>() + ref.<a class="code" href="classcutlass_1_1TensorRef.html#a4166ac2a0754574ac21d5d57d74f34e5">offset</a>(thread_offset_in_threadblock_tile));</div><div class="line"><a name="l00147"></a><span class="lineno">  147</span>&#160;    }</div><div class="line"><a name="l00148"></a><span class="lineno">  148</span>&#160;</div><div class="line"><a name="l00149"></a><span class="lineno">  149</span>&#160;    set_iteration_index(0);</div><div class="line"><a name="l00150"></a><span class="lineno">  150</span>&#160;  }</div><div class="line"><a name="l00151"></a><span class="lineno">  151</span>&#160;</div><div class="line"><a name="l00153"></a><span class="lineno">  153</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00154"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a21ec4fc2d56d5cd3bf58426ae01f369c">  154</a></span>&#160;  <span class="keywordtype">void</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a21ec4fc2d56d5cd3bf58426ae01f369c">set_iteration_index</a>(<span class="keywordtype">int</span> index) {</div><div class="line"><a name="l00155"></a><span class="lineno">  155</span>&#160;    iteration_contiguous_ = index % ThreadMap::Iterations::kContiguous;</div><div class="line"><a name="l00156"></a><span class="lineno">  156</span>&#160;    iteration_strided_ = index / ThreadMap::Iterations::kContiguous;</div><div class="line"><a name="l00157"></a><span class="lineno">  157</span>&#160;  }</div><div class="line"><a name="l00158"></a><span class="lineno">  158</span>&#160;</div><div class="line"><a name="l00160"></a><span class="lineno">  160</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00161"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a9d7b736eddaf28d6bd6216ba76396be1">  161</a></span>&#160;  <span class="keywordtype">void</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a9d7b736eddaf28d6bd6216ba76396be1">add_pointer_offset</a>(<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a4051bd65d1bf0b1b127bf46ad2044b83">LongIndex</a> pointer_offset) {</div><div class="line"><a name="l00162"></a><span class="lineno">  162</span>&#160;    byte_offset_ += pointer_offset * <span class="keyword">sizeof</span>(<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a6b2bd7c503e292cdcfa6c18c77cd7baa">Element</a>);</div><div class="line"><a name="l00163"></a><span class="lineno">  163</span>&#160;  }</div><div class="line"><a name="l00164"></a><span class="lineno">  164</span>&#160;</div><div class="line"><a name="l00166"></a><span class="lineno">  166</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00167"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a2c91372a2ea9bbd5ebb6fc529bd64cd6">  167</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#ac50ad97c2081de5cdd9600f1721c9037">AccessType</a> *<span class="keyword">get</span>() <span class="keyword">const</span> {</div><div class="line"><a name="l00168"></a><span class="lineno">  168</span>&#160;    <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#ac50ad97c2081de5cdd9600f1721c9037">AccessType</a> *access_ptr = pointer_[iteration_strided_ &amp; 1];</div><div class="line"><a name="l00169"></a><span class="lineno">  169</span>&#160;    <span class="keywordtype">int</span> stride_idx = (iteration_strided_ &amp; ~1);</div><div class="line"><a name="l00170"></a><span class="lineno">  170</span>&#160;</div><div class="line"><a name="l00171"></a><span class="lineno">  171</span>&#160;    <span class="keywordtype">int</span> access_offset = stride_idx * ThreadMap::Delta::kStrided * stride_ +</div><div class="line"><a name="l00172"></a><span class="lineno">  172</span>&#160;                        iteration_contiguous_ * ThreadMap::Delta::kContiguous /</div><div class="line"><a name="l00173"></a><span class="lineno">  173</span>&#160;                            ThreadMap::kElementsPerAccess;</div><div class="line"><a name="l00174"></a><span class="lineno">  174</span>&#160;</div><div class="line"><a name="l00175"></a><span class="lineno">  175</span>&#160;    <span class="keywordtype">char</span> *access_byte_ptr =</div><div class="line"><a name="l00176"></a><span class="lineno">  176</span>&#160;        <span class="keyword">reinterpret_cast&lt;</span><span class="keywordtype">char</span> *<span class="keyword">&gt;</span>(access_ptr + access_offset);</div><div class="line"><a name="l00177"></a><span class="lineno">  177</span>&#160;    <span class="keywordflow">return</span> <span class="keyword">reinterpret_cast&lt;</span><a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#ac50ad97c2081de5cdd9600f1721c9037">AccessType</a> *<span class="keyword">&gt;</span>(access_byte_ptr + byte_offset_);</div><div class="line"><a name="l00178"></a><span class="lineno">  178</span>&#160;  }</div><div class="line"><a name="l00179"></a><span class="lineno">  179</span>&#160;</div><div class="line"><a name="l00181"></a><span class="lineno">  181</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00182"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a3d07f09c89750c04f1056ae2b2285296">  182</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a> &amp;<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a3d07f09c89750c04f1056ae2b2285296">operator++</a>() {</div><div class="line"><a name="l00183"></a><span class="lineno">  183</span>&#160;    ++iteration_contiguous_;</div><div class="line"><a name="l00184"></a><span class="lineno">  184</span>&#160;</div><div class="line"><a name="l00185"></a><span class="lineno">  185</span>&#160;    <span class="keywordflow">if</span> (iteration_contiguous_ &lt; ThreadMap::Iterations::kContiguous)</div><div class="line"><a name="l00186"></a><span class="lineno">  186</span>&#160;      <span class="keywordflow">return</span> *<span class="keyword">this</span>;</div><div class="line"><a name="l00187"></a><span class="lineno">  187</span>&#160;</div><div class="line"><a name="l00188"></a><span class="lineno">  188</span>&#160;    <span class="comment">// Enter here only if (iteration_contiguous_ ==</span></div><div class="line"><a name="l00189"></a><span class="lineno">  189</span>&#160;    <span class="comment">// ThreadMap::Iteration::kContiguous)</span></div><div class="line"><a name="l00190"></a><span class="lineno">  190</span>&#160;    iteration_contiguous_ = 0;</div><div class="line"><a name="l00191"></a><span class="lineno">  191</span>&#160;    ++iteration_strided_;</div><div class="line"><a name="l00192"></a><span class="lineno">  192</span>&#160;</div><div class="line"><a name="l00193"></a><span class="lineno">  193</span>&#160;    <span class="keywordflow">if</span> (iteration_strided_ &lt; ThreadMap::Iterations::kStrided) {</div><div class="line"><a name="l00194"></a><span class="lineno">  194</span>&#160;      <span class="keywordflow">return</span> *<span class="keyword">this</span>;</div><div class="line"><a name="l00195"></a><span class="lineno">  195</span>&#160;    }</div><div class="line"><a name="l00196"></a><span class="lineno">  196</span>&#160;</div><div class="line"><a name="l00197"></a><span class="lineno">  197</span>&#160;    <span class="comment">// Enter here only if (iteration_strided_ == ThreadMap::Iteration::kStrided)</span></div><div class="line"><a name="l00198"></a><span class="lineno">  198</span>&#160;    <span class="comment">// which means we enter the next tile.</span></div><div class="line"><a name="l00199"></a><span class="lineno">  199</span>&#160;    iteration_strided_ = 0;</div><div class="line"><a name="l00200"></a><span class="lineno">  200</span>&#160;</div><div class="line"><a name="l00201"></a><span class="lineno">  201</span>&#160;    <span class="keywordflow">return</span> *<span class="keyword">this</span>;</div><div class="line"><a name="l00202"></a><span class="lineno">  202</span>&#160;  }</div><div class="line"><a name="l00203"></a><span class="lineno">  203</span>&#160;</div><div class="line"><a name="l00205"></a><span class="lineno">  205</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00206"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#adeec884a4fce07b0fc82d5ba5dd03fe4">  206</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#adeec884a4fce07b0fc82d5ba5dd03fe4">operator++</a>(<span class="keywordtype">int</span>) {</div><div class="line"><a name="l00207"></a><span class="lineno">  207</span>&#160;    <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a> prev(*<span class="keyword">this</span>);</div><div class="line"><a name="l00208"></a><span class="lineno">  208</span>&#160;    this-&gt;<a class="code" href="namespacecutlass.html#a1c7a9e66ca7b5dc7413ea3b8f349530a">operator++</a>();</div><div class="line"><a name="l00209"></a><span class="lineno">  209</span>&#160;</div><div class="line"><a name="l00210"></a><span class="lineno">  210</span>&#160;    <span class="keywordflow">return</span> prev;</div><div class="line"><a name="l00211"></a><span class="lineno">  211</span>&#160;  }</div><div class="line"><a name="l00212"></a><span class="lineno">  212</span>&#160;</div><div class="line"><a name="l00214"></a><span class="lineno">  214</span>&#160;  CUTLASS_DEVICE</div><div class="line"><a name="l00215"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a0b4a33ab3cabb4ffe3a47f5b0ee207d6">  215</a></span>&#160;  <span class="keywordtype">void</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a0b4a33ab3cabb4ffe3a47f5b0ee207d6">add_tile_offset</a>(<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a0e1c1e0c2565df3ade843682d8532435">TensorCoord</a> <span class="keyword">const</span> &amp;coord) {</div><div class="line"><a name="l00216"></a><span class="lineno">  216</span>&#160;    add_pointer_offset(coord.contiguous() * Shape::kContiguous +</div><div class="line"><a name="l00217"></a><span class="lineno">  217</span>&#160;                       coord.strided() * Shape::kStrided * stride_ *</div><div class="line"><a name="l00218"></a><span class="lineno">  218</span>&#160;                           Layout::kElementsPerAccess);</div><div class="line"><a name="l00219"></a><span class="lineno">  219</span>&#160;  }</div><div class="line"><a name="l00220"></a><span class="lineno">  220</span>&#160;};</div><div class="line"><a name="l00221"></a><span class="lineno">  221</span>&#160;</div><div class="line"><a name="l00223"></a><span class="lineno">  223</span>&#160;</div><div class="line"><a name="l00231"></a><span class="lineno">  231</span>&#160;<span class="keyword">template</span> &lt;<span class="keyword">typename</span> Shape_, <span class="keyword">typename</span> Element_, <span class="keywordtype">int</span> AdvanceRank,</div><div class="line"><a name="l00232"></a><span class="lineno">  232</span>&#160;          <span class="keyword">typename</span> ThreadMap_, <span class="keywordtype">int</span> Alignment&gt;</div><div class="line"><a name="l00233"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html">  233</a></span>&#160;<span class="keyword">class </span><a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a>&lt;</div><div class="line"><a name="l00234"></a><span class="lineno">  234</span>&#160;    Shape_, Element_,</div><div class="line"><a name="l00235"></a><span class="lineno">  235</span>&#160;    layout::ColumnMajorTensorOpMultiplicandCongruous&lt;</div><div class="line"><a name="l00236"></a><span class="lineno">  236</span>&#160;        sizeof_bits&lt;Element_&gt;::value, int(128 / sizeof(Element_))&gt;,</div><div class="line"><a name="l00237"></a><span class="lineno">  237</span>&#160;    AdvanceRank, ThreadMap_, Alignment&gt; {</div><div class="line"><a name="l00238"></a><span class="lineno">  238</span>&#160; <span class="keyword">public</span>:</div><div class="line"><a name="l00239"></a><span class="lineno">  239</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(</div><div class="line"><a name="l00240"></a><span class="lineno">  240</span>&#160;      AdvanceRank == 0 || AdvanceRank == 1,</div><div class="line"><a name="l00241"></a><span class="lineno">  241</span>&#160;      <span class="stringliteral">&quot;Specialization for column-major iterator may along advance along the &quot;</span></div><div class="line"><a name="l00242"></a><span class="lineno">  242</span>&#160;      <span class="stringliteral">&quot;columns(rank=0) or rows(rank=1) dimension.&quot;</span>);</div><div class="line"><a name="l00243"></a><span class="lineno">  243</span>&#160;</div><div class="line"><a name="l00244"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a3c99340187479be2fae462f4df982bed">  244</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a3c99340187479be2fae462f4df982bed">Shape</a> = Shape_;</div><div class="line"><a name="l00245"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a18417476d7b76dd34e89b0af174a7bf0">  245</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a18417476d7b76dd34e89b0af174a7bf0">Element</a> = Element_;</div><div class="line"><a name="l00246"></a><span class="lineno">  246</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCongruous.html">Layout</a> = <a class="code" href="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCongruous.html">layout::ColumnMajorTensorOpMultiplicandCongruous</a>&lt;</div><div class="line"><a name="l00247"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a03235e88ac2d0697c9259169fc42e7e8">  247</a></span>&#160;      <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;Element_&gt;::value</a>, int(128 / <span class="keyword">sizeof</span>(Element_))&gt;;</div><div class="line"><a name="l00248"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#ab346174acb993db138cfaed18c61d979">  248</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kAdvanceRank = AdvanceRank;</div><div class="line"><a name="l00249"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#afcbfb246bfbfda546da90c5f908c2664">  249</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kAlignment = Alignment;</div><div class="line"><a name="l00250"></a><span class="lineno">  250</span>&#160;</div><div class="line"><a name="l00251"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a4ba4f46f5286af5b7b647944cf3de8ad">  251</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a4ba4f46f5286af5b7b647944cf3de8ad">Index</a> = <span class="keyword">typename</span> <a class="code" href="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCongruous.html#aa455da7f56592fdb70977b1cad108003">Layout::Index</a>;</div><div class="line"><a name="l00252"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#acee6b05cbcccab9deba3632b35d2f4e7">  252</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#acee6b05cbcccab9deba3632b35d2f4e7">LongIndex</a> = <span class="keyword">typename</span> <a class="code" href="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCongruous.html#a37fd29e6b74010e9a3ae089d6a777724">Layout::LongIndex</a>;</div><div class="line"><a name="l00253"></a><span class="lineno">  253</span>&#160;</div><div class="line"><a name="l00254"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a2b2a8cb71b0c4d7ad9a375427c2f3506">  254</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1TensorRef.html">TensorRef</a> = <a class="code" href="classcutlass_1_1TensorRef.html">TensorRef&lt;Element, Layout&gt;</a>;</div><div class="line"><a name="l00255"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a87a657d6b2aca3a6ca421312235d0335">  255</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a87a657d6b2aca3a6ca421312235d0335">TensorCoord</a> = <span class="keyword">typename</span> <a class="code" href="structcutlass_1_1MatrixCoord.html">Layout::TensorCoord</a>;</div><div class="line"><a name="l00256"></a><span class="lineno">  256</span>&#160;</div><div class="line"><a name="l00257"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a9c7b26f7077030e9ac16a7124f3a6450">  257</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a9c7b26f7077030e9ac16a7124f3a6450">ThreadMap</a> = ThreadMap_;</div><div class="line"><a name="l00258"></a><span class="lineno">  258</span>&#160;</div><div class="line"><a name="l00260"></a><span class="lineno">  260</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">UnderlyingIterator</a> = <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a>&lt;</div><div class="line"><a name="l00261"></a><span class="lineno">  261</span>&#160;      <a class="code" href="structcutlass_1_1layout_1_1PitchLinearShape.html">layout::PitchLinearShape&lt;Shape::kRow, Shape::kColumn&gt;</a>, <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a18417476d7b76dd34e89b0af174a7bf0">Element</a>,</div><div class="line"><a name="l00262"></a><span class="lineno">  262</span>&#160;      <a class="code" href="structcutlass_1_1layout_1_1TensorOpMultiplicandCongruous.html">layout::TensorOpMultiplicandCongruous&lt;sizeof_bits&lt;Element_&gt;::value</a>,</div><div class="line"><a name="l00263"></a><span class="lineno">  263</span>&#160;                                            int(128 / <span class="keyword">sizeof</span>(Element_))&gt;,</div><div class="line"><a name="l00264"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a35113ec61b349163e40d0684762b6d1a">  264</a></span>&#160;      (kAdvanceRank == 0 ? 0 : 1), ThreadMap_&gt;;</div><div class="line"><a name="l00265"></a><span class="lineno">  265</span>&#160;</div><div class="line"><a name="l00266"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a1f1e0d9d6ec1ba0627b0ff95343c5706">  266</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a1f1e0d9d6ec1ba0627b0ff95343c5706">AccessType</a> = <span class="keyword">typename</span> UnderlyingIterator::AccessType;</div><div class="line"><a name="l00267"></a><span class="lineno">  267</span>&#160;</div><div class="line"><a name="l00268"></a><span class="lineno">  268</span>&#160; <span class="keyword">private</span>:</div><div class="line"><a name="l00270"></a><span class="lineno">  270</span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">UnderlyingIterator</a> iterator_;</div><div class="line"><a name="l00271"></a><span class="lineno">  271</span>&#160;</div><div class="line"><a name="l00272"></a><span class="lineno">  272</span>&#160; <span class="keyword">public</span>:</div><div class="line"><a name="l00274"></a><span class="lineno">  274</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00275"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a633db64682aa6494c2553e11614b5e1d">  275</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a633db64682aa6494c2553e11614b5e1d">RegularTileAccessIterator</a>(<a class="code" href="classcutlass_1_1TensorRef.html">TensorRef</a> ref,  </div><div class="line"><a name="l00276"></a><span class="lineno">  276</span>&#160;                            <span class="keywordtype">int</span> thread_id   </div><div class="line"><a name="l00277"></a><span class="lineno">  277</span>&#160;                            )</div><div class="line"><a name="l00278"></a><span class="lineno">  278</span>&#160;      : iterator_({ref.<a class="code" href="classcutlass_1_1TensorRef.html#ac7db3ca62ab1dfe0d3ea08bcadbc9352">data</a>(), ref.<a class="code" href="classcutlass_1_1TensorRef.html#a191e88bc0fb310be655d700e937ab97c">stride</a>()}, thread_id) {}</div><div class="line"><a name="l00279"></a><span class="lineno">  279</span>&#160;</div><div class="line"><a name="l00281"></a><span class="lineno">  281</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00282"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a8358531564ae671621b6bb34ab10663e">  282</a></span>&#160;  <span class="keywordtype">void</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a8358531564ae671621b6bb34ab10663e">set_iteration_index</a>(<span class="keywordtype">int</span> index) { iterator_.set_iteration_index(index); }</div><div class="line"><a name="l00283"></a><span class="lineno">  283</span>&#160;</div><div class="line"><a name="l00285"></a><span class="lineno">  285</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00286"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#acd5af8cbd89b13ad8678be98d495a44b">  286</a></span>&#160;  <span class="keywordtype">void</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#acd5af8cbd89b13ad8678be98d495a44b">add_pointer_offset</a>(<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#acee6b05cbcccab9deba3632b35d2f4e7">LongIndex</a> pointer_offset) {</div><div class="line"><a name="l00287"></a><span class="lineno">  287</span>&#160;    iterator_.add_pointer_offset(pointer_offset);</div><div class="line"><a name="l00288"></a><span class="lineno">  288</span>&#160;  }</div><div class="line"><a name="l00289"></a><span class="lineno">  289</span>&#160;</div><div class="line"><a name="l00291"></a><span class="lineno">  291</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00292"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#ab3681ca017522ca95a379acc6c7ef791">  292</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a1f1e0d9d6ec1ba0627b0ff95343c5706">AccessType</a> *<span class="keyword">get</span>() <span class="keyword">const</span> {</div><div class="line"><a name="l00293"></a><span class="lineno">  293</span>&#160;    <span class="keywordflow">return</span> <span class="keyword">reinterpret_cast&lt;</span><a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a1f1e0d9d6ec1ba0627b0ff95343c5706">AccessType</a> *<span class="keyword">&gt;</span>(iterator_.get());</div><div class="line"><a name="l00294"></a><span class="lineno">  294</span>&#160;  }</div><div class="line"><a name="l00295"></a><span class="lineno">  295</span>&#160;</div><div class="line"><a name="l00297"></a><span class="lineno">  297</span>&#160;  CUTLASS_DEVICE</div><div class="line"><a name="l00298"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a827059393710930e72337cb7c62b6ef2">  298</a></span>&#160;  <span class="keywordtype">void</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a827059393710930e72337cb7c62b6ef2">add_tile_offset</a>(<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a87a657d6b2aca3a6ca421312235d0335">TensorCoord</a> <span class="keyword">const</span> &amp;coord) {</div><div class="line"><a name="l00299"></a><span class="lineno">  299</span>&#160;    iterator_.add_tile_offset({coord.row(), coord.column()});</div><div class="line"><a name="l00300"></a><span class="lineno">  300</span>&#160;  }</div><div class="line"><a name="l00301"></a><span class="lineno">  301</span>&#160;</div><div class="line"><a name="l00303"></a><span class="lineno">  303</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00304"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a3c9014675466aec05102de18ef6eb40a">  304</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a> &amp;<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a3c9014675466aec05102de18ef6eb40a">operator++</a>() {</div><div class="line"><a name="l00305"></a><span class="lineno">  305</span>&#160;    ++iterator_;</div><div class="line"><a name="l00306"></a><span class="lineno">  306</span>&#160;    <span class="keywordflow">return</span> *<span class="keyword">this</span>;</div><div class="line"><a name="l00307"></a><span class="lineno">  307</span>&#160;  }</div><div class="line"><a name="l00308"></a><span class="lineno">  308</span>&#160;</div><div class="line"><a name="l00310"></a><span class="lineno">  310</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00311"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#ab56d2b152243b8898b9f8a77af5b3508">  311</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#ab56d2b152243b8898b9f8a77af5b3508">operator++</a>(<span class="keywordtype">int</span>) {</div><div class="line"><a name="l00312"></a><span class="lineno">  312</span>&#160;    <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a> prev(*<span class="keyword">this</span>);</div><div class="line"><a name="l00313"></a><span class="lineno">  313</span>&#160;    ++iterator_;</div><div class="line"><a name="l00314"></a><span class="lineno">  314</span>&#160;</div><div class="line"><a name="l00315"></a><span class="lineno">  315</span>&#160;    <span class="keywordflow">return</span> prev;</div><div class="line"><a name="l00316"></a><span class="lineno">  316</span>&#160;  }</div><div class="line"><a name="l00317"></a><span class="lineno">  317</span>&#160;};</div><div class="line"><a name="l00318"></a><span class="lineno">  318</span>&#160;</div><div class="line"><a name="l00320"></a><span class="lineno">  320</span>&#160;</div><div class="line"><a name="l00328"></a><span class="lineno">  328</span>&#160;<span class="keyword">template</span> &lt;<span class="keyword">typename</span> Shape_, <span class="keyword">typename</span> Element_, <span class="keywordtype">int</span> AdvanceRank,</div><div class="line"><a name="l00329"></a><span class="lineno">  329</span>&#160;          <span class="keyword">typename</span> ThreadMap_, <span class="keywordtype">int</span> Alignment&gt;</div><div class="line"><a name="l00330"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html">  330</a></span>&#160;<span class="keyword">class </span><a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a>&lt;</div><div class="line"><a name="l00331"></a><span class="lineno">  331</span>&#160;    Shape_, Element_,</div><div class="line"><a name="l00332"></a><span class="lineno">  332</span>&#160;    layout::RowMajorTensorOpMultiplicandCongruous&lt;sizeof_bits&lt;Element_&gt;::value,</div><div class="line"><a name="l00333"></a><span class="lineno">  333</span>&#160;                                                  int(128 / sizeof(Element_))&gt;,</div><div class="line"><a name="l00334"></a><span class="lineno">  334</span>&#160;    AdvanceRank, ThreadMap_, Alignment&gt; {</div><div class="line"><a name="l00335"></a><span class="lineno">  335</span>&#160; <span class="keyword">public</span>:</div><div class="line"><a name="l00336"></a><span class="lineno">  336</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(</div><div class="line"><a name="l00337"></a><span class="lineno">  337</span>&#160;      AdvanceRank == 0 || AdvanceRank == 1,</div><div class="line"><a name="l00338"></a><span class="lineno">  338</span>&#160;      <span class="stringliteral">&quot;Specialization for row-major iterator may along advance along the &quot;</span></div><div class="line"><a name="l00339"></a><span class="lineno">  339</span>&#160;      <span class="stringliteral">&quot;columns(rank=0) or rows(rank=1) dimension.&quot;</span>);</div><div class="line"><a name="l00340"></a><span class="lineno">  340</span>&#160;</div><div class="line"><a name="l00341"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a1c4dbad00b218fa641b615a19d611d9a">  341</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a1c4dbad00b218fa641b615a19d611d9a">Shape</a> = Shape_;</div><div class="line"><a name="l00342"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a3cb17cb1dfcd2791fb05860dbeef6365">  342</a></span>&#160;  <span class="keyword">using</span> Element = Element_;</div><div class="line"><a name="l00343"></a><span class="lineno">  343</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCongruous.html">Layout</a> = <a class="code" href="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCongruous.html">layout::RowMajorTensorOpMultiplicandCongruous</a>&lt;</div><div class="line"><a name="l00344"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a5958d05653fca54158d052d3cdba42ac">  344</a></span>&#160;      <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;Element_&gt;::value</a>, int(128 / <span class="keyword">sizeof</span>(Element_))&gt;;</div><div class="line"><a name="l00345"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#af076255d0a7dde0025c10f69af9b25b9">  345</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kAdvanceRank = AdvanceRank;</div><div class="line"><a name="l00346"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a13df81b103c33b25af2c1f6527ca8584">  346</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kAlignment = Alignment;</div><div class="line"><a name="l00347"></a><span class="lineno">  347</span>&#160;</div><div class="line"><a name="l00348"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a5cc867dbd6b5a122e9951ff492f5238a">  348</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a5cc867dbd6b5a122e9951ff492f5238a">Index</a> = <span class="keyword">typename</span> <a class="code" href="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCongruous.html#a32c8623b9c3c8490263ea0af24a1410f">Layout::Index</a>;</div><div class="line"><a name="l00349"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a81ddaa615b424060e6442d1328d02e55">  349</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a81ddaa615b424060e6442d1328d02e55">LongIndex</a> = <span class="keyword">typename</span> <a class="code" href="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCongruous.html#ad49467d9028288b0bb93dbf376ef573a">Layout::LongIndex</a>;</div><div class="line"><a name="l00350"></a><span class="lineno">  350</span>&#160;</div><div class="line"><a name="l00351"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a868a6daa12db64c972fafb190b0b9bd5">  351</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1TensorRef.html">TensorRef</a> = <a class="code" href="classcutlass_1_1TensorRef.html">TensorRef&lt;Element, Layout&gt;</a>;</div><div class="line"><a name="l00352"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#ad9d32a6458380ec72a6e2315486d20fc">  352</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#ad9d32a6458380ec72a6e2315486d20fc">TensorCoord</a> = <span class="keyword">typename</span> <a class="code" href="structcutlass_1_1MatrixCoord.html">Layout::TensorCoord</a>;</div><div class="line"><a name="l00353"></a><span class="lineno">  353</span>&#160;</div><div class="line"><a name="l00354"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a6a7b6b794720ed928b8744c7cde34aff">  354</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a6a7b6b794720ed928b8744c7cde34aff">ThreadMap</a> = ThreadMap_;</div><div class="line"><a name="l00355"></a><span class="lineno">  355</span>&#160;</div><div class="line"><a name="l00357"></a><span class="lineno">  357</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">UnderlyingIterator</a> = <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a>&lt;</div><div class="line"><a name="l00358"></a><span class="lineno">  358</span>&#160;      <a class="code" href="structcutlass_1_1layout_1_1PitchLinearShape.html">layout::PitchLinearShape&lt;Shape::kColumn, Shape::kRow&gt;</a>, Element,</div><div class="line"><a name="l00359"></a><span class="lineno">  359</span>&#160;      layout::TensorOpMultiplicandCongruous&lt;sizeof_bits&lt;Element_&gt;::value,</div><div class="line"><a name="l00360"></a><span class="lineno">  360</span>&#160;                                            int(128 / <span class="keyword">sizeof</span>(Element_))&gt;,</div><div class="line"><a name="l00361"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a320f3007be32a9deb4bc875e0e837421">  361</a></span>&#160;      (kAdvanceRank == 0 ? 1 : 0), ThreadMap_&gt;;</div><div class="line"><a name="l00362"></a><span class="lineno">  362</span>&#160;</div><div class="line"><a name="l00363"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a9e88ba17c1c659b84511c7dbdf9b665a">  363</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a9e88ba17c1c659b84511c7dbdf9b665a">AccessType</a> = <span class="keyword">typename</span> UnderlyingIterator::AccessType;</div><div class="line"><a name="l00364"></a><span class="lineno">  364</span>&#160;</div><div class="line"><a name="l00365"></a><span class="lineno">  365</span>&#160; <span class="keyword">private</span>:</div><div class="line"><a name="l00367"></a><span class="lineno">  367</span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">UnderlyingIterator</a> iterator_;</div><div class="line"><a name="l00368"></a><span class="lineno">  368</span>&#160;</div><div class="line"><a name="l00369"></a><span class="lineno">  369</span>&#160; <span class="keyword">public</span>:</div><div class="line"><a name="l00371"></a><span class="lineno">  371</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00372"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#abf23348f7e8d3b8aaac6f23c116dcf5c">  372</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#abf23348f7e8d3b8aaac6f23c116dcf5c">RegularTileAccessIterator</a>(<a class="code" href="classcutlass_1_1TensorRef.html">TensorRef</a> ref,  </div><div class="line"><a name="l00373"></a><span class="lineno">  373</span>&#160;                            <span class="keywordtype">int</span> thread_id   </div><div class="line"><a name="l00374"></a><span class="lineno">  374</span>&#160;                            )</div><div class="line"><a name="l00375"></a><span class="lineno">  375</span>&#160;      : iterator_({ref.<a class="code" href="classcutlass_1_1TensorRef.html#ac7db3ca62ab1dfe0d3ea08bcadbc9352">data</a>(), ref.<a class="code" href="classcutlass_1_1TensorRef.html#a191e88bc0fb310be655d700e937ab97c">stride</a>()}, thread_id) {}</div><div class="line"><a name="l00376"></a><span class="lineno">  376</span>&#160;</div><div class="line"><a name="l00378"></a><span class="lineno">  378</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00379"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#aa511f61915cdaccd0e39b7a6b8fb469b">  379</a></span>&#160;  <span class="keywordtype">void</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#aa511f61915cdaccd0e39b7a6b8fb469b">set_iteration_index</a>(<span class="keywordtype">int</span> index) { iterator_.set_iteration_index(index); }</div><div class="line"><a name="l00380"></a><span class="lineno">  380</span>&#160;</div><div class="line"><a name="l00382"></a><span class="lineno">  382</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00383"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a44c0e7a192429e2f051f47572a89446a">  383</a></span>&#160;  <span class="keywordtype">void</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a44c0e7a192429e2f051f47572a89446a">add_pointer_offset</a>(<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a81ddaa615b424060e6442d1328d02e55">LongIndex</a> pointer_offset) {</div><div class="line"><a name="l00384"></a><span class="lineno">  384</span>&#160;    iterator_.add_pointer_offset(pointer_offset);</div><div class="line"><a name="l00385"></a><span class="lineno">  385</span>&#160;  }</div><div class="line"><a name="l00386"></a><span class="lineno">  386</span>&#160;</div><div class="line"><a name="l00388"></a><span class="lineno">  388</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00389"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#aa76837c456b5dd36569863c6b4694243">  389</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a9e88ba17c1c659b84511c7dbdf9b665a">AccessType</a> *<span class="keyword">get</span>() <span class="keyword">const</span> {</div><div class="line"><a name="l00390"></a><span class="lineno">  390</span>&#160;    <span class="keywordflow">return</span> <span class="keyword">reinterpret_cast&lt;</span><a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a9e88ba17c1c659b84511c7dbdf9b665a">AccessType</a> *<span class="keyword">&gt;</span>(iterator_.get());</div><div class="line"><a name="l00391"></a><span class="lineno">  391</span>&#160;  }</div><div class="line"><a name="l00392"></a><span class="lineno">  392</span>&#160;</div><div class="line"><a name="l00394"></a><span class="lineno">  394</span>&#160;  CUTLASS_DEVICE</div><div class="line"><a name="l00395"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a33a042734128cc06fa72b47420b19c36">  395</a></span>&#160;  <span class="keywordtype">void</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a33a042734128cc06fa72b47420b19c36">add_tile_offset</a>(<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#ad9d32a6458380ec72a6e2315486d20fc">TensorCoord</a> <span class="keyword">const</span> &amp;coord) {</div><div class="line"><a name="l00396"></a><span class="lineno">  396</span>&#160;    iterator_.add_tile_offset({coord.column(), coord.row()});</div><div class="line"><a name="l00397"></a><span class="lineno">  397</span>&#160;  }</div><div class="line"><a name="l00398"></a><span class="lineno">  398</span>&#160;</div><div class="line"><a name="l00400"></a><span class="lineno">  400</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00401"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#ad3153ccc12d036260b80a0a6ab4081d5">  401</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a> &amp;<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#ad3153ccc12d036260b80a0a6ab4081d5">operator++</a>() {</div><div class="line"><a name="l00402"></a><span class="lineno">  402</span>&#160;    ++iterator_;</div><div class="line"><a name="l00403"></a><span class="lineno">  403</span>&#160;    <span class="keywordflow">return</span> *<span class="keyword">this</span>;</div><div class="line"><a name="l00404"></a><span class="lineno">  404</span>&#160;  }</div><div class="line"><a name="l00405"></a><span class="lineno">  405</span>&#160;</div><div class="line"><a name="l00407"></a><span class="lineno">  407</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00408"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#ace8da2b9203dd41a4130fdbbdc84f556">  408</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#ace8da2b9203dd41a4130fdbbdc84f556">operator++</a>(<span class="keywordtype">int</span>) {</div><div class="line"><a name="l00409"></a><span class="lineno">  409</span>&#160;    <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a> prev(*<span class="keyword">this</span>);</div><div class="line"><a name="l00410"></a><span class="lineno">  410</span>&#160;    ++iterator_;</div><div class="line"><a name="l00411"></a><span class="lineno">  411</span>&#160;</div><div class="line"><a name="l00412"></a><span class="lineno">  412</span>&#160;    <span class="keywordflow">return</span> prev;</div><div class="line"><a name="l00413"></a><span class="lineno">  413</span>&#160;  }</div><div class="line"><a name="l00414"></a><span class="lineno">  414</span>&#160;};</div><div class="line"><a name="l00415"></a><span class="lineno">  415</span>&#160;</div><div class="line"><a name="l00417"></a><span class="lineno">  417</span>&#160;</div><div class="line"><a name="l00425"></a><span class="lineno">  425</span>&#160;<span class="keyword">template</span> &lt;<span class="keyword">typename</span> Shape_, <span class="keyword">typename</span> Element_, <span class="keywordtype">int</span> AdvanceRank,</div><div class="line"><a name="l00426"></a><span class="lineno">  426</span>&#160;          <span class="keyword">typename</span> ThreadMap_, <span class="keywordtype">int</span> Alignment, <span class="keywordtype">int</span> Crosswise&gt;</div><div class="line"><a name="l00427"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html">  427</a></span>&#160;<span class="keyword">class </span><a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a>&lt;Shape_, Element_,</div><div class="line"><a name="l00428"></a><span class="lineno">  428</span>&#160;                                layout::TensorOpMultiplicandCrosswise&lt;</div><div class="line"><a name="l00429"></a><span class="lineno">  429</span>&#160;                                    sizeof_bits&lt;Element_&gt;::value, Crosswise&gt;,</div><div class="line"><a name="l00430"></a><span class="lineno">  430</span>&#160;                                AdvanceRank, ThreadMap_, Alignment&gt; {</div><div class="line"><a name="l00431"></a><span class="lineno">  431</span>&#160; <span class="keyword">public</span>:</div><div class="line"><a name="l00432"></a><span class="lineno">  432</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(</div><div class="line"><a name="l00433"></a><span class="lineno">  433</span>&#160;      AdvanceRank == 0 || AdvanceRank == 1,</div><div class="line"><a name="l00434"></a><span class="lineno">  434</span>&#160;      <span class="stringliteral">&quot;Specialization for pitch-linear iterator may along advance along the &quot;</span></div><div class="line"><a name="l00435"></a><span class="lineno">  435</span>&#160;      <span class="stringliteral">&quot;contiguous(rank=0) or strided(rank=1) dimension.&quot;</span>);</div><div class="line"><a name="l00436"></a><span class="lineno">  436</span>&#160;</div><div class="line"><a name="l00437"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#aab0cd2dae6c59807b02b6ee5119d73a3">  437</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#aab0cd2dae6c59807b02b6ee5119d73a3">Shape</a> = Shape_;</div><div class="line"><a name="l00438"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a73a09a50b2f440ec24e8816daa904c28">  438</a></span>&#160;  <span class="keyword">using</span> Element = Element_;</div><div class="line"><a name="l00439"></a><span class="lineno">  439</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1layout_1_1TensorOpMultiplicandCrosswise.html">Layout</a> =</div><div class="line"><a name="l00440"></a><span class="lineno">  440</span>&#160;      <a class="code" href="structcutlass_1_1layout_1_1TensorOpMultiplicandCrosswise.html">layout::TensorOpMultiplicandCrosswise&lt;sizeof_bits&lt;Element_&gt;::value</a>,</div><div class="line"><a name="l00441"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a15f26bb9cabd05984ef2cce8ee0e41fb">  441</a></span>&#160;                                            Crosswise&gt;;</div><div class="line"><a name="l00442"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a55f42293c103fdc0771abb0ba0b6fc6e">  442</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kAdvanceRank = AdvanceRank;</div><div class="line"><a name="l00443"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a25cf1f0784f01682051fa28d15e28b4d">  443</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kAlignment = Alignment;</div><div class="line"><a name="l00444"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a6fcdcb5f60d4afb2d2ac8db323ca4061">  444</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kCrosswise = Crosswise;</div><div class="line"><a name="l00445"></a><span class="lineno">  445</span>&#160;</div><div class="line"><a name="l00446"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#abc58f5f5ad3c41b62db504ef05bf7a93">  446</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#abc58f5f5ad3c41b62db504ef05bf7a93">Index</a> = <span class="keyword">typename</span> <a class="code" href="structcutlass_1_1layout_1_1TensorOpMultiplicandCrosswise.html#a4e8aa7fa89ae4ebd8afe284a9786df27">Layout::Index</a>;</div><div class="line"><a name="l00447"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#af7654c26faa6bbef9898085f10bceb9f">  447</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#af7654c26faa6bbef9898085f10bceb9f">LongIndex</a> = <span class="keyword">typename</span> <a class="code" href="structcutlass_1_1layout_1_1TensorOpMultiplicandCrosswise.html#a07de92ffadfe255537479c37b04cde6f">Layout::LongIndex</a>;</div><div class="line"><a name="l00448"></a><span class="lineno">  448</span>&#160;</div><div class="line"><a name="l00449"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#ac27f139ceb817ff94954f2f8da4d5a19">  449</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1TensorRef.html">TensorRef</a> = <a class="code" href="classcutlass_1_1TensorRef.html">TensorRef&lt;Element, Layout&gt;</a>;</div><div class="line"><a name="l00450"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a55aff8c59952d96e4359005dac44db34">  450</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a55aff8c59952d96e4359005dac44db34">TensorCoord</a> = <span class="keyword">typename</span> <a class="code" href="structcutlass_1_1layout_1_1PitchLinearCoord.html">Layout::TensorCoord</a>;</div><div class="line"><a name="l00451"></a><span class="lineno">  451</span>&#160;</div><div class="line"><a name="l00452"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#acc8da22531c619ac3ef5e817fef2d52f">  452</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#acc8da22531c619ac3ef5e817fef2d52f">ThreadMap</a> = ThreadMap_;</div><div class="line"><a name="l00453"></a><span class="lineno">  453</span>&#160;</div><div class="line"><a name="l00455"></a><span class="lineno"><a class="line" href="structcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element_3be8b96d170d886f39b6b30acab65e7a.html">  455</a></span>&#160;  <span class="keyword">struct </span>Detail {</div><div class="line"><a name="l00458"></a><span class="lineno"><a class="line" href="structcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element_3be8b96d170d886f39b6b30acab65e7a.html#a1ef8ca3c06d9ce974836317f67b5d752">  458</a></span>&#160;    <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kAccessSizeInBits = 128;</div><div class="line"><a name="l00459"></a><span class="lineno">  459</span>&#160;</div><div class="line"><a name="l00460"></a><span class="lineno">  460</span>&#160;    <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(<a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;Element_&gt;::value</a> *</div><div class="line"><a name="l00461"></a><span class="lineno">  461</span>&#160;                          ThreadMap::kElementsPerAccess ==</div><div class="line"><a name="l00462"></a><span class="lineno">  462</span>&#160;                      kAccessSizeInBits,</div><div class="line"><a name="l00463"></a><span class="lineno">  463</span>&#160;                  <span class="stringliteral">&quot;This iterator requires a policy whose access size is 128bs&quot;</span>);</div><div class="line"><a name="l00464"></a><span class="lineno">  464</span>&#160;</div><div class="line"><a name="l00469"></a><span class="lineno"><a class="line" href="structcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element_3be8b96d170d886f39b6b30acab65e7a.html#af6f2e4a74ec2bd4c258208d53e06f4d0">  469</a></span>&#160;    <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kPointerCount =</div><div class="line"><a name="l00470"></a><span class="lineno">  470</span>&#160;        (ThreadMap::Iterations::kStrided &gt; 1 ? 2 : 1);</div><div class="line"><a name="l00471"></a><span class="lineno">  471</span>&#160;  };</div><div class="line"><a name="l00472"></a><span class="lineno">  472</span>&#160;</div><div class="line"><a name="l00474"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a5f26df7eaec00b0535fb5193d7ee9618">  474</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a5f26df7eaec00b0535fb5193d7ee9618">AccessType</a> = Array&lt;Element, Layout::kElementsPerAccess&gt;;</div><div class="line"><a name="l00475"></a><span class="lineno">  475</span>&#160;</div><div class="line"><a name="l00476"></a><span class="lineno">  476</span>&#160; <span class="keyword">private</span>:</div><div class="line"><a name="l00477"></a><span class="lineno">  477</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00478"></a><span class="lineno">  478</span>&#160;  <span class="comment">// Data members</span></div><div class="line"><a name="l00479"></a><span class="lineno">  479</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00480"></a><span class="lineno">  480</span>&#160;</div><div class="line"><a name="l00485"></a><span class="lineno">  485</span>&#160;  <span class="keywordtype">int</span> sections_;</div><div class="line"><a name="l00486"></a><span class="lineno">  486</span>&#160;</div><div class="line"><a name="l00488"></a><span class="lineno">  488</span>&#160;  <span class="keywordtype">int</span> sections_per_stage_;</div><div class="line"><a name="l00489"></a><span class="lineno">  489</span>&#160;</div><div class="line"><a name="l00491"></a><span class="lineno">  491</span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#abc58f5f5ad3c41b62db504ef05bf7a93">Index</a> stride_;</div><div class="line"><a name="l00492"></a><span class="lineno">  492</span>&#160;</div><div class="line"><a name="l00494"></a><span class="lineno">  494</span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a5f26df7eaec00b0535fb5193d7ee9618">AccessType</a> *pointer_[Detail::kPointerCount];</div><div class="line"><a name="l00495"></a><span class="lineno">  495</span>&#160;</div><div class="line"><a name="l00497"></a><span class="lineno">  497</span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#abc58f5f5ad3c41b62db504ef05bf7a93">Index</a> byte_offset_;</div><div class="line"><a name="l00498"></a><span class="lineno">  498</span>&#160;</div><div class="line"><a name="l00500"></a><span class="lineno">  500</span>&#160;  <span class="keywordtype">int</span> iteration_contiguous_;</div><div class="line"><a name="l00501"></a><span class="lineno">  501</span>&#160;</div><div class="line"><a name="l00503"></a><span class="lineno">  503</span>&#160;  <span class="keywordtype">int</span> iteration_strided_;</div><div class="line"><a name="l00504"></a><span class="lineno">  504</span>&#160;</div><div class="line"><a name="l00505"></a><span class="lineno">  505</span>&#160; <span class="keyword">public</span>:</div><div class="line"><a name="l00507"></a><span class="lineno">  507</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00508"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a0f1e846cd4287c51e2d6135a8472c1a8">  508</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a0f1e846cd4287c51e2d6135a8472c1a8">RegularTileAccessIterator</a>(<a class="code" href="classcutlass_1_1TensorRef.html">TensorRef</a> ref,  </div><div class="line"><a name="l00509"></a><span class="lineno">  509</span>&#160;                            <span class="keywordtype">int</span> thread_id   </div><div class="line"><a name="l00510"></a><span class="lineno">  510</span>&#160;                            )</div><div class="line"><a name="l00511"></a><span class="lineno">  511</span>&#160;      : sections_(ref.stride(0) / kCrosswise),</div><div class="line"><a name="l00512"></a><span class="lineno">  512</span>&#160;        sections_per_stage_(<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#aab0cd2dae6c59807b02b6ee5119d73a3">Shape</a>::kContiguous / kCrosswise),</div><div class="line"><a name="l00513"></a><span class="lineno">  513</span>&#160;        <span class="comment">// stride_ = kCrosswise x sections_ x kFactor</span></div><div class="line"><a name="l00514"></a><span class="lineno">  514</span>&#160;        stride_(ref.stride(0) * <a class="code" href="structcutlass_1_1layout_1_1TensorOpMultiplicandCrosswise.html">Layout</a>::kFactor / <a class="code" href="structcutlass_1_1layout_1_1TensorOpMultiplicandCrosswise.html">Layout</a>::kElementsPerAccess),</div><div class="line"><a name="l00515"></a><span class="lineno">  515</span>&#160;        byte_offset_(0) {</div><div class="line"><a name="l00516"></a><span class="lineno">  516</span>&#160;    <a class="code" href="structcutlass_1_1layout_1_1PitchLinearCoord.html">layout::PitchLinearCoord</a> thread_offset_base =</div><div class="line"><a name="l00517"></a><span class="lineno">  517</span>&#160;        ThreadMap::initial_offset(thread_id);</div><div class="line"><a name="l00518"></a><span class="lineno">  518</span>&#160;</div><div class="line"><a name="l00519"></a><span class="lineno">  519</span>&#160;    <a class="code" href="cutlass_8h.html#a4b1c9f25ab6eaa25e1f2258dd63e6ce4">CUTLASS_PRAGMA_UNROLL</a></div><div class="line"><a name="l00520"></a><span class="lineno">  520</span>&#160;    <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i &lt; Detail::kPointerCount; ++i) {</div><div class="line"><a name="l00521"></a><span class="lineno">  521</span>&#160;      <span class="comment">// This is the offset of a thread within a threadblock tile for a specific</span></div><div class="line"><a name="l00522"></a><span class="lineno">  522</span>&#160;      <span class="comment">// pointer (units of elements)</span></div><div class="line"><a name="l00523"></a><span class="lineno">  523</span>&#160;      <a class="code" href="structcutlass_1_1layout_1_1PitchLinearCoord.html">layout::PitchLinearCoord</a> thread_offset_in_threadblock_tile =</div><div class="line"><a name="l00524"></a><span class="lineno">  524</span>&#160;          thread_offset_base +</div><div class="line"><a name="l00525"></a><span class="lineno">  525</span>&#160;          <a class="code" href="structcutlass_1_1layout_1_1PitchLinearCoord.html">layout::PitchLinearCoord</a>{</div><div class="line"><a name="l00526"></a><span class="lineno">  526</span>&#160;              0, ThreadMap::Detail::WarpThreadArrangement::kStrided * i};</div><div class="line"><a name="l00527"></a><span class="lineno">  527</span>&#160;      <span class="comment">// initialize pointer</span></div><div class="line"><a name="l00528"></a><span class="lineno">  528</span>&#160;      pointer_[i] = <span class="keyword">reinterpret_cast&lt;</span><a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a5f26df7eaec00b0535fb5193d7ee9618">AccessType</a> *<span class="keyword">&gt;</span>(ref.<a class="code" href="classcutlass_1_1TensorRef.html#ac7db3ca62ab1dfe0d3ea08bcadbc9352">data</a>()) +</div><div class="line"><a name="l00529"></a><span class="lineno">  529</span>&#160;                    ref.<a class="code" href="classcutlass_1_1TensorRef.html#a4166ac2a0754574ac21d5d57d74f34e5">offset</a>(thread_offset_in_threadblock_tile) /</div><div class="line"><a name="l00530"></a><span class="lineno">  530</span>&#160;                        Layout::kElementsPerAccess;</div><div class="line"><a name="l00531"></a><span class="lineno">  531</span>&#160;    }</div><div class="line"><a name="l00532"></a><span class="lineno">  532</span>&#160;</div><div class="line"><a name="l00533"></a><span class="lineno">  533</span>&#160;    set_iteration_index(0);</div><div class="line"><a name="l00534"></a><span class="lineno">  534</span>&#160;  }</div><div class="line"><a name="l00535"></a><span class="lineno">  535</span>&#160;</div><div class="line"><a name="l00537"></a><span class="lineno">  537</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00538"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a4ecee87aa180496eff8cb783602322f3">  538</a></span>&#160;  <span class="keywordtype">void</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a4ecee87aa180496eff8cb783602322f3">set_iteration_index</a>(<span class="keywordtype">int</span> index) {</div><div class="line"><a name="l00539"></a><span class="lineno">  539</span>&#160;    iteration_contiguous_ = index % ThreadMap::Iterations::kContiguous;</div><div class="line"><a name="l00540"></a><span class="lineno">  540</span>&#160;    iteration_strided_ = index / ThreadMap::Iterations::kContiguous;</div><div class="line"><a name="l00541"></a><span class="lineno">  541</span>&#160;  }</div><div class="line"><a name="l00542"></a><span class="lineno">  542</span>&#160;</div><div class="line"><a name="l00544"></a><span class="lineno">  544</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00545"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a25e54d78f1b424ead16b5e64e6db63eb">  545</a></span>&#160;  <span class="keywordtype">void</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a25e54d78f1b424ead16b5e64e6db63eb">add_pointer_offset</a>(<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#af7654c26faa6bbef9898085f10bceb9f">LongIndex</a> pointer_offset) {</div><div class="line"><a name="l00546"></a><span class="lineno">  546</span>&#160;    byte_offset_ += pointer_offset * <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;Element&gt;::value</a> / 8;</div><div class="line"><a name="l00547"></a><span class="lineno">  547</span>&#160;  }</div><div class="line"><a name="l00548"></a><span class="lineno">  548</span>&#160;</div><div class="line"><a name="l00550"></a><span class="lineno">  550</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00551"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#ae7f1dcf320dc23628a1e01bef93451c6">  551</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a5f26df7eaec00b0535fb5193d7ee9618">AccessType</a> *<span class="keyword">get</span>() <span class="keyword">const</span> {</div><div class="line"><a name="l00552"></a><span class="lineno">  552</span>&#160;    <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a5f26df7eaec00b0535fb5193d7ee9618">AccessType</a> *access_ptr = pointer_[iteration_strided_ &amp; 1];</div><div class="line"><a name="l00553"></a><span class="lineno">  553</span>&#160;    <span class="keywordtype">int</span> stride_idx = (iteration_strided_ &amp; ~1);</div><div class="line"><a name="l00554"></a><span class="lineno">  554</span>&#160;</div><div class="line"><a name="l00555"></a><span class="lineno">  555</span>&#160;    <span class="keywordtype">int</span> access_offset =</div><div class="line"><a name="l00556"></a><span class="lineno">  556</span>&#160;        stride_idx * ThreadMap::Delta::kStrided * stride_ / Layout::kFactor +</div><div class="line"><a name="l00557"></a><span class="lineno">  557</span>&#160;        iteration_contiguous_ * ThreadMap::Delta::kContiguous /</div><div class="line"><a name="l00558"></a><span class="lineno">  558</span>&#160;            ThreadMap::kElementsPerAccess;</div><div class="line"><a name="l00559"></a><span class="lineno">  559</span>&#160;    <span class="keywordtype">char</span> *access_byte_ptr =</div><div class="line"><a name="l00560"></a><span class="lineno">  560</span>&#160;        <span class="keyword">reinterpret_cast&lt;</span><span class="keywordtype">char</span> *<span class="keyword">&gt;</span>(access_ptr + access_offset);</div><div class="line"><a name="l00561"></a><span class="lineno">  561</span>&#160;    <span class="keywordflow">return</span> <span class="keyword">reinterpret_cast&lt;</span><a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a5f26df7eaec00b0535fb5193d7ee9618">AccessType</a> *<span class="keyword">&gt;</span>(access_byte_ptr + byte_offset_);</div><div class="line"><a name="l00562"></a><span class="lineno">  562</span>&#160;  }</div><div class="line"><a name="l00563"></a><span class="lineno">  563</span>&#160;</div><div class="line"><a name="l00565"></a><span class="lineno">  565</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00566"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a6007be94e0b9bc75d315e5ef95fa2420">  566</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a> &amp;<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a6007be94e0b9bc75d315e5ef95fa2420">operator++</a>() {</div><div class="line"><a name="l00567"></a><span class="lineno">  567</span>&#160;    ++iteration_contiguous_;</div><div class="line"><a name="l00568"></a><span class="lineno">  568</span>&#160;</div><div class="line"><a name="l00569"></a><span class="lineno">  569</span>&#160;    <span class="keywordflow">if</span> (iteration_contiguous_ &lt; ThreadMap::Iterations::kContiguous)</div><div class="line"><a name="l00570"></a><span class="lineno">  570</span>&#160;      <span class="keywordflow">return</span> *<span class="keyword">this</span>;</div><div class="line"><a name="l00571"></a><span class="lineno">  571</span>&#160;</div><div class="line"><a name="l00572"></a><span class="lineno">  572</span>&#160;    <span class="comment">// Enter here only if (iteration_contiguous_ ==</span></div><div class="line"><a name="l00573"></a><span class="lineno">  573</span>&#160;    <span class="comment">// ThreadMap::Iteration::kContiguous)</span></div><div class="line"><a name="l00574"></a><span class="lineno">  574</span>&#160;    iteration_contiguous_ = 0;</div><div class="line"><a name="l00575"></a><span class="lineno">  575</span>&#160;    ++iteration_strided_;</div><div class="line"><a name="l00576"></a><span class="lineno">  576</span>&#160;</div><div class="line"><a name="l00577"></a><span class="lineno">  577</span>&#160;    <span class="keywordflow">if</span> (iteration_strided_ &lt; ThreadMap::Iterations::kStrided) {</div><div class="line"><a name="l00578"></a><span class="lineno">  578</span>&#160;      <span class="keywordflow">return</span> *<span class="keyword">this</span>;</div><div class="line"><a name="l00579"></a><span class="lineno">  579</span>&#160;    }</div><div class="line"><a name="l00580"></a><span class="lineno">  580</span>&#160;</div><div class="line"><a name="l00581"></a><span class="lineno">  581</span>&#160;    <span class="comment">// Enter here only if (iteration_strided_ == ThreadMap::Iteration::kStrided)</span></div><div class="line"><a name="l00582"></a><span class="lineno">  582</span>&#160;    <span class="comment">// which means we enter the next section.</span></div><div class="line"><a name="l00583"></a><span class="lineno">  583</span>&#160;    iteration_strided_ = 0;</div><div class="line"><a name="l00584"></a><span class="lineno">  584</span>&#160;</div><div class="line"><a name="l00585"></a><span class="lineno">  585</span>&#160;    <span class="keywordflow">return</span> *<span class="keyword">this</span>;</div><div class="line"><a name="l00586"></a><span class="lineno">  586</span>&#160;  }</div><div class="line"><a name="l00587"></a><span class="lineno">  587</span>&#160;</div><div class="line"><a name="l00589"></a><span class="lineno">  589</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00590"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a352c7685cb9a37ba214609fe9ccb12e2">  590</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a352c7685cb9a37ba214609fe9ccb12e2">operator++</a>(<span class="keywordtype">int</span>) {</div><div class="line"><a name="l00591"></a><span class="lineno">  591</span>&#160;    <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a> prev(*<span class="keyword">this</span>);</div><div class="line"><a name="l00592"></a><span class="lineno">  592</span>&#160;    this-&gt;<a class="code" href="namespacecutlass.html#a1c7a9e66ca7b5dc7413ea3b8f349530a">operator++</a>();</div><div class="line"><a name="l00593"></a><span class="lineno">  593</span>&#160;</div><div class="line"><a name="l00594"></a><span class="lineno">  594</span>&#160;    <span class="keywordflow">return</span> prev;</div><div class="line"><a name="l00595"></a><span class="lineno">  595</span>&#160;  }</div><div class="line"><a name="l00596"></a><span class="lineno">  596</span>&#160;</div><div class="line"><a name="l00598"></a><span class="lineno">  598</span>&#160;  CUTLASS_DEVICE</div><div class="line"><a name="l00599"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a2cd2b330fdbe50d7514cb051b96a8d85">  599</a></span>&#160;  <span class="keywordtype">void</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a2cd2b330fdbe50d7514cb051b96a8d85">add_tile_offset</a>(<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a55aff8c59952d96e4359005dac44db34">TensorCoord</a> <span class="keyword">const</span> &amp;coord) {</div><div class="line"><a name="l00600"></a><span class="lineno">  600</span>&#160;    add_pointer_offset(coord.contiguous() * sections_per_stage_ * stride_ *</div><div class="line"><a name="l00601"></a><span class="lineno">  601</span>&#160;                           ThreadMap::kElementsPerAccess / sections_ +</div><div class="line"><a name="l00602"></a><span class="lineno">  602</span>&#160;                       coord.strided() * Shape::kStrided * stride_ *</div><div class="line"><a name="l00603"></a><span class="lineno">  603</span>&#160;                           Layout::kElementsPerAccess);</div><div class="line"><a name="l00604"></a><span class="lineno">  604</span>&#160;  }</div><div class="line"><a name="l00605"></a><span class="lineno">  605</span>&#160;};</div><div class="line"><a name="l00606"></a><span class="lineno">  606</span>&#160;</div><div class="line"><a name="l00608"></a><span class="lineno">  608</span>&#160;</div><div class="line"><a name="l00616"></a><span class="lineno">  616</span>&#160;<span class="keyword">template</span> &lt;<span class="keyword">typename</span> Shape_, <span class="keyword">typename</span> Element_, <span class="keywordtype">int</span> AdvanceRank,</div><div class="line"><a name="l00617"></a><span class="lineno">  617</span>&#160;          <span class="keyword">typename</span> ThreadMap_, <span class="keywordtype">int</span> Alignment, <span class="keywordtype">int</span> Crosswise&gt;</div><div class="line"><a name="l00618"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html">  618</a></span>&#160;<span class="keyword">class </span><a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a>&lt;</div><div class="line"><a name="l00619"></a><span class="lineno">  619</span>&#160;    Shape_, Element_,</div><div class="line"><a name="l00620"></a><span class="lineno">  620</span>&#160;    layout::ColumnMajorTensorOpMultiplicandCrosswise&lt;</div><div class="line"><a name="l00621"></a><span class="lineno">  621</span>&#160;        sizeof_bits&lt;Element_&gt;::value, Crosswise&gt;,</div><div class="line"><a name="l00622"></a><span class="lineno">  622</span>&#160;    AdvanceRank, ThreadMap_, Alignment&gt; {</div><div class="line"><a name="l00623"></a><span class="lineno">  623</span>&#160; <span class="keyword">public</span>:</div><div class="line"><a name="l00624"></a><span class="lineno">  624</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(</div><div class="line"><a name="l00625"></a><span class="lineno">  625</span>&#160;      AdvanceRank == 0 || AdvanceRank == 1,</div><div class="line"><a name="l00626"></a><span class="lineno">  626</span>&#160;      <span class="stringliteral">&quot;Specialization for column-major iterator may along advance along the &quot;</span></div><div class="line"><a name="l00627"></a><span class="lineno">  627</span>&#160;      <span class="stringliteral">&quot;columns(rank=0) or rows(rank=1) dimension.&quot;</span>);</div><div class="line"><a name="l00628"></a><span class="lineno">  628</span>&#160;</div><div class="line"><a name="l00629"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#ab234a568898813621a9e3ff9436d5042">  629</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#ab234a568898813621a9e3ff9436d5042">Shape</a> = Shape_;</div><div class="line"><a name="l00630"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a18f3aab646ceffb951b9069be00b9930">  630</a></span>&#160;  <span class="keyword">using</span> Element = Element_;</div><div class="line"><a name="l00631"></a><span class="lineno">  631</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCrosswise.html">Layout</a> = <a class="code" href="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCrosswise.html">layout::ColumnMajorTensorOpMultiplicandCrosswise</a>&lt;</div><div class="line"><a name="l00632"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a1e68bd5d902141ecd4281fcbbcf855be">  632</a></span>&#160;      <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;Element_&gt;::value</a>, Crosswise&gt;;</div><div class="line"><a name="l00633"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a67c0493b9d10db5185437f942bc4374a">  633</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kAdvanceRank = AdvanceRank;</div><div class="line"><a name="l00634"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#ad1194d03b3694a66b06fcd2c2b526921">  634</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kAlignment = Alignment;</div><div class="line"><a name="l00635"></a><span class="lineno">  635</span>&#160;</div><div class="line"><a name="l00636"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a052f3d5d2f3f2f4578a3b59c8e88a676">  636</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a052f3d5d2f3f2f4578a3b59c8e88a676">Index</a> = <span class="keyword">typename</span> <a class="code" href="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCrosswise.html#af9367fe9d6c5d95367d84dbab02dd0fe">Layout::Index</a>;</div><div class="line"><a name="l00637"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a17f3bf28de19feaafff96d2e0c558047">  637</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a17f3bf28de19feaafff96d2e0c558047">LongIndex</a> = <span class="keyword">typename</span> <a class="code" href="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCrosswise.html#a8e1f0b54a8c1b3f37df9ec0dd3548985">Layout::LongIndex</a>;</div><div class="line"><a name="l00638"></a><span class="lineno">  638</span>&#160;</div><div class="line"><a name="l00639"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a74ab4aebdcd2527f2f09ad1762b45544">  639</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1TensorRef.html">TensorRef</a> = <a class="code" href="classcutlass_1_1TensorRef.html">TensorRef&lt;Element, Layout&gt;</a>;</div><div class="line"><a name="l00640"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#aa5637b83cdd83081e239e44ffe46c466">  640</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#aa5637b83cdd83081e239e44ffe46c466">TensorCoord</a> = <span class="keyword">typename</span> <a class="code" href="structcutlass_1_1MatrixCoord.html">Layout::TensorCoord</a>;</div><div class="line"><a name="l00641"></a><span class="lineno">  641</span>&#160;</div><div class="line"><a name="l00642"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a4b27e67450659f3e892f08c0def0fbbe">  642</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a4b27e67450659f3e892f08c0def0fbbe">ThreadMap</a> = ThreadMap_;</div><div class="line"><a name="l00643"></a><span class="lineno">  643</span>&#160;</div><div class="line"><a name="l00645"></a><span class="lineno">  645</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">UnderlyingIterator</a> = <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a>&lt;</div><div class="line"><a name="l00646"></a><span class="lineno">  646</span>&#160;      layout::PitchLinearShape&lt;Shape::kRow, Shape::kColumn&gt;, Element,</div><div class="line"><a name="l00647"></a><span class="lineno">  647</span>&#160;      <a class="code" href="structcutlass_1_1layout_1_1TensorOpMultiplicandCrosswise.html">layout::TensorOpMultiplicandCrosswise&lt;sizeof_bits&lt;Element_&gt;::value</a>,</div><div class="line"><a name="l00648"></a><span class="lineno">  648</span>&#160;                                            Crosswise&gt;,</div><div class="line"><a name="l00649"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#aa745b5e691ec86d1ec68aa880d16450f">  649</a></span>&#160;      (kAdvanceRank == 0 ? 0 : 1), ThreadMap_&gt;;</div><div class="line"><a name="l00650"></a><span class="lineno">  650</span>&#160;</div><div class="line"><a name="l00651"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#af017aa6ea6f90f1693c0ae274402852e">  651</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#af017aa6ea6f90f1693c0ae274402852e">AccessType</a> = <span class="keyword">typename</span> UnderlyingIterator::AccessType;</div><div class="line"><a name="l00652"></a><span class="lineno">  652</span>&#160;</div><div class="line"><a name="l00653"></a><span class="lineno">  653</span>&#160; <span class="keyword">private</span>:</div><div class="line"><a name="l00655"></a><span class="lineno">  655</span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">UnderlyingIterator</a> iterator_;</div><div class="line"><a name="l00656"></a><span class="lineno">  656</span>&#160;</div><div class="line"><a name="l00657"></a><span class="lineno">  657</span>&#160; <span class="keyword">public</span>:</div><div class="line"><a name="l00659"></a><span class="lineno">  659</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00660"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#acc48b323a8a9a8e75e0bfdb77c1cbcc5">  660</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#acc48b323a8a9a8e75e0bfdb77c1cbcc5">RegularTileAccessIterator</a>(<a class="code" href="classcutlass_1_1TensorRef.html">TensorRef</a> ref,  </div><div class="line"><a name="l00661"></a><span class="lineno">  661</span>&#160;                            <span class="keywordtype">int</span> thread_id   </div><div class="line"><a name="l00662"></a><span class="lineno">  662</span>&#160;                            )</div><div class="line"><a name="l00663"></a><span class="lineno">  663</span>&#160;      : iterator_({ref.<a class="code" href="classcutlass_1_1TensorRef.html#ac7db3ca62ab1dfe0d3ea08bcadbc9352">data</a>(), ref.<a class="code" href="classcutlass_1_1TensorRef.html#a191e88bc0fb310be655d700e937ab97c">stride</a>()}, thread_id) {}</div><div class="line"><a name="l00664"></a><span class="lineno">  664</span>&#160;</div><div class="line"><a name="l00666"></a><span class="lineno">  666</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00667"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a09ed75da16791ee6c46888aa56d2c332">  667</a></span>&#160;  <span class="keywordtype">void</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a09ed75da16791ee6c46888aa56d2c332">set_iteration_index</a>(<span class="keywordtype">int</span> index) { iterator_.set_iteration_index(index); }</div><div class="line"><a name="l00668"></a><span class="lineno">  668</span>&#160;</div><div class="line"><a name="l00670"></a><span class="lineno">  670</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00671"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a97f04453882bf322b9cd180f10416ea0">  671</a></span>&#160;  <span class="keywordtype">void</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a97f04453882bf322b9cd180f10416ea0">add_pointer_offset</a>(<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a17f3bf28de19feaafff96d2e0c558047">LongIndex</a> pointer_offset) {</div><div class="line"><a name="l00672"></a><span class="lineno">  672</span>&#160;    iterator_.add_pointer_offset(pointer_offset);</div><div class="line"><a name="l00673"></a><span class="lineno">  673</span>&#160;  }</div><div class="line"><a name="l00674"></a><span class="lineno">  674</span>&#160;</div><div class="line"><a name="l00676"></a><span class="lineno">  676</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00677"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#ae90040a003d5ea7a3521daaa098a233d">  677</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#af017aa6ea6f90f1693c0ae274402852e">AccessType</a> *<span class="keyword">get</span>() <span class="keyword">const</span> {</div><div class="line"><a name="l00678"></a><span class="lineno">  678</span>&#160;    <span class="keywordflow">return</span> <span class="keyword">reinterpret_cast&lt;</span><a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#af017aa6ea6f90f1693c0ae274402852e">AccessType</a> *<span class="keyword">&gt;</span>(iterator_.get());</div><div class="line"><a name="l00679"></a><span class="lineno">  679</span>&#160;  }</div><div class="line"><a name="l00680"></a><span class="lineno">  680</span>&#160;</div><div class="line"><a name="l00682"></a><span class="lineno">  682</span>&#160;  CUTLASS_DEVICE</div><div class="line"><a name="l00683"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a810cc4b0a557bdc422f4e25112712974">  683</a></span>&#160;  <span class="keywordtype">void</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a810cc4b0a557bdc422f4e25112712974">add_tile_offset</a>(<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#aa5637b83cdd83081e239e44ffe46c466">TensorCoord</a> <span class="keyword">const</span> &amp;coord) {</div><div class="line"><a name="l00684"></a><span class="lineno">  684</span>&#160;    iterator_.add_tile_offset({coord.row(), coord.column()});</div><div class="line"><a name="l00685"></a><span class="lineno">  685</span>&#160;  }</div><div class="line"><a name="l00686"></a><span class="lineno">  686</span>&#160;</div><div class="line"><a name="l00688"></a><span class="lineno">  688</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00689"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a98e43fc279be18523a6839bd309695ab">  689</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a> &amp;<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a98e43fc279be18523a6839bd309695ab">operator++</a>() {</div><div class="line"><a name="l00690"></a><span class="lineno">  690</span>&#160;    ++iterator_;</div><div class="line"><a name="l00691"></a><span class="lineno">  691</span>&#160;    <span class="keywordflow">return</span> *<span class="keyword">this</span>;</div><div class="line"><a name="l00692"></a><span class="lineno">  692</span>&#160;  }</div><div class="line"><a name="l00693"></a><span class="lineno">  693</span>&#160;</div><div class="line"><a name="l00695"></a><span class="lineno">  695</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00696"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#ab138c25c73db56b7e1cdc9e29ec7a5fd">  696</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#ab138c25c73db56b7e1cdc9e29ec7a5fd">operator++</a>(<span class="keywordtype">int</span>) {</div><div class="line"><a name="l00697"></a><span class="lineno">  697</span>&#160;    <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a> prev(*<span class="keyword">this</span>);</div><div class="line"><a name="l00698"></a><span class="lineno">  698</span>&#160;    ++iterator_;</div><div class="line"><a name="l00699"></a><span class="lineno">  699</span>&#160;</div><div class="line"><a name="l00700"></a><span class="lineno">  700</span>&#160;    <span class="keywordflow">return</span> prev;</div><div class="line"><a name="l00701"></a><span class="lineno">  701</span>&#160;  }</div><div class="line"><a name="l00702"></a><span class="lineno">  702</span>&#160;};</div><div class="line"><a name="l00703"></a><span class="lineno">  703</span>&#160;</div><div class="line"><a name="l00705"></a><span class="lineno">  705</span>&#160;</div><div class="line"><a name="l00713"></a><span class="lineno">  713</span>&#160;<span class="keyword">template</span> &lt;<span class="keyword">typename</span> Shape_, <span class="keyword">typename</span> Element_, <span class="keywordtype">int</span> AdvanceRank,</div><div class="line"><a name="l00714"></a><span class="lineno">  714</span>&#160;          <span class="keyword">typename</span> ThreadMap_, <span class="keywordtype">int</span> Alignment, <span class="keywordtype">int</span> Crosswise&gt;</div><div class="line"><a name="l00715"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html">  715</a></span>&#160;<span class="keyword">class </span><a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a>&lt;Shape_, Element_,</div><div class="line"><a name="l00716"></a><span class="lineno">  716</span>&#160;                                layout::RowMajorTensorOpMultiplicandCrosswise&lt;</div><div class="line"><a name="l00717"></a><span class="lineno">  717</span>&#160;                                    sizeof_bits&lt;Element_&gt;::value, Crosswise&gt;,</div><div class="line"><a name="l00718"></a><span class="lineno">  718</span>&#160;                                AdvanceRank, ThreadMap_, Alignment&gt; {</div><div class="line"><a name="l00719"></a><span class="lineno">  719</span>&#160; <span class="keyword">public</span>:</div><div class="line"><a name="l00720"></a><span class="lineno">  720</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(</div><div class="line"><a name="l00721"></a><span class="lineno">  721</span>&#160;      AdvanceRank == 0 || AdvanceRank == 1,</div><div class="line"><a name="l00722"></a><span class="lineno">  722</span>&#160;      <span class="stringliteral">&quot;Specialization for row-major iterator may along advance along the &quot;</span></div><div class="line"><a name="l00723"></a><span class="lineno">  723</span>&#160;      <span class="stringliteral">&quot;columns(rank=0) or rows(rank=1) dimension.&quot;</span>);</div><div class="line"><a name="l00724"></a><span class="lineno">  724</span>&#160;</div><div class="line"><a name="l00725"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a816c49faa54b8702401b303f65950535">  725</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a816c49faa54b8702401b303f65950535">Shape</a> = Shape_;</div><div class="line"><a name="l00726"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#adb6eead84237597c7146f92825a370bd">  726</a></span>&#160;  <span class="keyword">using</span> Element = Element_;</div><div class="line"><a name="l00727"></a><span class="lineno">  727</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCrosswise.html">Layout</a> = <a class="code" href="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCrosswise.html">layout::RowMajorTensorOpMultiplicandCrosswise</a>&lt;</div><div class="line"><a name="l00728"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a0b3842ebd2d0ded853ed99d800e37f6d">  728</a></span>&#160;      <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;Element_&gt;::value</a>, Crosswise&gt;;</div><div class="line"><a name="l00729"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#abdb2a9eac279d6042387de59a2dd92d0">  729</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kAdvanceRank = AdvanceRank;</div><div class="line"><a name="l00730"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#ac83cf1ee4e2149c2553098b571f3a17c">  730</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kAlignment = Alignment;</div><div class="line"><a name="l00731"></a><span class="lineno">  731</span>&#160;</div><div class="line"><a name="l00732"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#ad619429f4f3710665d47a39bd4fbb78c">  732</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#ad619429f4f3710665d47a39bd4fbb78c">Index</a> = <span class="keyword">typename</span> <a class="code" href="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCrosswise.html#afb16d769e699fe88e09420cce6096d86">Layout::Index</a>;</div><div class="line"><a name="l00733"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a1a58d2ccf23ef435ec977aadb67ac7f7">  733</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a1a58d2ccf23ef435ec977aadb67ac7f7">LongIndex</a> = <span class="keyword">typename</span> <a class="code" href="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCrosswise.html#a85b214a913b534fc9cc5366664a414e3">Layout::LongIndex</a>;</div><div class="line"><a name="l00734"></a><span class="lineno">  734</span>&#160;</div><div class="line"><a name="l00735"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a2bf364219c3837f8954ff6d49c68d9e9">  735</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1TensorRef.html">TensorRef</a> = <a class="code" href="classcutlass_1_1TensorRef.html">TensorRef&lt;Element, Layout&gt;</a>;</div><div class="line"><a name="l00736"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#ab6a4152d54eab0b48a90bfafb2d84289">  736</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#ab6a4152d54eab0b48a90bfafb2d84289">TensorCoord</a> = <span class="keyword">typename</span> <a class="code" href="structcutlass_1_1MatrixCoord.html">Layout::TensorCoord</a>;</div><div class="line"><a name="l00737"></a><span class="lineno">  737</span>&#160;</div><div class="line"><a name="l00738"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a4ea7a9d82dfdae06b7fe408c65e5019b">  738</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a4ea7a9d82dfdae06b7fe408c65e5019b">ThreadMap</a> = ThreadMap_;</div><div class="line"><a name="l00739"></a><span class="lineno">  739</span>&#160;</div><div class="line"><a name="l00741"></a><span class="lineno">  741</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">UnderlyingIterator</a> = <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a>&lt;</div><div class="line"><a name="l00742"></a><span class="lineno">  742</span>&#160;      layout::PitchLinearShape&lt;Shape::kColumn, Shape::kRow&gt;, Element,</div><div class="line"><a name="l00743"></a><span class="lineno">  743</span>&#160;      <a class="code" href="structcutlass_1_1layout_1_1TensorOpMultiplicandCrosswise.html">layout::TensorOpMultiplicandCrosswise&lt;sizeof_bits&lt;Element_&gt;::value</a>,</div><div class="line"><a name="l00744"></a><span class="lineno">  744</span>&#160;                                            Crosswise&gt;,</div><div class="line"><a name="l00745"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#addfbe1ed22f504cde6d8332fdbbd9569">  745</a></span>&#160;      (kAdvanceRank == 0 ? 1 : 0), ThreadMap_&gt;;</div><div class="line"><a name="l00746"></a><span class="lineno">  746</span>&#160;</div><div class="line"><a name="l00747"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#ab861ef4575cb2ebbfb8278da72e26318">  747</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#ab861ef4575cb2ebbfb8278da72e26318">AccessType</a> = <span class="keyword">typename</span> UnderlyingIterator::AccessType;</div><div class="line"><a name="l00748"></a><span class="lineno">  748</span>&#160;</div><div class="line"><a name="l00749"></a><span class="lineno">  749</span>&#160; <span class="keyword">private</span>:</div><div class="line"><a name="l00751"></a><span class="lineno">  751</span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">UnderlyingIterator</a> iterator_;</div><div class="line"><a name="l00752"></a><span class="lineno">  752</span>&#160;</div><div class="line"><a name="l00753"></a><span class="lineno">  753</span>&#160; <span class="keyword">public</span>:</div><div class="line"><a name="l00755"></a><span class="lineno">  755</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00756"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a025187783fb6d708885d31af2492bca4">  756</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a025187783fb6d708885d31af2492bca4">RegularTileAccessIterator</a>(<a class="code" href="classcutlass_1_1TensorRef.html">TensorRef</a> ref,  </div><div class="line"><a name="l00757"></a><span class="lineno">  757</span>&#160;                            <span class="keywordtype">int</span> thread_id   </div><div class="line"><a name="l00758"></a><span class="lineno">  758</span>&#160;                            )</div><div class="line"><a name="l00759"></a><span class="lineno">  759</span>&#160;      : iterator_({ref.<a class="code" href="classcutlass_1_1TensorRef.html#ac7db3ca62ab1dfe0d3ea08bcadbc9352">data</a>(), ref.<a class="code" href="classcutlass_1_1TensorRef.html#a191e88bc0fb310be655d700e937ab97c">stride</a>()}, thread_id) {}</div><div class="line"><a name="l00760"></a><span class="lineno">  760</span>&#160;</div><div class="line"><a name="l00762"></a><span class="lineno">  762</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00763"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#ac1e0fe84270ef846336f9ca6969a35e5">  763</a></span>&#160;  <span class="keywordtype">void</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#ac1e0fe84270ef846336f9ca6969a35e5">set_iteration_index</a>(<span class="keywordtype">int</span> index) { iterator_.set_iteration_index(index); }</div><div class="line"><a name="l00764"></a><span class="lineno">  764</span>&#160;</div><div class="line"><a name="l00766"></a><span class="lineno">  766</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00767"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a13adaf4c752cb4e0fc5aaf29b2261348">  767</a></span>&#160;  <span class="keywordtype">void</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a13adaf4c752cb4e0fc5aaf29b2261348">add_pointer_offset</a>(<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a1a58d2ccf23ef435ec977aadb67ac7f7">LongIndex</a> pointer_offset) {</div><div class="line"><a name="l00768"></a><span class="lineno">  768</span>&#160;    iterator_.add_pointer_offset(pointer_offset);</div><div class="line"><a name="l00769"></a><span class="lineno">  769</span>&#160;  }</div><div class="line"><a name="l00770"></a><span class="lineno">  770</span>&#160;</div><div class="line"><a name="l00772"></a><span class="lineno">  772</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00773"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a71daea97d35fc66a496240371952f872">  773</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#ab861ef4575cb2ebbfb8278da72e26318">AccessType</a> *<span class="keyword">get</span>() <span class="keyword">const</span> {</div><div class="line"><a name="l00774"></a><span class="lineno">  774</span>&#160;    <span class="keywordflow">return</span> <span class="keyword">reinterpret_cast&lt;</span><a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#ab861ef4575cb2ebbfb8278da72e26318">AccessType</a> *<span class="keyword">&gt;</span>(iterator_.get());</div><div class="line"><a name="l00775"></a><span class="lineno">  775</span>&#160;  }</div><div class="line"><a name="l00776"></a><span class="lineno">  776</span>&#160;</div><div class="line"><a name="l00778"></a><span class="lineno">  778</span>&#160;  CUTLASS_DEVICE</div><div class="line"><a name="l00779"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#ac2ffc1bcd610ebc066f8b608de5a1c5a">  779</a></span>&#160;  <span class="keywordtype">void</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#ac2ffc1bcd610ebc066f8b608de5a1c5a">add_tile_offset</a>(<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#ab6a4152d54eab0b48a90bfafb2d84289">TensorCoord</a> <span class="keyword">const</span> &amp;coord) {</div><div class="line"><a name="l00780"></a><span class="lineno">  780</span>&#160;    iterator_.add_tile_offset({coord.column(), coord.row()});</div><div class="line"><a name="l00781"></a><span class="lineno">  781</span>&#160;  }</div><div class="line"><a name="l00782"></a><span class="lineno">  782</span>&#160;</div><div class="line"><a name="l00784"></a><span class="lineno">  784</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00785"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a76f3aed087b22e12afaa00fbbba21462">  785</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a> &amp;<a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a76f3aed087b22e12afaa00fbbba21462">operator++</a>() {</div><div class="line"><a name="l00786"></a><span class="lineno">  786</span>&#160;    ++iterator_;</div><div class="line"><a name="l00787"></a><span class="lineno">  787</span>&#160;    <span class="keywordflow">return</span> *<span class="keyword">this</span>;</div><div class="line"><a name="l00788"></a><span class="lineno">  788</span>&#160;  }</div><div class="line"><a name="l00789"></a><span class="lineno">  789</span>&#160;</div><div class="line"><a name="l00791"></a><span class="lineno">  791</span>&#160;  <a class="code" href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="line"><a name="l00792"></a><span class="lineno"><a class="line" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a2de4681091764ba0aee6e09048ad8fb9">  792</a></span>&#160;  <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a2de4681091764ba0aee6e09048ad8fb9">operator++</a>(<span class="keywordtype">int</span>) {</div><div class="line"><a name="l00793"></a><span class="lineno">  793</span>&#160;    <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">RegularTileAccessIterator</a> prev(*<span class="keyword">this</span>);</div><div class="line"><a name="l00794"></a><span class="lineno">  794</span>&#160;    ++iterator_;</div><div class="line"><a name="l00795"></a><span class="lineno">  795</span>&#160;</div><div class="line"><a name="l00796"></a><span class="lineno">  796</span>&#160;    <span class="keywordflow">return</span> prev;</div><div class="line"><a name="l00797"></a><span class="lineno">  797</span>&#160;  }</div><div class="line"><a name="l00798"></a><span class="lineno">  798</span>&#160;};</div><div class="line"><a name="l00799"></a><span class="lineno">  799</span>&#160;</div><div class="line"><a name="l00801"></a><span class="lineno">  801</span>&#160;}  <span class="comment">// namespace threadblock</span></div><div class="line"><a name="l00802"></a><span class="lineno">  802</span>&#160;}  <span class="comment">// namespace transform</span></div><div class="line"><a name="l00803"></a><span class="lineno">  803</span>&#160;}  <span class="comment">// namespace cutlass</span></div><div class="line"><a name="l00804"></a><span class="lineno">  804</span>&#160;</div><div class="ttc" id="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCongruous_html_a37fd29e6b74010e9a3ae089d6a777724"><div class="ttname"><a href="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCongruous.html#a37fd29e6b74010e9a3ae089d6a777724">cutlass::layout::ColumnMajorTensorOpMultiplicandCongruous::LongIndex</a></div><div class="ttdeci">int64_t LongIndex</div><div class="ttdoc">Long index type used for offsets. </div><div class="ttdef"><b>Definition:</b> tensor_op_multiplicand_sm75.h:434</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0_html_a810cc4b0a557bdc422f4e25112712974"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a810cc4b0a557bdc422f4e25112712974">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::add_tile_offset</a></div><div class="ttdeci">CUTLASS_DEVICE void add_tile_offset(TensorCoord const &amp;coord)</div><div class="ttdoc">Adds a tile offset. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:683</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe_html_a0f1e846cd4287c51e2d6135a8472c1a8"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a0f1e846cd4287c51e2d6135a8472c1a8">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::RegularTileAccessIterator</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE RegularTileAccessIterator(TensorRef ref, int thread_id)</div><div class="ttdoc">Construct a TileIterator with zero threadblock offset. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:508</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0_html_aa5637b83cdd83081e239e44ffe46c466"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#aa5637b83cdd83081e239e44ffe46c466">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::TensorCoord</a></div><div class="ttdeci">typename Layout::TensorCoord TensorCoord</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:640</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985_html_a633db64682aa6494c2553e11614b5e1d"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a633db64682aa6494c2553e11614b5e1d">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::RegularTileAccessIterator</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE RegularTileAccessIterator(TensorRef ref, int thread_id)</div><div class="ttdoc">Construct a TileIterator with zero threadblock offset. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:275</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72_html_a33a042734128cc06fa72b47420b19c36"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a33a042734128cc06fa72b47420b19c36">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::add_tile_offset</a></div><div class="ttdeci">CUTLASS_DEVICE void add_tile_offset(TensorCoord const &amp;coord)</div><div class="ttdoc">Adds a tile offset. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:395</div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1TensorOpMultiplicandCrosswise_html_a4e8aa7fa89ae4ebd8afe284a9786df27"><div class="ttname"><a href="structcutlass_1_1layout_1_1TensorOpMultiplicandCrosswise.html#a4e8aa7fa89ae4ebd8afe284a9786df27">cutlass::layout::TensorOpMultiplicandCrosswise::Index</a></div><div class="ttdeci">int32_t Index</div><div class="ttdoc">Index type used for coordinates. </div><div class="ttdef"><b>Definition:</b> tensor_op_multiplicand_sm75.h:640</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985_html_a4ba4f46f5286af5b7b647944cf3de8ad"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a4ba4f46f5286af5b7b647944cf3de8ad">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::Index</a></div><div class="ttdeci">typename Layout::Index Index</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:251</div></div>
<div class="ttc" id="namespacecutlass_html"><div class="ttname"><a href="namespacecutlass.html">cutlass</a></div><div class="ttdef"><b>Definition:</b> aligned_buffer.h:35</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe_html_a4ecee87aa180496eff8cb783602322f3"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a4ecee87aa180496eff8cb783602322f3">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::set_iteration_index</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE void set_iteration_index(int index)</div><div class="ttdoc">Overrides the internal iteration index. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:538</div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1PitchLinearCoord_html"><div class="ttname"><a href="structcutlass_1_1layout_1_1PitchLinearCoord.html">cutlass::layout::PitchLinearCoord</a></div><div class="ttdoc">Coordinate in pitch-linear space. </div><div class="ttdef"><b>Definition:</b> pitch_linear.h:52</div></div>
<div class="ttc" id="tensor__ref_8h_html"><div class="ttname"><a href="tensor__ref_8h.html">tensor_ref.h</a></div><div class="ttdoc">Defines a structure containing strides, bounds, and a pointer to tensor data. </div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe_html_a6007be94e0b9bc75d315e5ef95fa2420"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a6007be94e0b9bc75d315e5ef95fa2420">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::operator++</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE RegularTileAccessIterator &amp; operator++()</div><div class="ttdoc">Advances to the next tile in memory. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:566</div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCongruous_html_aa455da7f56592fdb70977b1cad108003"><div class="ttname"><a href="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCongruous.html#aa455da7f56592fdb70977b1cad108003">cutlass::layout::ColumnMajorTensorOpMultiplicandCongruous::Index</a></div><div class="ttdeci">int32_t Index</div><div class="ttdoc">Index type used for coordinates. </div><div class="ttdef"><b>Definition:</b> tensor_op_multiplicand_sm75.h:431</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876_html_a816c49faa54b8702401b303f65950535"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a816c49faa54b8702401b303f65950535">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::Shape</a></div><div class="ttdeci">Shape_ Shape</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:725</div></div>
<div class="ttc" id="tensor__op__multiplicand__sm75_8h_html"><div class="ttname"><a href="tensor__op__multiplicand__sm75_8h.html">tensor_op_multiplicand_sm75.h</a></div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCongruous_html_a32c8623b9c3c8490263ea0af24a1410f"><div class="ttname"><a href="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCongruous.html#a32c8623b9c3c8490263ea0af24a1410f">cutlass::layout::RowMajorTensorOpMultiplicandCongruous::Index</a></div><div class="ttdeci">int32_t Index</div><div class="ttdoc">Index type used for coordinates. </div><div class="ttdef"><b>Definition:</b> tensor_op_multiplicand_sm75.h:536</div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCrosswise_html"><div class="ttname"><a href="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCrosswise.html">cutlass::layout::ColumnMajorTensorOpMultiplicandCrosswise</a></div><div class="ttdef"><b>Definition:</b> tensor_op_multiplicand_sm75.h:734</div></div>
<div class="ttc" id="classcutlass_1_1TensorRef_html_ac7db3ca62ab1dfe0d3ea08bcadbc9352"><div class="ttname"><a href="classcutlass_1_1TensorRef.html#ac7db3ca62ab1dfe0d3ea08bcadbc9352">cutlass::TensorRef::data</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE Element * data() const </div><div class="ttdoc">Returns the pointer to referenced data. </div><div class="ttdef"><b>Definition:</b> tensor_ref.h:254</div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCongruous_html_ad49467d9028288b0bb93dbf376ef573a"><div class="ttname"><a href="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCongruous.html#ad49467d9028288b0bb93dbf376ef573a">cutlass::layout::RowMajorTensorOpMultiplicandCongruous::LongIndex</a></div><div class="ttdeci">int64_t LongIndex</div><div class="ttdoc">Long index type used for offsets. </div><div class="ttdef"><b>Definition:</b> tensor_op_multiplicand_sm75.h:539</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0_html_ab234a568898813621a9e3ff9436d5042"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#ab234a568898813621a9e3ff9436d5042">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::Shape</a></div><div class="ttdeci">Shape_ Shape</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:629</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72_html_abf23348f7e8d3b8aaac6f23c116dcf5c"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#abf23348f7e8d3b8aaac6f23c116dcf5c">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::RegularTileAccessIterator</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE RegularTileAccessIterator(TensorRef ref, int thread_id)</div><div class="ttdoc">Construct a TileIterator with zero threadblock offset. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:372</div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1TensorOpMultiplicandCongruous_html_ab498476001a090017735113863e28898"><div class="ttname"><a href="structcutlass_1_1layout_1_1TensorOpMultiplicandCongruous.html#ab498476001a090017735113863e28898">cutlass::layout::TensorOpMultiplicandCongruous::Index</a></div><div class="ttdeci">int32_t Index</div><div class="ttdoc">Index type used for coordinates. </div><div class="ttdef"><b>Definition:</b> tensor_op_multiplicand_sm75.h:221</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f_html_ae4927c7f718b52aa80f603d9911b9639"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#ae4927c7f718b52aa80f603d9911b9639">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::RegularTileAccessIterator</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE RegularTileAccessIterator(TensorRef ref, int thread_id)</div><div class="ttdoc">Construct a TileIterator with zero threadblock offset. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:127</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72_html_a1c4dbad00b218fa641b615a19d611d9a"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a1c4dbad00b218fa641b615a19d611d9a">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::Shape</a></div><div class="ttdeci">Shape_ Shape</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:341</div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCongruous_html"><div class="ttname"><a href="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCongruous.html">cutlass::layout::ColumnMajorTensorOpMultiplicandCongruous</a></div><div class="ttdef"><b>Definition:</b> tensor_op_multiplicand_sm75.h:422</div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCrosswise_html_afb16d769e699fe88e09420cce6096d86"><div class="ttname"><a href="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCrosswise.html#afb16d769e699fe88e09420cce6096d86">cutlass::layout::RowMajorTensorOpMultiplicandCrosswise::Index</a></div><div class="ttdeci">int32_t Index</div><div class="ttdoc">Index type used for coordinates. </div><div class="ttdef"><b>Definition:</b> tensor_op_multiplicand_sm75.h:843</div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCrosswise_html_af9367fe9d6c5d95367d84dbab02dd0fe"><div class="ttname"><a href="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCrosswise.html#af9367fe9d6c5d95367d84dbab02dd0fe">cutlass::layout::ColumnMajorTensorOpMultiplicandCrosswise::Index</a></div><div class="ttdeci">int32_t Index</div><div class="ttdoc">Index type used for coordinates. </div><div class="ttdef"><b>Definition:</b> tensor_op_multiplicand_sm75.h:742</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0_html_a4b27e67450659f3e892f08c0def0fbbe"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a4b27e67450659f3e892f08c0def0fbbe">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::ThreadMap</a></div><div class="ttdeci">ThreadMap_ ThreadMap</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:642</div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCrosswise_html"><div class="ttname"><a href="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCrosswise.html">cutlass::layout::RowMajorTensorOpMultiplicandCrosswise</a></div><div class="ttdef"><b>Definition:</b> tensor_op_multiplicand_sm75.h:835</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72_html_ad3153ccc12d036260b80a0a6ab4081d5"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#ad3153ccc12d036260b80a0a6ab4081d5">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::operator++</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE RegularTileAccessIterator &amp; operator++()</div><div class="ttdoc">Advances to the next tile in memory. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:401</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f_html_a636e7123ac8169f41d47e071e460fb81"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a636e7123ac8169f41d47e071e460fb81">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::Index</a></div><div class="ttdeci">typename Layout::Index Index</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:77</div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1TensorOpMultiplicandCongruous_html"><div class="ttname"><a href="structcutlass_1_1layout_1_1TensorOpMultiplicandCongruous.html">cutlass::layout::TensorOpMultiplicandCongruous</a></div><div class="ttdef"><b>Definition:</b> tensor_op_multiplicand_sm75.h:213</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985_html_a827059393710930e72337cb7c62b6ef2"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a827059393710930e72337cb7c62b6ef2">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::add_tile_offset</a></div><div class="ttdeci">CUTLASS_DEVICE void add_tile_offset(TensorCoord const &amp;coord)</div><div class="ttdoc">Adds a tile offset. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:298</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe_html_a352c7685cb9a37ba214609fe9ccb12e2"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a352c7685cb9a37ba214609fe9ccb12e2">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::operator++</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE RegularTileAccessIterator operator++(int)</div><div class="ttdoc">Advances to the next tile in memory. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:590</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f_html_a21ec4fc2d56d5cd3bf58426ae01f369c"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a21ec4fc2d56d5cd3bf58426ae01f369c">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::set_iteration_index</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE void set_iteration_index(int index)</div><div class="ttdoc">Overrides the internal iteration index. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:154</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe_html_acc8da22531c619ac3ef5e817fef2d52f"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#acc8da22531c619ac3ef5e817fef2d52f">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::ThreadMap</a></div><div class="ttdeci">ThreadMap_ ThreadMap</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:452</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe_html_a25e54d78f1b424ead16b5e64e6db63eb"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a25e54d78f1b424ead16b5e64e6db63eb">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::add_pointer_offset</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE void add_pointer_offset(LongIndex pointer_offset)</div><div class="ttdoc">Adds a pointer offset in units of Element. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:545</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876_html_a2de4681091764ba0aee6e09048ad8fb9"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a2de4681091764ba0aee6e09048ad8fb9">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::operator++</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE RegularTileAccessIterator operator++(int)</div><div class="ttdoc">Advances to the next tile in memory. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:792</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985_html_a8358531564ae671621b6bb34ab10663e"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a8358531564ae671621b6bb34ab10663e">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::set_iteration_index</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE void set_iteration_index(int index)</div><div class="ttdoc">Overrides the internal iteration index. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:282</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72_html_a6a7b6b794720ed928b8744c7cde34aff"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a6a7b6b794720ed928b8744c7cde34aff">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::ThreadMap</a></div><div class="ttdeci">ThreadMap_ ThreadMap</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:354</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f_html_a9d7b736eddaf28d6bd6216ba76396be1"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a9d7b736eddaf28d6bd6216ba76396be1">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::add_pointer_offset</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE void add_pointer_offset(LongIndex pointer_offset)</div><div class="ttdoc">Adds a pointer offset in units of Element. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:161</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876_html_ab861ef4575cb2ebbfb8278da72e26318"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#ab861ef4575cb2ebbfb8278da72e26318">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::AccessType</a></div><div class="ttdeci">typename UnderlyingIterator::AccessType AccessType</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:747</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe_html_aab0cd2dae6c59807b02b6ee5119d73a3"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#aab0cd2dae6c59807b02b6ee5119d73a3">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::Shape</a></div><div class="ttdeci">Shape_ Shape</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:437</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe_html_abc58f5f5ad3c41b62db504ef05bf7a93"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#abc58f5f5ad3c41b62db504ef05bf7a93">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::Index</a></div><div class="ttdeci">typename Layout::Index Index</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:446</div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1TensorOpMultiplicandCongruous_html_aa04ef0da8d8a859c2b7bb08cb3752d3d"><div class="ttname"><a href="structcutlass_1_1layout_1_1TensorOpMultiplicandCongruous.html#aa04ef0da8d8a859c2b7bb08cb3752d3d">cutlass::layout::TensorOpMultiplicandCongruous::LongIndex</a></div><div class="ttdeci">int64_t LongIndex</div><div class="ttdoc">Long index type used for offsets. </div><div class="ttdef"><b>Definition:</b> tensor_op_multiplicand_sm75.h:224</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0_html_a17f3bf28de19feaafff96d2e0c558047"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a17f3bf28de19feaafff96d2e0c558047">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::LongIndex</a></div><div class="ttdeci">typename Layout::LongIndex LongIndex</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:637</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72_html_ace8da2b9203dd41a4130fdbbdc84f556"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#ace8da2b9203dd41a4130fdbbdc84f556">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::operator++</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE RegularTileAccessIterator operator++(int)</div><div class="ttdoc">Advances to the next tile in memory. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:408</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f_html_a0e1c1e0c2565df3ade843682d8532435"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a0e1c1e0c2565df3ade843682d8532435">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::TensorCoord</a></div><div class="ttdeci">typename Layout::TensorCoord TensorCoord</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:81</div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1PitchLinearShape_html"><div class="ttname"><a href="structcutlass_1_1layout_1_1PitchLinearShape.html">cutlass::layout::PitchLinearShape</a></div><div class="ttdoc">Template defining a shape used by pitch-linear operators. </div><div class="ttdef"><b>Definition:</b> pitch_linear.h:43</div></div>
<div class="ttc" id="array_8h_html"><div class="ttname"><a href="array_8h.html">array.h</a></div><div class="ttdoc">Statically sized array of elements that accommodates all CUTLASS-supported numeric types and is safe ...</div></div>
<div class="ttc" id="cutlass_8h_html_a4b1c9f25ab6eaa25e1f2258dd63e6ce4"><div class="ttname"><a href="cutlass_8h.html#a4b1c9f25ab6eaa25e1f2258dd63e6ce4">CUTLASS_PRAGMA_UNROLL</a></div><div class="ttdeci">#define CUTLASS_PRAGMA_UNROLL</div><div class="ttdef"><b>Definition:</b> cutlass.h:110</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876_html_a13adaf4c752cb4e0fc5aaf29b2261348"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a13adaf4c752cb4e0fc5aaf29b2261348">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::add_pointer_offset</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE void add_pointer_offset(LongIndex pointer_offset)</div><div class="ttdoc">Adds a pointer offset in units of Element. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:767</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe_html_a55aff8c59952d96e4359005dac44db34"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a55aff8c59952d96e4359005dac44db34">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::TensorCoord</a></div><div class="ttdeci">typename Layout::TensorCoord TensorCoord</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:450</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72_html_ad9d32a6458380ec72a6e2315486d20fc"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#ad9d32a6458380ec72a6e2315486d20fc">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::TensorCoord</a></div><div class="ttdeci">typename Layout::TensorCoord TensorCoord</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:352</div></div>
<div class="ttc" id="namespacecutlass_html_a1c7a9e66ca7b5dc7413ea3b8f349530a"><div class="ttname"><a href="namespacecutlass.html#a1c7a9e66ca7b5dc7413ea3b8f349530a">cutlass::operator++</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE half_t &amp; operator++(half_t &amp;lhs)</div><div class="ttdef"><b>Definition:</b> half.h:694</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f_html_a4051bd65d1bf0b1b127bf46ad2044b83"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a4051bd65d1bf0b1b127bf46ad2044b83">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::LongIndex</a></div><div class="ttdeci">typename Layout::LongIndex LongIndex</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:78</div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCrosswise_html_a85b214a913b534fc9cc5366664a414e3"><div class="ttname"><a href="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCrosswise.html#a85b214a913b534fc9cc5366664a414e3">cutlass::layout::RowMajorTensorOpMultiplicandCrosswise::LongIndex</a></div><div class="ttdeci">int64_t LongIndex</div><div class="ttdoc">Long index type used for offsets. </div><div class="ttdef"><b>Definition:</b> tensor_op_multiplicand_sm75.h:846</div></div>
<div class="ttc" id="classcutlass_1_1TensorRef_html_a191e88bc0fb310be655d700e937ab97c"><div class="ttname"><a href="classcutlass_1_1TensorRef.html#a191e88bc0fb310be655d700e937ab97c">cutlass::TensorRef::stride</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE Stride stride() const </div><div class="ttdoc">Returns the layout object&amp;#39;s stride vector. </div><div class="ttdef"><b>Definition:</b> tensor_ref.h:277</div></div>
<div class="ttc" id="matrix__shape_8h_html"><div class="ttname"><a href="matrix__shape_8h.html">matrix_shape.h</a></div><div class="ttdoc">Defines a Shape template for matrix tiles. </div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCrosswise_html_a8e1f0b54a8c1b3f37df9ec0dd3548985"><div class="ttname"><a href="structcutlass_1_1layout_1_1ColumnMajorTensorOpMultiplicandCrosswise.html#a8e1f0b54a8c1b3f37df9ec0dd3548985">cutlass::layout::ColumnMajorTensorOpMultiplicandCrosswise::LongIndex</a></div><div class="ttdeci">int64_t LongIndex</div><div class="ttdoc">Long index type used for offsets. </div><div class="ttdef"><b>Definition:</b> tensor_op_multiplicand_sm75.h:745</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72_html_a5cc867dbd6b5a122e9951ff492f5238a"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a5cc867dbd6b5a122e9951ff492f5238a">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::Index</a></div><div class="ttdeci">typename Layout::Index Index</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:348</div></div>
<div class="ttc" id="structcutlass_1_1sizeof__bits_html"><div class="ttname"><a href="structcutlass_1_1sizeof__bits.html">cutlass::sizeof_bits</a></div><div class="ttdoc">Defines the size of an element in bits. </div><div class="ttdef"><b>Definition:</b> numeric_types.h:42</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985_html_a87a657d6b2aca3a6ca421312235d0335"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a87a657d6b2aca3a6ca421312235d0335">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::TensorCoord</a></div><div class="ttdeci">typename Layout::TensorCoord TensorCoord</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:255</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f_html_adeec884a4fce07b0fc82d5ba5dd03fe4"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#adeec884a4fce07b0fc82d5ba5dd03fe4">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::operator++</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE RegularTileAccessIterator operator++(int)</div><div class="ttdoc">Advances to the next tile in memory. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:206</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0_html_a98e43fc279be18523a6839bd309695ab"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a98e43fc279be18523a6839bd309695ab">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::operator++</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE RegularTileAccessIterator &amp; operator++()</div><div class="ttdoc">Advances to the next tile in memory. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:689</div></div>
<div class="ttc" id="classcutlass_1_1TensorRef_html"><div class="ttname"><a href="classcutlass_1_1TensorRef.html">cutlass::TensorRef&lt; Element, Layout &gt;</a></div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72_html_aa511f61915cdaccd0e39b7a6b8fb469b"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#aa511f61915cdaccd0e39b7a6b8fb469b">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::set_iteration_index</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE void set_iteration_index(int index)</div><div class="ttdoc">Overrides the internal iteration index. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:379</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0_html_a052f3d5d2f3f2f4578a3b59c8e88a676"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a052f3d5d2f3f2f4578a3b59c8e88a676">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::Index</a></div><div class="ttdeci">typename Layout::Index Index</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:636</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985_html_a18417476d7b76dd34e89b0af174a7bf0"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a18417476d7b76dd34e89b0af174a7bf0">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::Element</a></div><div class="ttdeci">Element_ Element</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:245</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f_html_a3d07f09c89750c04f1056ae2b2285296"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a3d07f09c89750c04f1056ae2b2285296">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::operator++</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE RegularTileAccessIterator &amp; operator++()</div><div class="ttdoc">Advances to the next tile in memory. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:182</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f_html_a6b2bd7c503e292cdcfa6c18c77cd7baa"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a6b2bd7c503e292cdcfa6c18c77cd7baa">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::Element</a></div><div class="ttdeci">Element_ Element</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:70</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876_html_ad619429f4f3710665d47a39bd4fbb78c"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#ad619429f4f3710665d47a39bd4fbb78c">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::Index</a></div><div class="ttdeci">typename Layout::Index Index</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:732</div></div>
<div class="ttc" id="cutlass_8h_html_a28c2443a142676d3d71effdae1a986b1"><div class="ttname"><a href="cutlass_8h.html#a28c2443a142676d3d71effdae1a986b1">CUTLASS_HOST_DEVICE</a></div><div class="ttdeci">#define CUTLASS_HOST_DEVICE</div><div class="ttdef"><b>Definition:</b> cutlass.h:89</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72_html_a81ddaa615b424060e6442d1328d02e55"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a81ddaa615b424060e6442d1328d02e55">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::LongIndex</a></div><div class="ttdeci">typename Layout::LongIndex LongIndex</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:349</div></div>
<div class="ttc" id="classcutlass_1_1TensorRef_html_a4166ac2a0754574ac21d5d57d74f34e5"><div class="ttname"><a href="classcutlass_1_1TensorRef.html#a4166ac2a0754574ac21d5d57d74f34e5">cutlass::TensorRef::offset</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE LongIndex offset(TensorCoord const &amp;coord) const </div><div class="ttdoc">Computes the offset of an index from the origin of the tensor. </div><div class="ttdef"><b>Definition:</b> tensor_ref.h:301</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f_html_ac50ad97c2081de5cdd9600f1721c9037"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#ac50ad97c2081de5cdd9600f1721c9037">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::AccessType</a></div><div class="ttdeci">Array&lt; Element, Layout::kElementsPerAccess &gt; AccessType</div><div class="ttdoc">Element type per access. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:102</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876_html_ac1e0fe84270ef846336f9ca6969a35e5"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#ac1e0fe84270ef846336f9ca6969a35e5">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::set_iteration_index</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE void set_iteration_index(int index)</div><div class="ttdoc">Overrides the internal iteration index. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:763</div></div>
<div class="ttc" id="platform_8h_html_adde4c9ea91b753491851361a4198c009"><div class="ttname"><a href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a></div><div class="ttdeci">#define static_assert(__e, __m)</div><div class="ttdef"><b>Definition:</b> platform.h:153</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876_html_a4ea7a9d82dfdae06b7fe408c65e5019b"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a4ea7a9d82dfdae06b7fe408c65e5019b">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::ThreadMap</a></div><div class="ttdeci">ThreadMap_ ThreadMap</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:738</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe_html_a2cd2b330fdbe50d7514cb051b96a8d85"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a2cd2b330fdbe50d7514cb051b96a8d85">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::add_tile_offset</a></div><div class="ttdeci">CUTLASS_DEVICE void add_tile_offset(TensorCoord const &amp;coord)</div><div class="ttdoc">Adds a tile offset. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:599</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0_html_a97f04453882bf322b9cd180f10416ea0"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a97f04453882bf322b9cd180f10416ea0">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::add_pointer_offset</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE void add_pointer_offset(LongIndex pointer_offset)</div><div class="ttdoc">Adds a pointer offset in units of Element. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:671</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985_html_a3c9014675466aec05102de18ef6eb40a"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a3c9014675466aec05102de18ef6eb40a">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::operator++</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE RegularTileAccessIterator &amp; operator++()</div><div class="ttdoc">Advances to the next tile in memory. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:304</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985_html_a3c99340187479be2fae462f4df982bed"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a3c99340187479be2fae462f4df982bed">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::Shape</a></div><div class="ttdeci">Shape_ Shape</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:244</div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1TensorOpMultiplicandCrosswise_html_a07de92ffadfe255537479c37b04cde6f"><div class="ttname"><a href="structcutlass_1_1layout_1_1TensorOpMultiplicandCrosswise.html#a07de92ffadfe255537479c37b04cde6f">cutlass::layout::TensorOpMultiplicandCrosswise::LongIndex</a></div><div class="ttdeci">int64_t LongIndex</div><div class="ttdoc">Long index type used for offsets. </div><div class="ttdef"><b>Definition:</b> tensor_op_multiplicand_sm75.h:643</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe_html_a5f26df7eaec00b0535fb5193d7ee9618"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#a5f26df7eaec00b0535fb5193d7ee9618">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::AccessType</a></div><div class="ttdeci">Array&lt; Element, Layout::kElementsPerAccess &gt; AccessType</div><div class="ttdoc">Element type per access. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:474</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0_html_ab138c25c73db56b7e1cdc9e29ec7a5fd"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#ab138c25c73db56b7e1cdc9e29ec7a5fd">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::operator++</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE RegularTileAccessIterator operator++(int)</div><div class="ttdoc">Advances to the next tile in memory. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:696</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72_html_a44c0e7a192429e2f051f47572a89446a"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a44c0e7a192429e2f051f47572a89446a">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::add_pointer_offset</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE void add_pointer_offset(LongIndex pointer_offset)</div><div class="ttdoc">Adds a pointer offset in units of Element. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:383</div></div>
<div class="ttc" id="regular__tile__access__iterator_8h_html"><div class="ttname"><a href="regular__tile__access__iterator_8h.html">regular_tile_access_iterator.h</a></div><div class="ttdoc">Templates implementing the address computation of storing of tiles from pitch-linear rank=2 tensors...</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0_html_acc48b323a8a9a8e75e0bfdb77c1cbcc5"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#acc48b323a8a9a8e75e0bfdb77c1cbcc5">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::RegularTileAccessIterator</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE RegularTileAccessIterator(TensorRef ref, int thread_id)</div><div class="ttdoc">Construct a TileIterator with zero threadblock offset. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:660</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0_html_af017aa6ea6f90f1693c0ae274402852e"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#af017aa6ea6f90f1693c0ae274402852e">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::AccessType</a></div><div class="ttdeci">typename UnderlyingIterator::AccessType AccessType</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:651</div></div>
<div class="ttc" id="matrix__coord_8h_html"><div class="ttname"><a href="matrix__coord_8h.html">matrix_coord.h</a></div><div class="ttdoc">Defines a canonical coordinate for rank=2 matrices offering named indices. </div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985_html_ab56d2b152243b8898b9f8a77af5b3508"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#ab56d2b152243b8898b9f8a77af5b3508">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::operator++</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE RegularTileAccessIterator operator++(int)</div><div class="ttdoc">Advances to the next tile in memory. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:311</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985_html_acd5af8cbd89b13ad8678be98d495a44b"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#acd5af8cbd89b13ad8678be98d495a44b">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::add_pointer_offset</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE void add_pointer_offset(LongIndex pointer_offset)</div><div class="ttdoc">Adds a pointer offset in units of Element. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:286</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_html"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator.html">cutlass::transform::threadblock::RegularTileAccessIterator</a></div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator.h:48</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72_html_a9e88ba17c1c659b84511c7dbdf9b665a"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__6baada077236f1a368c61c5e11b45b72.html#a9e88ba17c1c659b84511c7dbdf9b665a">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::AccessType</a></div><div class="ttdeci">typename UnderlyingIterator::AccessType AccessType</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:363</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985_html_a9c7b26f7077030e9ac16a7124f3a6450"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a9c7b26f7077030e9ac16a7124f3a6450">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::ThreadMap</a></div><div class="ttdeci">ThreadMap_ ThreadMap</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:257</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985_html_a1f1e0d9d6ec1ba0627b0ff95343c5706"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#a1f1e0d9d6ec1ba0627b0ff95343c5706">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::AccessType</a></div><div class="ttdeci">typename UnderlyingIterator::AccessType AccessType</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:266</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f_html_ad7506791dac3532d745c1d268e7c77f5"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#ad7506791dac3532d745c1d268e7c77f5">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::Shape</a></div><div class="ttdeci">Shape_ Shape</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:69</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0_html_a09ed75da16791ee6c46888aa56d2c332"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__a3c11cf1f00ef7a1efb8389ac6e4c6e0.html#a09ed75da16791ee6c46888aa56d2c332">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::set_iteration_index</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE void set_iteration_index(int index)</div><div class="ttdoc">Overrides the internal iteration index. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:667</div></div>
<div class="ttc" id="pitch__linear_8h_html"><div class="ttname"><a href="pitch__linear_8h.html">pitch_linear.h</a></div><div class="ttdoc">Defines layout functions used by TensorRef and derived classes for pitch-linear memory. </div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876_html_a76f3aed087b22e12afaa00fbbba21462"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a76f3aed087b22e12afaa00fbbba21462">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::operator++</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE RegularTileAccessIterator &amp; operator++()</div><div class="ttdoc">Advances to the next tile in memory. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:785</div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1TensorOpMultiplicandCrosswise_html"><div class="ttname"><a href="structcutlass_1_1layout_1_1TensorOpMultiplicandCrosswise.html">cutlass::layout::TensorOpMultiplicandCrosswise</a></div><div class="ttdef"><b>Definition:</b> tensor_op_multiplicand_sm75.h:632</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876_html_ab6a4152d54eab0b48a90bfafb2d84289"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#ab6a4152d54eab0b48a90bfafb2d84289">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::TensorCoord</a></div><div class="ttdeci">typename Layout::TensorCoord TensorCoord</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:736</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876_html_ac2ffc1bcd610ebc066f8b608de5a1c5a"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#ac2ffc1bcd610ebc066f8b608de5a1c5a">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::add_tile_offset</a></div><div class="ttdeci">CUTLASS_DEVICE void add_tile_offset(TensorCoord const &amp;coord)</div><div class="ttdoc">Adds a tile offset. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:779</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985_html_acee6b05cbcccab9deba3632b35d2f4e7"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__2c1476eaf582bfe972793e17babfe985.html#acee6b05cbcccab9deba3632b35d2f4e7">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::ColumnMajorTensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::LongIndex</a></div><div class="ttdeci">typename Layout::LongIndex LongIndex</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:252</div></div>
<div class="ttc" id="cutlass_8h_html"><div class="ttname"><a href="cutlass_8h.html">cutlass.h</a></div><div class="ttdoc">Basic include for CUTLASS. </div></div>
<div class="ttc" id="structcutlass_1_1MatrixCoord_html"><div class="ttname"><a href="structcutlass_1_1MatrixCoord.html">cutlass::MatrixCoord</a></div><div class="ttdef"><b>Definition:</b> matrix_coord.h:39</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876_html_a1a58d2ccf23ef435ec977aadb67ac7f7"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a1a58d2ccf23ef435ec977aadb67ac7f7">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::LongIndex</a></div><div class="ttdeci">typename Layout::LongIndex LongIndex</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:733</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe_html_af7654c26faa6bbef9898085f10bceb9f"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__e9a9e0f4286f652f55eb9b863b21effe.html#af7654c26faa6bbef9898085f10bceb9f">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::LongIndex</a></div><div class="ttdeci">typename Layout::LongIndex LongIndex</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:447</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876_html_a025187783fb6d708885d31af2492bca4"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__0184b7188941788a96624510a4b2f876.html#a025187783fb6d708885d31af2492bca4">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::RowMajorTensorOpMultiplicandCrosswise&lt; sizeof_bits&lt; Element_ &gt;::value, Crosswise &gt;, AdvanceRank, ThreadMap_, Alignment &gt;::RegularTileAccessIterator</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE RegularTileAccessIterator(TensorRef ref, int thread_id)</div><div class="ttdoc">Construct a TileIterator with zero threadblock offset. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:756</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f_html_a81cc510ffd092b4b002ef42892ffc0ec"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a81cc510ffd092b4b002ef42892ffc0ec">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::ThreadMap</a></div><div class="ttdeci">ThreadMap_ ThreadMap</div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:83</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f_html_a0b4a33ab3cabb4ffe3a47f5b0ee207d6"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileAccessIterator_3_01Shape___00_01Element__ebf4714349612673e8b6609b763eeb6f.html#a0b4a33ab3cabb4ffe3a47f5b0ee207d6">cutlass::transform::threadblock::RegularTileAccessIterator&lt; Shape_, Element_, layout::TensorOpMultiplicandCongruous&lt; sizeof_bits&lt; Element_ &gt;::value, int(128/sizeof(Element_))&gt;, AdvanceRank, ThreadMap_, Alignment &gt;::add_tile_offset</a></div><div class="ttdeci">CUTLASS_DEVICE void add_tile_offset(TensorCoord const &amp;coord)</div><div class="ttdoc">Adds a tile offset. </div><div class="ttdef"><b>Definition:</b> regular_tile_access_iterator_tensor_op.h:215</div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCongruous_html"><div class="ttname"><a href="structcutlass_1_1layout_1_1RowMajorTensorOpMultiplicandCongruous.html">cutlass::layout::RowMajorTensorOpMultiplicandCongruous</a></div><div class="ttdef"><b>Definition:</b> tensor_op_multiplicand_sm75.h:527</div></div>
</div><!-- fragment --></div><!-- contents -->
<!-- start footer part -->
<hr class="footer"/><address class="footer"><small>
Generated by &#160;<a href="http://www.doxygen.org/index.html">
<img class="footer" src="doxygen.png" alt="doxygen"/>
</a> 1.8.11
</small></address>
</body>
</html>
