<!DOCTYPE html>
<html class="writer-html5" lang="en" >
<head>
  <meta charset="utf-8" />
  <meta name="viewport" content="width=device-width, initial-scale=1.0" />
  <title>pygho.backend.Mamamm &mdash; PyGHO 0.0.1 documentation</title>
      <link rel="stylesheet" href="../../../_static/pygments.css" type="text/css" />
      <link rel="stylesheet" href="../../../_static/css/theme.css" type="text/css" />
  <!--[if lt IE 9]>
    <script src="../../../_static/js/html5shiv.min.js"></script>
  <![endif]-->
  
        <script src="../../../_static/jquery.js?v=5d32c60e"></script>
        <script src="../../../_static/_sphinx_javascript_frameworks_compat.js?v=2cd50e6c"></script>
        <script src="../../../_static/documentation_options.js?v=d45e8c67"></script>
        <script src="../../../_static/doctools.js?v=888ff710"></script>
        <script src="../../../_static/sphinx_highlight.js?v=dc90522c"></script>
    <script src="../../../_static/js/theme.js"></script>
    <link rel="index" title="Index" href="../../../genindex.html" />
    <link rel="search" title="Search" href="../../../search.html" /> 
</head>

<body class="wy-body-for-nav"> 
  <div class="wy-grid-for-nav">
    <nav data-toggle="wy-nav-shift" class="wy-nav-side">
      <div class="wy-side-scroll">
        <div class="wy-side-nav-search" >

          
          
          <a href="../../../index.html" class="icon icon-home">
            PyGHO
          </a>
<div role="search">
  <form id="rtd-search-form" class="wy-form" action="../../../search.html" method="get">
    <input type="text" name="q" placeholder="Search docs" aria-label="Search docs" />
    <input type="hidden" name="check_keywords" value="yes" />
    <input type="hidden" name="area" value="default" />
  </form>
</div>
        </div><div class="wy-menu wy-menu-vertical" data-spy="affix" role="navigation" aria-label="Navigation menu">
              <p class="caption" role="heading"><span class="caption-text">Notes</span></p>
<ul>
<li class="toctree-l1"><a class="reference internal" href="../../../notes/installation.html">Installation</a></li>
<li class="toctree-l1"><a class="reference internal" href="../../../notes/miniexample.html">Minimal Example</a></li>
<li class="toctree-l1"><a class="reference internal" href="../../../notes/datastructure.html">Refined Basic Data Structure</a></li>
<li class="toctree-l1"><a class="reference internal" href="../../../notes/hodata.html">Efficient High Order Data Processing</a></li>
<li class="toctree-l1"><a class="reference internal" href="../../../notes/operator.html">Operators</a></li>
</ul>
<p class="caption" role="heading"><span class="caption-text">Advanced Tutorial</span></p>
<ul>
<li class="toctree-l1"><a class="reference internal" href="../../../notes/multtensor.html">Multiple Tensor</a></li>
</ul>
<p class="caption" role="heading"><span class="caption-text">Package Reference</span></p>
<ul>
<li class="toctree-l1"><a class="reference internal" href="../../../modules/backend.html">pygho.backend package</a></li>
<li class="toctree-l1"><a class="reference internal" href="../../../modules/hodata.html">pygho.hodata package</a></li>
<li class="toctree-l1"><a class="reference internal" href="../../../modules/honn.html">pygho.honn package</a></li>
</ul>

        </div>
      </div>
    </nav>

    <section data-toggle="wy-nav-shift" class="wy-nav-content-wrap"><nav class="wy-nav-top" aria-label="Mobile navigation menu" >
          <i data-toggle="wy-nav-top" class="fa fa-bars"></i>
          <a href="../../../index.html">PyGHO</a>
      </nav>

      <div class="wy-nav-content">
        <div class="rst-content">
          <div role="navigation" aria-label="Page navigation">
  <ul class="wy-breadcrumbs">
      <li><a href="../../../index.html" class="icon icon-home" aria-label="Home"></a></li>
          <li class="breadcrumb-item"><a href="../../index.html">Module code</a></li>
      <li class="breadcrumb-item active">pygho.backend.Mamamm</li>
      <li class="wy-breadcrumbs-aside">
      </li>
  </ul>
  <hr/>
</div>
          <div role="main" class="document" itemscope="itemscope" itemtype="http://schema.org/Article">
           <div itemprop="articleBody">
             
  <h1>Source code for pygho.backend.Mamamm</h1><div class="highlight"><pre>
<span></span><span class="kn">from</span> <span class="nn">.MaTensor</span> <span class="kn">import</span> <span class="n">MaskedTensor</span>
<span class="kn">import</span> <span class="nn">torch</span>
<span class="kn">from</span> <span class="nn">torch</span> <span class="kn">import</span> <span class="n">BoolTensor</span><span class="p">,</span> <span class="n">Tensor</span>
<span class="kn">from</span> <span class="nn">typing</span> <span class="kn">import</span> <span class="n">Optional</span><span class="p">,</span> <span class="n">Tuple</span>


<div class="viewcode-block" id="batched_tensordot">
<a class="viewcode-back" href="../../../modules/backend.html#pygho.backend.Mamamm.batched_tensordot">[docs]</a>
<span class="k">def</span> <span class="nf">batched_tensordot</span><span class="p">(</span><span class="n">A</span><span class="p">:</span> <span class="n">Tensor</span><span class="p">,</span> <span class="n">catdim1</span><span class="p">:</span> <span class="nb">int</span><span class="p">,</span> <span class="n">dim1</span><span class="p">:</span> <span class="nb">int</span><span class="p">,</span> <span class="n">B</span><span class="p">:</span> <span class="n">Tensor</span><span class="p">,</span>
                      <span class="n">catdim2</span><span class="p">:</span> <span class="nb">int</span><span class="p">,</span> <span class="n">dim2</span><span class="p">:</span> <span class="nb">int</span><span class="p">)</span> <span class="o">-&gt;</span> <span class="n">Tensor</span><span class="p">:</span>
<span class="w">    </span><span class="sd">&quot;&quot;&quot;</span>
<span class="sd">    Perform a batched tensordot matrix operation.</span>

<span class="sd">    This function computes the tensordot product of two tensors `A` and `B`, where `A` and `B` are batched tensors with specified concatenation dimensions `catdim1` and `catdim2`, and contraction dimensions `dim1` and `dim2`.</span>

<span class="sd">    Args:</span>

<span class="sd">    - A (Tensor): The first batched tensor of shape (catshape1, broadcastshape).</span>
<span class="sd">    - catdim1 (int): The length of catshape1.</span>
<span class="sd">    - dim1 (int): The contraction dimension along `catdim1` of the first tensor.</span>
<span class="sd">    - B (Tensor): The second batched tensor of shape (catshape2, broadcastshape).</span>
<span class="sd">    - catdim2 (int): The length of catshape2.</span>
<span class="sd">    - dim2 (int): The contraction dimension along `catdim2` of the second tensor.</span>

<span class="sd">    Returns:</span>

<span class="sd">    - Tensor: The result of the batched tensordot operation of shape (\*catshape1\\dim1, \*catshape2\\dim2, \*broadcastshape), where broadcastshape is the trailing dense shape shared by `A` and `B`.</span>

<span class="sd">    Notes:</span>

<span class="sd">    - `catdim1` and `catdim2` specify the number of concatenation dimensions of `A` and `B`, respectively.</span>
<span class="sd">    - `dim1` and `dim2` specify the contraction dimensions along `catdim1` and `catdim2`, respectively.</span>
<span class="sd">    - The function uses optimized paths for specific cases (e.g., when `catdim1=2` and `catdim2=2`).</span>

<span class="sd">    &quot;&quot;&quot;</span>
    <span class="k">assert</span> <span class="n">dim1</span> <span class="o">&lt;</span> <span class="n">catdim1</span><span class="p">,</span> <span class="s2">&quot;contract the masked dim only&quot;</span>
    <span class="k">assert</span> <span class="n">dim2</span> <span class="o">&lt;</span> <span class="n">catdim2</span><span class="p">,</span> <span class="s2">&quot;contract the masked dim only&quot;</span>
    <span class="c1"># print(A.shape, catdim1, dim1, B.shape, catdim2, dim2)</span>
    <span class="n">ndim1</span> <span class="o">=</span> <span class="n">A</span><span class="o">.</span><span class="n">ndim</span>
    <span class="n">densedim1</span> <span class="o">=</span> <span class="n">ndim1</span> <span class="o">-</span> <span class="n">catdim1</span>
    <span class="n">ndim2</span> <span class="o">=</span> <span class="n">B</span><span class="o">.</span><span class="n">ndim</span>
    <span class="n">densedim2</span> <span class="o">=</span> <span class="n">ndim2</span> <span class="o">-</span> <span class="n">catdim2</span>
    <span class="k">assert</span> <span class="n">densedim1</span> <span class="o">==</span> <span class="n">densedim2</span><span class="p">,</span> <span class="s2">&quot;must of the same dense shape&quot;</span>

    <span class="k">if</span> <span class="n">catdim1</span> <span class="o">==</span> <span class="mi">2</span> <span class="ow">and</span> <span class="n">catdim2</span> <span class="o">==</span> <span class="mi">2</span><span class="p">:</span>
        <span class="k">if</span> <span class="n">dim1</span> <span class="o">==</span> <span class="mi">0</span><span class="p">:</span>
            <span class="n">A</span> <span class="o">=</span> <span class="n">A</span><span class="o">.</span><span class="n">transpose</span><span class="p">(</span><span class="mi">0</span><span class="p">,</span> <span class="mi">1</span><span class="p">)</span>
        <span class="k">if</span> <span class="n">dim2</span> <span class="o">==</span> <span class="mi">1</span><span class="p">:</span>
            <span class="n">B</span> <span class="o">=</span> <span class="n">B</span><span class="o">.</span><span class="n">transpose</span><span class="p">(</span><span class="mi">0</span><span class="p">,</span> <span class="mi">1</span><span class="p">)</span>
        <span class="n">A</span> <span class="o">=</span> <span class="n">torch</span><span class="o">.</span><span class="n">movedim</span><span class="p">(</span><span class="n">torch</span><span class="o">.</span><span class="n">movedim</span><span class="p">(</span><span class="n">A</span><span class="p">,</span> <span class="mi">0</span><span class="p">,</span> <span class="o">-</span><span class="mi">1</span><span class="p">),</span> <span class="mi">0</span><span class="p">,</span> <span class="o">-</span><span class="mi">1</span><span class="p">)</span>
        <span class="n">B</span> <span class="o">=</span> <span class="n">torch</span><span class="o">.</span><span class="n">movedim</span><span class="p">(</span><span class="n">torch</span><span class="o">.</span><span class="n">movedim</span><span class="p">(</span><span class="n">B</span><span class="p">,</span> <span class="mi">0</span><span class="p">,</span> <span class="o">-</span><span class="mi">1</span><span class="p">),</span> <span class="mi">0</span><span class="p">,</span> <span class="o">-</span><span class="mi">1</span><span class="p">)</span>
        <span class="n">C</span> <span class="o">=</span> <span class="n">A</span> <span class="o">@</span> <span class="n">B</span>
        <span class="n">C</span> <span class="o">=</span> <span class="n">torch</span><span class="o">.</span><span class="n">movedim</span><span class="p">(</span><span class="n">torch</span><span class="o">.</span><span class="n">movedim</span><span class="p">(</span><span class="n">C</span><span class="p">,</span> <span class="o">-</span><span class="mi">1</span><span class="p">,</span> <span class="mi">0</span><span class="p">),</span> <span class="o">-</span><span class="mi">1</span><span class="p">,</span> <span class="mi">0</span><span class="p">)</span>
        <span class="k">return</span> <span class="n">C</span>
    <span class="c1"># TODO more special case to apply bmm for acceleration?</span>
    <span class="k">else</span><span class="p">:</span>
        <span class="n">A</span> <span class="o">=</span> <span class="n">torch</span><span class="o">.</span><span class="n">movedim</span><span class="p">(</span><span class="n">A</span><span class="p">,</span> <span class="n">dim1</span><span class="p">,</span> <span class="o">-</span><span class="mi">1</span><span class="p">)</span>
        <span class="n">B</span> <span class="o">=</span> <span class="n">torch</span><span class="o">.</span><span class="n">movedim</span><span class="p">(</span><span class="n">B</span><span class="p">,</span> <span class="n">dim2</span><span class="p">,</span> <span class="o">-</span><span class="mi">1</span><span class="p">)</span>
        <span class="k">for</span> <span class="n">_</span> <span class="ow">in</span> <span class="nb">range</span><span class="p">(</span><span class="n">catdim2</span> <span class="o">-</span> <span class="mi">1</span><span class="p">):</span>
            <span class="n">A</span> <span class="o">=</span> <span class="n">A</span><span class="o">.</span><span class="n">unsqueeze</span><span class="p">(</span><span class="n">catdim1</span> <span class="o">-</span> <span class="mi">1</span><span class="p">)</span>
        <span class="k">for</span> <span class="n">_</span> <span class="ow">in</span> <span class="nb">range</span><span class="p">(</span><span class="n">catdim1</span> <span class="o">-</span> <span class="mi">1</span><span class="p">):</span>
            <span class="n">B</span> <span class="o">=</span> <span class="n">B</span><span class="o">.</span><span class="n">unsqueeze</span><span class="p">(</span><span class="mi">0</span><span class="p">)</span>

        <span class="n">C</span> <span class="o">=</span> <span class="n">torch</span><span class="o">.</span><span class="n">sum</span><span class="p">(</span><span class="n">torch</span><span class="o">.</span><span class="n">multiply</span><span class="p">(</span><span class="n">A</span><span class="p">,</span> <span class="n">B</span><span class="p">),</span> <span class="n">dim</span><span class="o">=-</span><span class="mi">1</span><span class="p">)</span>
        <span class="k">return</span> <span class="n">C</span></div>



<div class="viewcode-block" id="broadcast_denseshape">
<a class="viewcode-back" href="../../../modules/backend.html#pygho.backend.Mamamm.broadcast_denseshape">[docs]</a>
<span class="k">def</span> <span class="nf">broadcast_denseshape</span><span class="p">(</span><span class="n">A</span><span class="p">:</span> <span class="n">Tensor</span><span class="p">,</span> <span class="n">densedim1</span><span class="p">:</span> <span class="nb">int</span><span class="p">,</span> <span class="n">B</span><span class="p">:</span> <span class="n">Tensor</span><span class="p">,</span>
                         <span class="n">densedim2</span><span class="p">:</span> <span class="nb">int</span><span class="p">)</span> <span class="o">-&gt;</span> <span class="n">Tuple</span><span class="p">[</span><span class="n">Tensor</span><span class="p">,</span> <span class="n">Tensor</span><span class="p">]:</span>
<span class="w">    </span><span class="sd">&quot;&quot;&quot;</span>
<span class="sd">    Give `A` and `B` the same number of dense dimensions by inserting dimensions of size 1.</span>

<span class="sd">    Args:</span>

<span class="sd">    - A (Tensor): The first tensor.</span>
<span class="sd">    - densedim1 (int): The number of dense dimensions of the first tensor.</span>
<span class="sd">    - B (Tensor): The second tensor.</span>
<span class="sd">    - densedim2 (int): The number of dense dimensions of the second tensor.</span>

<span class="sd">    Returns:</span>

<span class="sd">    - Tuple[Tensor, Tensor]: The tensors `A` and `B`, where the one with fewer dense dimensions has been unsqueezed until both dense dimension counts match. The inputs are not modified in place.</span>

<span class="sd">    Notes:</span>

<span class="sd">    - Each size-1 dimension is inserted immediately before the existing dense dimensions (index `-densedim - 1`), so the existing dense dimensions stay right-aligned.</span>

<span class="sd">    &quot;&quot;&quot;</span>
    <span class="c1"># Tensor.unsqueeze is out-of-place: rebind the result, otherwise the call is a no-op.</span>
    <span class="k">while</span> <span class="n">densedim1</span> <span class="o">&lt;</span> <span class="n">densedim2</span><span class="p">:</span>
        <span class="n">A</span> <span class="o">=</span> <span class="n">A</span><span class="o">.</span><span class="n">unsqueeze</span><span class="p">(</span><span class="o">-</span><span class="n">densedim1</span> <span class="o">-</span> <span class="mi">1</span><span class="p">)</span>
        <span class="n">densedim1</span> <span class="o">+=</span> <span class="mi">1</span>
    <span class="k">while</span> <span class="n">densedim2</span> <span class="o">&lt;</span> <span class="n">densedim1</span><span class="p">:</span>
        <span class="n">B</span> <span class="o">=</span> <span class="n">B</span><span class="o">.</span><span class="n">unsqueeze</span><span class="p">(</span><span class="o">-</span><span class="n">densedim2</span> <span class="o">-</span> <span class="mi">1</span><span class="p">)</span>
        <span class="n">densedim2</span> <span class="o">+=</span> <span class="mi">1</span>
    <span class="k">return</span> <span class="n">A</span><span class="p">,</span> <span class="n">B</span></div>



<div class="viewcode-block" id="mamamm">
<a class="viewcode-back" href="../../../modules/backend.html#pygho.backend.Mamamm.mamamm">[docs]</a>
<span class="k">def</span> <span class="nf">mamamm</span><span class="p">(</span><span class="n">A</span><span class="p">:</span> <span class="n">MaskedTensor</span><span class="p">,</span>
           <span class="n">dim1</span><span class="p">:</span> <span class="nb">int</span><span class="p">,</span>
           <span class="n">B</span><span class="p">:</span> <span class="n">MaskedTensor</span><span class="p">,</span>
           <span class="n">dim2</span><span class="p">:</span> <span class="nb">int</span><span class="p">,</span>
           <span class="n">mask</span><span class="p">:</span> <span class="n">BoolTensor</span><span class="p">,</span>
           <span class="n">broadcast_firstdim</span><span class="p">:</span> <span class="nb">bool</span> <span class="o">=</span> <span class="kc">True</span><span class="p">)</span> <span class="o">-&gt;</span> <span class="n">MaskedTensor</span><span class="p">:</span>
<span class="w">    </span><span class="sd">&quot;&quot;&quot;</span>
<span class="sd">    Batched masked matrix multiplication of two MaskedTensors.</span>

<span class="sd">    This function performs batched matrix multiplication between two MaskedTensors `A` and `B`, where the masked dimensions `dim1` and `dim2` are contracted. The result is a new MaskedTensor with the specified mask.</span>

<span class="sd">    Args:</span>

<span class="sd">    - A (MaskedTensor): The first MaskedTensor with shape (B,\* maskedshape1,\*denseshape).</span>
<span class="sd">    - dim1 (int): The masked dimension to contract in the first tensor `A`.</span>
<span class="sd">    - B (MaskedTensor): The second MaskedTensor with shape (B,\* maskedshape2,\*denseshape).</span>
<span class="sd">    - dim2 (int): The masked dimension to contract in the second tensor `B`.</span>
<span class="sd">    - mask (BoolTensor): The mask to apply to the resulting MaskedTensor.</span>
<span class="sd">    - broadcast_firstdim (bool, optional): If True, dimension 0 of `A` and `B` is treated as a shared batch dimension that is kept rather than contracted, so `dim1` and `dim2` must both be greater than 0. Default is True.</span>

<span class="sd">    Returns:</span>

<span class="sd">    - MaskedTensor: A new MaskedTensor with shape (B,\* maskedshape1\dim1,\* maskedshape2\dim2,\*denseshape) and the specified mask.</span>

<span class="sd">    Notes:</span>

<span class="sd">    - This function performs batched matrix multiplication between two MaskedTensors, contracting the specified masked dimensions.</span>
<span class="sd">    - The dense dimensions of `A` and `B` are aligned with `broadcast_denseshape` before the contraction.</span>
<span class="sd">    &quot;&quot;&quot;</span>
    <span class="c1"># Fill masked entries with 0 (presumably so they drop out of the contraction sum).</span>
    <span class="n">tA</span> <span class="o">=</span> <span class="n">A</span><span class="o">.</span><span class="n">fill_masked</span><span class="p">(</span><span class="mi">0</span><span class="p">)</span>
    <span class="n">tB</span> <span class="o">=</span> <span class="n">B</span><span class="o">.</span><span class="n">fill_masked</span><span class="p">(</span><span class="mi">0</span><span class="p">)</span>
    <span class="n">densedim1</span> <span class="o">=</span> <span class="n">A</span><span class="o">.</span><span class="n">dense_dim</span>
    <span class="n">densedim2</span> <span class="o">=</span> <span class="n">B</span><span class="o">.</span><span class="n">dense_dim</span>

    <span class="n">tA</span><span class="p">,</span> <span class="n">tB</span> <span class="o">=</span> <span class="n">broadcast_denseshape</span><span class="p">(</span><span class="n">tA</span><span class="p">,</span> <span class="n">densedim1</span><span class="p">,</span> <span class="n">tB</span><span class="p">,</span> <span class="n">densedim2</span><span class="p">)</span>

    <span class="n">densedim</span> <span class="o">=</span> <span class="nb">max</span><span class="p">(</span><span class="n">densedim1</span><span class="p">,</span> <span class="n">densedim2</span><span class="p">)</span>

    <span class="c1"># Guard on the flag, not on the (always truthy) broadcast_denseshape function object.</span>
    <span class="k">if</span> <span class="n">broadcast_firstdim</span><span class="p">:</span>
        <span class="k">assert</span> <span class="n">dim1</span> <span class="o">&gt;</span> <span class="mi">0</span><span class="p">,</span> <span class="s2">&quot;0 dim of A is batch, need to be broadcasted&quot;</span>
        <span class="k">assert</span> <span class="n">dim2</span> <span class="o">&gt;</span> <span class="mi">0</span><span class="p">,</span> <span class="s2">&quot;0 dim of B is batch, need to be broadcasted&quot;</span>

    <span class="k">if</span> <span class="n">broadcast_firstdim</span><span class="p">:</span>
        <span class="c1"># Move the batch dim in front of the dense dims so it is carried along like a dense dim.</span>
        <span class="n">tA</span> <span class="o">=</span> <span class="n">torch</span><span class="o">.</span><span class="n">movedim</span><span class="p">(</span><span class="n">tA</span><span class="p">,</span> <span class="mi">0</span><span class="p">,</span> <span class="o">-</span><span class="n">densedim</span> <span class="o">-</span> <span class="mi">1</span><span class="p">)</span>
        <span class="n">tB</span> <span class="o">=</span> <span class="n">torch</span><span class="o">.</span><span class="n">movedim</span><span class="p">(</span><span class="n">tB</span><span class="p">,</span> <span class="mi">0</span><span class="p">,</span> <span class="o">-</span><span class="n">densedim</span> <span class="o">-</span> <span class="mi">1</span><span class="p">)</span>
        <span class="n">densedim</span> <span class="o">+=</span> <span class="mi">1</span>
        <span class="c1"># One masked dim (the batch) was removed from the front, hence the -1 offsets.</span>
        <span class="n">prod</span> <span class="o">=</span> <span class="n">batched_tensordot</span><span class="p">(</span><span class="n">tA</span><span class="p">,</span> <span class="n">A</span><span class="o">.</span><span class="n">masked_dim</span> <span class="o">-</span> <span class="mi">1</span><span class="p">,</span> <span class="n">dim1</span> <span class="o">-</span> <span class="mi">1</span><span class="p">,</span> <span class="n">tB</span><span class="p">,</span>
                                 <span class="n">B</span><span class="o">.</span><span class="n">masked_dim</span> <span class="o">-</span> <span class="mi">1</span><span class="p">,</span> <span class="n">dim2</span> <span class="o">-</span> <span class="mi">1</span><span class="p">)</span>
        <span class="c1"># Restore the batch dim to position 0 of the product.</span>
        <span class="n">prod</span> <span class="o">=</span> <span class="n">torch</span><span class="o">.</span><span class="n">movedim</span><span class="p">(</span><span class="n">prod</span><span class="p">,</span> <span class="o">-</span><span class="n">densedim</span><span class="p">,</span> <span class="mi">0</span><span class="p">)</span>
    <span class="k">else</span><span class="p">:</span>
        <span class="n">prod</span> <span class="o">=</span> <span class="n">batched_tensordot</span><span class="p">(</span><span class="n">tA</span><span class="p">,</span> <span class="n">A</span><span class="o">.</span><span class="n">masked_dim</span><span class="p">,</span> <span class="n">dim1</span><span class="p">,</span> <span class="n">tB</span><span class="p">,</span> <span class="n">B</span><span class="o">.</span><span class="n">masked_dim</span><span class="p">,</span>
                                 <span class="n">dim2</span><span class="p">)</span>
    <span class="k">return</span> <span class="n">MaskedTensor</span><span class="p">(</span><span class="n">prod</span><span class="p">,</span> <span class="n">mask</span><span class="p">)</span></div>

</pre></div>

           </div>
          </div>
          <footer>

  <hr/>

  <div role="contentinfo">
    <p>&#169; Copyright 2023.</p>
  </div>

  Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
    <a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
    provided by <a href="https://readthedocs.org">Read the Docs</a>.
   

</footer>
        </div>
      </div>
    </section>
  </div>
  <script>
      jQuery(function () {
          SphinxRtdTheme.Navigation.enable(true);
      });
  </script> 

</body>
</html>