Skip to content

Commit fc4ec1b

Browse files
author
GitHub Actions
committed
Update docs
1 parent 8181c8f commit fc4ec1b

File tree

3 files changed

+3
-3
lines changed

3 files changed

+3
-3
lines changed

_sources/deeplearning_operators/matmul.md.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -109,7 +109,7 @@ def matmul(M, N, K, block_M, block_N, block_K, dtype="float16", accum_dtype="flo
109 109   func = matmul(1024, 1024, 1024, 128, 128, 32)
110 110
111 111   # 2. JIT-compile the kernel for NVIDIA GPU
112     - jit_kernel = tilelang.JITKernel(func, out_idx=[2], target="cuda")
    112 + jit_kernel = tilelang.compile(func, out_idx=[2], target="cuda")
113 113
114 114   import torch
115 115
deeplearning_operators/matmul.html

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -326,7 +326,7 @@ <h3>Basic Structure<a class="headerlink" href="#basic-structure" title="Permalin
326 326   <span class="n">func</span> <span class="o">=</span> <span class="n">matmul</span><span class="p">(</span><span class="mi">1024</span><span class="p">,</span> <span class="mi">1024</span><span class="p">,</span> <span class="mi">1024</span><span class="p">,</span> <span class="mi">128</span><span class="p">,</span> <span class="mi">128</span><span class="p">,</span> <span class="mi">32</span><span class="p">)</span>
327 327
328 328   <span class="c1"># 2. JIT-compile the kernel for NVIDIA GPU</span>
329     - <span class="n">jit_kernel</span> <span class="o">=</span> <span class="n">tilelang</span><span class="o">.</span><span class="n">JITKernel</span><span class="p">(</span><span class="n">func</span><span class="p">,</span> <span class="n">out_idx</span><span class="o">=</span><span class="p">[</span><span class="mi">2</span><span class="p">],</span> <span class="n">target</span><span class="o">=</span><span class="s2">&quot;cuda&quot;</span><span class="p">)</span>
    329 + <span class="n">jit_kernel</span> <span class="o">=</span> <span class="n">tilelang</span><span class="o">.</span><span class="n">compile</span><span class="p">(</span><span class="n">func</span><span class="p">,</span> <span class="n">out_idx</span><span class="o">=</span><span class="p">[</span><span class="mi">2</span><span class="p">],</span> <span class="n">target</span><span class="o">=</span><span class="s2">&quot;cuda&quot;</span><span class="p">)</span>
330 330
331 331   <span class="kn">import</span> <span class="nn">torch</span>
332 332
0 commit comments

Comments
 (0)