Rename ir to ttir in Binary::asm()

triton-lang · ptillet · Apr 23, 2021
commit 38ee6a3ef1882536b7b18d7eab81f6088209a0a5
diff --git a/python/triton/code_gen.py b/python/triton/code_gen.py
@@ -396,7 +396,7 @@ def __init__(self, module, kernel, num_warps, shared_mem, ir_asm):
         self.num_warps = num_warps
 
     def asm(self, mode):
-        if mode == 'ir':
+        if mode == 'ttir':
             return self.ir_asm
         if mode == 'ptx':
             return self.module.ptx()

diff --git a/python/tutorials/01-vector-add.py b/python/tutorials/01-vector-add.py
@@ -54,10 +54,10 @@ def add(x, y):
     #  - torch.tensor objects are implicitly converted to pointers to their first element.
     #  - `triton.jit`'ed functions can be subscripted with a launch grid to obtain a callable GPU kernel
     #  - don't forget to pass meta-parameters as keywords arguments
-    kernel = _add[grid](x, y, z, N, BLOCK=1024)
+    _add[grid](x, y, z, N, BLOCK=1024)
     # We return a handle to z but, since `torch.cuda.synchronize()` hasn't been called, the kernel is still
     # running asynchronously.
-    return z, kernel
+    return z
 
 
 # %%
@@ -68,16 +68,11 @@ def add(x, y):
 x = torch.rand(size, device='cuda')
 y = torch.rand(size, device='cuda')
 za = x + y
-zb, kernel = add(x, y)
+zb = add(x, y)
 print(za)
 print(zb)
 print(f'The maximum difference between torch and triton is ' f'{torch.max(torch.abs(za - zb))}')
 
-# print asm
-# print(kernel.asm('ir'))
-# print(kernel.asm('ptx'))
-# print(kernel.asm('llir'))
-
 # %%
 # Seems like we're good to go!