switch from fx.symbolic_trace to dynamo_trace for converter test part-1 #3261

Open · wants to merge 42 commits into base: main
Changes from 1 commit (of 42 total)
Commits (42, all by lanluo-nvidia):

458a4d1  skip run_shape_analysis (Oct 6, 2024)
2f408f9  test (Oct 6, 2024)
1c5e86c  test (Oct 6, 2024)
ba487dc  test (Oct 6, 2024)
99d2274  Merge branch 'main' into lluo/save_remove_inputs (Oct 6, 2024)
2b43480  test (Oct 6, 2024)
b4e02e1  Merge branch 'main' into lluo/save_remove_inputs (Oct 11, 2024)
3d94f8b  test (Oct 13, 2024)
28ba6cc  Merge branch 'main' into lluo/save_remove_inputs (Oct 15, 2024)
b89cbe0  resolve comments (Oct 15, 2024)
2843d37  Merge branch 'main' into lluo/save_remove_inputs (Oct 16, 2024)
3eb48d7  test (Oct 16, 2024)
50eb0d8  replace dummy inference (Oct 20, 2024)
95ed602  test (Oct 20, 2024)
120f30d  test (Oct 21, 2024)
424cbf7  add run_test_with_dynamic_shape change (Oct 21, 2024)
2fc9cef  Merge branch 'main' into lluo/save_remove_inputs (Oct 21, 2024)
ef54cfc  split the PR, add dummy inference for converter test (Oct 21, 2024)
14f5d61  test (Oct 22, 2024)
7563959  test (Oct 22, 2024)
77355f0  test (Oct 22, 2024)
891e963  enable converter non dynamic shape tests to use dynamo tracer (Oct 22, 2024)
13361fd  add linear lowering meta val (Oct 22, 2024)
f0a9fef  add linear_lowering change (Oct 23, 2024)
cff64a4  test (Oct 23, 2024)
814262f  Merge branch 'lluo/save_remove_inputs' into lluo/switch_to_dynamo_trace (Oct 23, 2024)
933abac  test (Oct 23, 2024)
8417684  resolve comments (Oct 25, 2024)
8676f88  test (Oct 25, 2024)
d8e52bf  test (Oct 27, 2024)
4d46235  Merge branch 'lluo/save_remove_inputs' into lluo/switch_to_dynamo_trace (Oct 27, 2024)
8b3842a  test (Oct 27, 2024)
7ddf56f  test (Oct 27, 2024)
39e0a49  test (Oct 27, 2024)
076f47a  resolve comments (Oct 29, 2024)
8250179  Merge branch 'main' into lluo/save_remove_inputs (Oct 29, 2024)
96e93e4  resolve comments (Oct 29, 2024)
7a9659f  Merge branch 'lluo/save_remove_inputs' into lluo/switch_to_dynamo_trace (Oct 29, 2024)
cb656bb  Merge branch 'main' into lluo/switch_to_dynamo_trace (Oct 29, 2024)
c023714  resolve comments (Oct 30, 2024)
594ca28  resolve comments (Oct 30, 2024)
56d034b  resolve comments (Oct 31, 2024)
Viewing commit 7ddf56f27b9886c91b3c1c4de91d4b864283fc47: test (committed by lanluo-nvidia, Oct 27, 2024)
46 changes: 23 additions & 23 deletions tests/py/dynamo/conversion/test_attention.py
@@ -34,27 +34,26 @@ def forward(self, query, key, value):
             enable_passes=True,
         )
 
-    @unittest.skip("need to change to custom dynamic shapes")
     @parameterized.expand(
         [
-            # (
-            #     "4d-2d",
-            #     (4, 2, 16, 32),
-            #     (6, 3, 32, 64),
-            #     (32, 8, 64, 128),
-            #     (4, 32),
-            #     (4, 64),
-            #     (16, 128),
-            # ),
-            # (
-            #     "4d-3d",
-            #     (2, 2, 2, 2),
-            #     (3, 3, 3, 4),
-            #     (3, 4, 4, 5),
-            #     (2, 3, 2),
-            #     (3, 3, 4),
-            #     (4, 5, 5),
-            # ),
+            (
+                "4d-2d",
+                (4, 2, 16, 32),
+                (6, 3, 32, 64),
+                (32, 8, 64, 128),
+                (4, 32),
+                (4, 64),
+                (16, 128),
+            ),
+            (
+                "4d-3d",
+                (2, 2, 2, 2),
+                (3, 3, 3, 4),
+                (3, 4, 4, 5),
+                (2, 3, 2),
+                (3, 3, 4),
+                (4, 5, 5),
+            ),
             (
                 "4d-4d",
                 (4, 2, 12, 4),
@@ -66,6 +65,7 @@ def forward(self, query, key, value):
             ),
         ]
     )
+    @unittest.skip("need to change to custom dynamic shapes")
     def test_sdpa_no_causal_dynamic_shape_with_scale(
         self,
         _,
@@ -146,7 +146,6 @@ def forward(self, query, key, value):
             enable_passes=True,
         )
 
-    @unittest.skip("need to change to custom dynamic shapes")
     @parameterized.expand(
         [
             (
@@ -169,6 +168,7 @@ def forward(self, query, key, value):
             ),
         ]
     )
+    @unittest.skip("need to change to custom dynamic shapes")
     def test_sdpa_no_causal_no_scale_dynamic_shape(
         self,
         _,
@@ -217,7 +217,6 @@ def forward(self, query, key, value):
 
         self.run_test_with_dynamic_shape(SDPA(), inputs)
 
-    @unittest.skip("need to change to custom dynamic shapes")
     @parameterized.expand(
         [
             (
@@ -252,6 +251,7 @@ def forward(self, query, key, value):
             ),
         ]
     )
+    @unittest.skip("need to change to custom dynamic shapes")
     def test_sdpa_causal_dynamic_shape(
         self,
         _,
@@ -295,11 +295,14 @@ def forward(self, query, key, value):
 
         self.run_test_with_dynamic_shape(SDPA(), inputs)
 
-    # it is already added in the integration test
-    @parameterized.expand([((32, 8, 128, 64), (32, 8, 128, 64))])
+    # it is already added in the test_composite_aten_op.py as integration test
+    @unittest.skip(
+        "skip torch.nn.functional.scaled_dot_product_attention converter test"
+    )
+    @parameterized.expand([((32, 8, 128, 64), (32, 8, 128, 64))])
     def test_sdpa_causal(self, query_shape, key_shape):
         class SDPA(nn.Module):
             def forward(self, query, key, value):
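A note on the decorator reordering above: @parameterized.expand generates one test method per case when the class body is evaluated, and only decorators applied to the underlying function before expansion (i.e., listed below @parameterized.expand) are carried into each generated case. With the decorators in the opposite order, the skip would attach to what expand leaves behind rather than to the individual cases, which appears to be why this commit moves @unittest.skip. A minimal standalone sketch of the working order (hypothetical Demo class, not part of this PR; assumes the parameterized package is installed):

import unittest

from parameterized import parameterized


class Demo(unittest.TestCase):
    # unittest.skip marks the original function first; parameterized.expand
    # then generates test_pair_0_a and test_pair_1_b from the already-skipped
    # function, so both generated cases report as skipped.
    @parameterized.expand([("a",), ("b",)])
    @unittest.skip("need to change to custom dynamic shapes")
    def test_pair(self, name):
        self.assertTrue(name)


if __name__ == "__main__":
    unittest.main()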
194 changes: 194 additions & 0 deletions tests/py/dynamo/conversion/test_composite_aten_op.py
@@ -0,0 +1,194 @@
import unittest

import pytest
import torch
import torch.nn as nn
import torch_tensorrt as torchtrt
from parameterized import parameterized
from torch.export import Dim
from torch_tensorrt import Input
from torch_tensorrt.dynamo.utils import COSINE_THRESHOLD, cosine_similarity

assertions = unittest.TestCase()


@pytest.mark.unit
@parameterized.expand(
    [
        ((5,), (5,)),
        (
            (
                2,
                3,
            ),
            (
                2,
                3,
            ),
        ),
    ]
)
def test_atan2_out_static_shape(input_shape, out_shape):
    class atan2(torch.nn.Module):
        def forward(self, lhs_val, rhs_val, out):
            return torch.ops.aten.atan2.out(lhs_val, rhs_val, out=out)

    model = atan2().eval().cuda()
    inputs = (
        torch.randn(input_shape).cuda(),
        torch.randn(input_shape).cuda(),
        torch.randn(out_shape).cuda(),
    )
    compile_spec = {
        "inputs": inputs,
        "ir": "dynamo",
        "min_block_size": 1,
    }

    trt_model = torchtrt.compile(model, **compile_spec)
    py_outputs = model(*inputs)
    trt_outputs = trt_model(*inputs)
    cos_sim = cosine_similarity(py_outputs, trt_outputs)
    assertions.assertTrue(
        cos_sim > COSINE_THRESHOLD,
        msg=f"test_atan2_out_static_shape model TRT outputs don't match with the pytorch model. Cosine sim score: {cos_sim} Threshold: {COSINE_THRESHOLD}",
    )


@pytest.mark.unit
@parameterized.expand(
    [
        (
            (
                1,
                2,
            ),
            (2, 3),
            (2, 4),
        ),
    ]
)
def test_atan2_out_dynamic_shape(min_shape, opt_shape, max_shape):
    class atan2(torch.nn.Module):
        def forward(self, lhs_val, rhs_val, out):
            return torch.ops.aten.atan2.out(lhs_val, rhs_val, out=out)

    model = atan2().eval().cuda()
    input_spec = [
        Input(
            min_shape=min_shape,
            opt_shape=opt_shape,
            max_shape=max_shape,
        ),
        Input(
            min_shape=min_shape,
            opt_shape=opt_shape,
            max_shape=max_shape,
        ),
        Input(
            min_shape=min_shape,
            opt_shape=opt_shape,
            max_shape=max_shape,
        ),
    ]

    compile_spec = {
        "inputs": input_spec,
        "ir": "dynamo",
        "min_block_size": 1,
    }

    trt_model = torchtrt.compile(model, **compile_spec)
    inputs = (
        torch.randn(max_shape).cuda(),
        torch.randn(max_shape).cuda(),
        torch.randn(max_shape).cuda(),
    )
    py_outputs = model(*inputs)
    trt_outputs = trt_model(*inputs)
    cos_sim = cosine_similarity(py_outputs, trt_outputs)
    assertions.assertTrue(
        cos_sim > COSINE_THRESHOLD,
        msg=f"test_atan2_out_dynamic_shape model TRT outputs don't match with the pytorch model. Cosine sim score: {cos_sim} Threshold: {COSINE_THRESHOLD}",
    )


@parameterized.expand(
    [
        ((32, 8, 128, 64), (32, 8, 128, 64), True, None),
        ((32, 32, 128, 64), (32, 8, 128, 64), True, 0.1),
    ]
)
def test_sdpa_static_shape(query_shape, key_shape, is_causal, scale):
    class SDPA(nn.Module):
        def forward(self, query, key, value):
            return torch.nn.functional.scaled_dot_product_attention(
                query, key, value, None, 0.0, is_causal=is_causal, scale=scale
            )

    model = SDPA().eval().cuda()

    query = torch.randn(query_shape, dtype=torch.float16).cuda()
    key = torch.randn(key_shape, dtype=torch.float16).cuda()
    value = torch.randn(key_shape, dtype=torch.float16).cuda()
    inputs = (query, key, value)
    compile_spec = {
        "inputs": inputs,
        "ir": "dynamo",
        "min_block_size": 1,
    }

    trt_model = torchtrt.compile(model, **compile_spec)
    py_outputs = model(*inputs)
    trt_outputs = trt_model(*inputs)
    cos_sim = cosine_similarity(py_outputs, trt_outputs)
    assertions.assertTrue(
        cos_sim > COSINE_THRESHOLD,
        msg=f"test_sdpa_static_shape model TRT outputs don't match with the pytorch model. Cosine sim score: {cos_sim} Threshold: {COSINE_THRESHOLD}",
    )


@parameterized.expand(
    [
        (True, None),
        (True, 0.1),
        (False, None),
    ]
)
def test_sdpa_dynamic_shape(is_causal, scale):
    class SDPA(nn.Module):
        def forward(self, query, key, value):
            return torch.nn.functional.scaled_dot_product_attention(
                query, key, value, None, 0.0, is_causal=is_causal, scale=scale
            )

    model = SDPA().eval().cuda()

    # N: batch_size
    dyn_N = Dim("dyn_N", min=2, max=4)

    # query tensor shape (N, ..., Hq, L, E)
    query = torch.randn((3, 3, 4, 64), dtype=torch.float16).cuda()
    # key tensor shape (N, ..., H, S, E)
    key = torch.randn((3, 3, 4, 64), dtype=torch.float16).cuda()
    # value tensor shape (N, ..., H, S, Ev)
    value = torch.randn((3, 3, 4, 64), dtype=torch.float16).cuda()

    dynamic_shapes = {"query": {0: dyn_N}, "key": {0: dyn_N}, "value": {0: dyn_N}}
    inputs = (query, key, value)

    exp_program = torch.export.export(model, inputs, dynamic_shapes=dynamic_shapes)

    compile_spec = {
        "inputs": inputs,
        "ir": "dynamo",
        "min_block_size": 1,
    }
    trt_model = torchtrt.dynamo.compile(exp_program, **compile_spec)
    py_outputs = model(*inputs)
    trt_outputs = trt_model(*inputs)
    cos_sim = cosine_similarity(py_outputs, trt_outputs)
    assertions.assertTrue(
        cos_sim > COSINE_THRESHOLD,
        msg=f"test_sdpa_dynamic_shape model TRT outputs don't match with the pytorch model. Cosine sim score: {cos_sim} Threshold: {COSINE_THRESHOLD}",
    )
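All four tests in this new file share one acceptance pattern: compile the eager module through Torch-TensorRT, run both modules on identical inputs, and require the outputs to agree up to a cosine-similarity threshold. A minimal sketch of that style of check, using assumed stand-ins for the cosine_similarity helper and COSINE_THRESHOLD constant that the file imports from torch_tensorrt.dynamo.utils:

import torch

# Assumed illustrative threshold; the real value is imported from
# torch_tensorrt.dynamo.utils as COSINE_THRESHOLD.
COSINE_THRESHOLD = 0.99


def outputs_match(py_out: torch.Tensor, trt_out: torch.Tensor) -> bool:
    # Flatten both outputs and compute a single cosine-similarity score;
    # a score near 1.0 means the TRT engine reproduces the eager result.
    score = torch.nn.functional.cosine_similarity(
        py_out.flatten().float(), trt_out.flatten().float(), dim=0
    )
    return bool(score > COSINE_THRESHOLD)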