Make transfer_to_logical_device copy the tensor during eager execution (#239)

Currently eager and generate don't have the same semantics. Generate would create a new value, while in eager we return the same tensor. It is desirable to have the same behavior in both paths; this will allow us to catch in-place errors on the torch level and not during IREE execution. The only downside is that during eager it will be slower. This is far less of a headache.

Signed-off-by: Boian Petkantchin <boian.petkantchin@amd.com>
iree-org · Oct 23, 2024 · 00dcee7 · 00dcee7
1 parent ae9a51c
commit 00dcee7
Show file tree

Hide file tree

Showing 2 changed files with 2 additions and 2 deletions.
diff --git a/iree/turbine/ops/iree.py b/iree/turbine/ops/iree.py
@@ -89,7 +89,7 @@ def select(self, ksel: KernelSelection):
         ksel.return_tensor(ta.t).specialize_dims(*spec)
 
     def eager_execute(self, device_moniker, tensor):
-        return tensor
+        return tensor.clone()
 
     def generate(self, ksel: KernelSelection, kb: KernelBuilder):
         moniker = cast(AttrArg, ksel.arg_descs[0]).v

diff --git a/tests/ops/iree_test.py b/tests/ops/iree_test.py
@@ -36,7 +36,7 @@ class TransferToLogicalDeviceTest(unittest.TestCase):
     def testEager(self):
         t1 = torch.randn(3, 4)
         t2 = ops.iree.transfer_to_logical_device("1", t1)
-        self.assertIs(t1, t2)
+        assert torch.all(t1 == t2)
 
     def testAOT(self):
         class MyModule(nn.Module):