
Commit b8ace6f

amathewc authored and pytorchmergebot committed
Make dtensor tests device agnostic (#155687)
## MOTIVATION

This PR is a continuation of #154840: it makes the tests device-agnostic by removing hard-coded references to any particular device. Please refer to this RFC as well: pytorch/rfcs#66

## CHANGES

1. test_convolution_ops.py:
   - Replace "cuda" with self.device_type.
2. test_random_ops.py:
   - Remove the TYPE_DEVICE variable, since device_type is already set per environment (device) by the DTensorTestBase class.
   - Replace "cuda" with self.device_type.

Pull Request resolved: #155687
Approved by: https://github.com/EikanWang, https://github.com/d4l3k
1 parent f3ec16c commit b8ace6f
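
For orientation, here is a minimal sketch of the pattern the changes below apply, assuming a test derived from DTensorTestBase; the class and helper names in the sketch are hypothetical and not part of this PR:

```python
# Sketch only, not part of this PR: the device-agnostic pattern the diff
# switches the tests to. `self.device_type` is provided by DTensorTestBase
# and reflects the test environment ("cuda", "hpu", ...), so no backend is
# hard-coded in the test body.
import torch
from torch.distributed.device_mesh import init_device_mesh
from torch.testing._internal.distributed._tensor.common_dtensor import DTensorTestBase


class DeviceAgnosticExampleTest(DTensorTestBase):  # hypothetical test class
    def _mesh_and_device(self):  # hypothetical helper
        # Build the mesh from the environment-provided device type instead of
        # passing device_type="cuda".
        mesh = init_device_mesh(
            device_type=self.device_type, mesh_shape=(self.world_size,)
        )
        # Resolve the current device index through the matching backend module
        # (torch.cuda, torch.hpu, ...) instead of calling torch.cuda directly.
        device = torch.device(
            self.device_type,
            torch.get_device_module(self.device_type).current_device(),
        )
        return mesh, device
```

Because DTensorTestBase resolves self.device_type from the test environment, the same test code can drive CUDA, HPU, or other accelerators without edits.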

File tree: 2 files changed (+16, -11 lines)


test/distributed/tensor/test_convolution_ops.py

Lines changed: 1 addition & 1 deletion
```diff
@@ -187,7 +187,7 @@ def test_depthwise_convolution(self):
     @skip_if_lt_x_gpu(2)
     def test_conv_backward_none_grad_inp(self):
         device_mesh = init_device_mesh(
-            device_type="cuda", mesh_shape=(self.world_size,)
+            device_type=self.device_type, mesh_shape=(self.world_size,)
         )
         conv = nn.Conv2d(64, 64, 3, padding=1).train()
         x = torch.randn(1, 64, 32, 32)
```
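
As a usage note (a standalone sketch, not taken from the PR), the same init_device_mesh call works unchanged for any backend once the device type is a plain variable; device_type below is a stand-in for whatever the environment selects, and a running torch.distributed process group is assumed:

```python
# Standalone sketch, not part of this PR. Assumes torch.distributed has
# already been initialized with the desired number of ranks.
import torch
import torch.distributed as dist
from torch.distributed.device_mesh import init_device_mesh
from torch.distributed.tensor import Shard, distribute_tensor

device_type = "cuda"  # stand-in; could equally be "hpu" or "xpu" on other hardware
mesh = init_device_mesh(device_type=device_type, mesh_shape=(dist.get_world_size(),))
x = torch.randn(1, 64, 32, 32, device=device_type)
dt = distribute_tensor(x, mesh, [Shard(1)])  # shard the channel dim across ranks
```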

test/distributed/tensor/test_random_ops.py

Lines changed: 15 additions & 10 deletions
```diff
@@ -24,7 +24,7 @@
 from torch.distributed.tensor._utils import compute_local_shape_and_global_offset
 from torch.distributed.tensor.debug import CommDebugMode
 from torch.distributed.tensor.parallel import ColwiseParallel, parallelize_module
-from torch.testing._internal.common_utils import run_tests, TEST_HPU
+from torch.testing._internal.common_utils import run_tests
 from torch.testing._internal.distributed._tensor.common_dtensor import (
     DTensorTestBase,
     skip_if_lt_x_gpu,
@@ -33,9 +33,6 @@
 )
 
 
-TYPE_DEVICE = "hpu" if TEST_HPU else "cuda"
-
-
 class DistTensorRandomInitTest(DTensorTestBase):
     def _run_init_op(self, init_op, *args, **kwargs):
         device_mesh = self.build_device_mesh()
@@ -55,7 +52,7 @@ def _run_init_op(self, init_op, *args, **kwargs):
             self.assertEqual(local_tensor_clone, dtensor.to_local())
         else:
             # create DTensor from Tensor
-            _tensor = torch.empty(*input_size, device=TYPE_DEVICE)
+            _tensor = torch.empty(*input_size, device=self.device_type)
             dtensor = distribute_tensor(_tensor, device_mesh, [Shard(1)])
 
             # DTensor random init
@@ -173,7 +170,9 @@ def test_tp_model_meta_init(self):
         self.assertEqual(model.weight.device, torch.device("meta"))
 
         # actual initialization
-        device = torch.device("cuda", torch.cuda.current_device())
+        device = torch.device(
+            self.device_type, torch.get_device_module(self.device_type).current_device()
+        )
         model.to_empty(device=device)
         model.reset_parameters()
         self.assertTrue(
@@ -224,7 +223,9 @@ def test_fsdp_tp_model_meta_init(self):
         self.assertEqual(model.weight.device, torch.device("meta"))
 
         # actual initialization
-        device = torch.device("cuda", torch.cuda.current_device())
+        device = torch.device(
+            self.device_type, torch.get_device_module(self.device_type).current_device()
+        )
         model.to_empty(device=device)
         model.reset_parameters()
         self.assertTrue(
@@ -266,7 +267,9 @@ def test_rng_tracker_init(self):
         # seed synchronization now does NOT happen after the first `distribute_tensor`
         # call
         dt = distribute_tensor(
-            torch.empty([self.world_size], device=TYPE_DEVICE), device_mesh, [Shard(0)]
+            torch.empty([self.world_size], device=self.device_type),
+            device_mesh,
+            [Shard(0)],
         )
         self.assertTrue(random._rng_tracker is None)
         # seed synchronization only happens after `manual_seed` or the first DTensor
@@ -366,7 +369,7 @@ def test_deterministic_dropout_1d(self):
         size = [4, 4]
 
         dtensor = distribute_tensor(
-            torch.empty(*size, device=TYPE_DEVICE), device_mesh, [Shard(1)]
+            torch.empty(*size, device=self.device_type), device_mesh, [Shard(1)]
         )
 
         # a random op call shifts the offset
@@ -571,7 +574,9 @@ def test_hsdp_tp_model_meta_init(self):
         self.assertEqual(model.weight.device, torch.device("meta"))
 
         # actual initialization
-        device = torch.device("cuda", torch.cuda.current_device())
+        device = torch.device(
+            self.device_type, torch.get_device_module(self.device_type).current_device()
+        )
         model.to_empty(device=device)
         model.reset_parameters()
         self.assertTrue(
```
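
The meta-init hunks above all route through torch.get_device_module so that current_device() can be queried without naming torch.cuda; a small illustration of what that indirection does (a sketch, not from the PR):

```python
# Sketch, not part of this PR: torch.get_device_module maps a device type
# string to the matching backend module, so device-index queries stay
# backend-neutral.
import torch

device_type = "cuda"  # stand-in for self.device_type in the tests above
mod = torch.get_device_module(device_type)  # e.g. torch.cuda, torch.hpu, torch.xpu

# Guard so the sketch also runs on machines without that accelerator.
if mod.is_available():
    device = torch.device(device_type, mod.current_device())
    print(device)  # e.g. cuda:0
```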
