PaddlePaddle · youge325 · Apr 11, 2026 · Apr 12, 2026 · Apr 13, 2026 · Copilot
diff --git a/paddle/phi/api/include/compat/ATen/core/TensorBody.h b/paddle/phi/api/include/compat/ATen/core/TensorBody.h
@@ -138,20 +138,17 @@ class Tensor : public TensorBase {
   }
 
   Tensor toBackend(c10::Backend b) const {
-    if (b == c10::Backend::CPU) {
-      PaddlePlace place(phi::AllocationType::CPU);
-      return tensor_.copy_to(place, true);
-    } else if (b == c10::Backend::CUDA) {
-      auto place = paddle::DefaultGPUPlace();
-      return tensor_.copy_to(place, true);
-    } else if (b == c10::Backend::XPU) {
-      PaddlePlace place(phi::AllocationType::XPU);
-      return tensor_.copy_to(place, true);
-    } else if (b == c10::Backend::IPU) {
-      PaddlePlace place(phi::AllocationType::IPU);
-      return tensor_.copy_to(place, true);
-    } else {
-      PD_CHECK(false, "Unsupported backend");
+    switch (b) {  // each supported backend returns a copy_to() on its place
+      case c10::Backend::CPU:
+        return tensor_.copy_to(PaddlePlace(phi::AllocationType::CPU), true);
+      case c10::Backend::CUDA:  // place from paddle::DefaultGPUPlace()
+        return tensor_.copy_to(paddle::DefaultGPUPlace(), true);
+      case c10::Backend::XPU:  // place from paddle::DefaultXPUPlace()
+        return tensor_.copy_to(paddle::DefaultXPUPlace(), true);
+      case c10::Backend::IPU:  // default-constructed phi::IPUPlace
+        return tensor_.copy_to(PaddlePlace(phi::IPUPlace()), true);
+      default:  // every other backend reaches the failing PD_CHECK
+        PD_CHECK(false, "Unsupported backend");
     }
     return tensor_;
   }

diff --git a/paddle/phi/api/include/compat/ATen/ops/to.h b/paddle/phi/api/include/compat/ATen/ops/to.h
@@ -39,11 +39,11 @@ inline at::Tensor Tensor::to(
     phi::Place place;
     switch (dev.type()) {
       case c10::DeviceType::CPU:
-        place = phi::CPUPlace();
-        break;
       case c10::DeviceType::CUDA:
-        place = dev.has_index() ? phi::GPUPlace(dev.index())
-                                : paddle::DefaultGPUPlace();
+      case c10::DeviceType::XPU:
+      case c10::DeviceType::IPU:
+      case c10::DeviceType::CUSTOM:
+        place = dev._PD_GetInner();
         break;
       default:
         PD_THROW("Unsupported device type: ", dev.type());

diff --git a/paddle/phi/api/include/compat/c10/core/Device.h b/paddle/phi/api/include/compat/c10/core/Device.h
@@ -133,9 +133,9 @@ struct Device final {
       case DeviceType::CUDA:
         return has_index() ? phi::GPUPlace(index_) : paddle::DefaultGPUPlace();
       case DeviceType::XPU:
-        return phi::XPUPlace(has_index() ? index_ : 0);
+        return has_index() ? phi::XPUPlace(index_) : paddle::DefaultXPUPlace();
       case DeviceType::IPU:
-        return phi::IPUPlace(has_index() ? index_ : 0);
+        return has_index() ? phi::IPUPlace(index_) : phi::IPUPlace();
       case DeviceType::CUSTOM:
         return phi::CustomPlace(
             custom_device_type_.empty() ? "custom" : custom_device_type_,

diff --git a/test/cpp/compat/ATen_basic_test.cc b/test/cpp/compat/ATen_basic_test.cc
@@ -26,6 +26,9 @@
 #include <c10/cuda/CUDAFunctions.h>
 #include <c10/cuda/CUDAGuard.h>
 #endif
+#ifdef PADDLE_WITH_XPU
+#include "paddle/phi/core/platform/device/xpu/xpu_info.h"
+#endif
 #include "ATen/ATen.h"
 #include "gtest/gtest.h"
 #include "paddle/common/macros.h"
@@ -434,6 +437,61 @@ TEST(TensorBodyTest, ToBackendUnsupportedBranch) {
   ASSERT_THROW(t.toBackend(static_cast<c10::Backend>(-1)), ::std::exception);
 }
 
+TEST(TensorBodyTest, ToBackendCpuBranchCoverage) {
+  at::Tensor src = at::ones({1}, at::kFloat);
+  at::Tensor copied = src.toBackend(c10::Backend::CPU);
+  // CPU case: the result must report a CPU device and equal its source.
+  ASSERT_EQ(copied.device().type(), c10::DeviceType::CPU);
+  ASSERT_TRUE(copied.equal(src));
+}
+
+TEST(TensorBodyTest, ToBackendCudaBranchCoverage) {
+  at::Tensor src = at::ones({1}, at::kFloat);
+  // A std::exception is tolerated; otherwise the copy must report CUDA.
+  try {
+    at::Tensor moved = src.toBackend(c10::Backend::CUDA);
+    ASSERT_EQ(moved.device().type(), c10::DeviceType::CUDA);
+  } catch (const std::exception&) {
+    SUCCEED();
+  }
+}
+
+TEST(TensorBodyTest, ToBackendXpuBranchCoverage) {
+  at::Tensor src = at::ones({1}, at::kFloat);
+  // A std::exception is tolerated; otherwise the copy must report XPU.
+  try {
+    at::Tensor moved = src.toBackend(c10::Backend::XPU);
+    ASSERT_EQ(moved.device().type(), c10::DeviceType::XPU);
+  } catch (const std::exception&) {
+    SUCCEED();
+  }
+}
+
+TEST(TensorBodyTest, ToBackendIpuBranchCoverage) {
+  at::Tensor src = at::ones({1}, at::kFloat);
+  // A std::exception is tolerated; otherwise the copy must report IPU.
+  try {
+    at::Tensor moved = src.toBackend(c10::Backend::IPU);
+    ASSERT_EQ(moved.device().type(), c10::DeviceType::IPU);
+  } catch (const std::exception&) {
+    SUCCEED();
+  }
+}
+
+#ifdef PADDLE_WITH_XPU
+TEST(TensorBodyTest, ToBackendXpuUsesCurrentDevice) {
+  if (paddle::platform::GetXPUDeviceCount() < 2) {
+    return;  // device 1 is required below
+  }
+  paddle::platform::XPUDeviceGuard device_one_scope(1);
+  at::Tensor host = at::ones({1}, at::kFloat);
+  at::Tensor moved = host.toBackend(c10::Backend::XPU);
+  // Under XPUDeviceGuard(1), the index-less copy must report device 1.
+  ASSERT_EQ(moved.device().type(), c10::DeviceType::XPU);
+  ASSERT_EQ(moved.device().index(), 1);
+}
+#endif
+
 TEST(TensorBodyTest, MetaUnsupportedBranch) {
   at::Tensor t = at::ones({1}, at::kFloat);
   ASSERT_THROW((void)t.meta(), ::std::exception);

diff --git a/test/cpp/compat/ATen_empty_test.cc b/test/cpp/compat/ATen_empty_test.cc
@@ -19,6 +19,13 @@
 #include <ATen/ops/empty.h>
 #include <c10/core/ScalarType.h>
 #include <c10/core/TensorOptions.h>
+#if defined(PADDLE_WITH_CUDA) || defined(PADDLE_WITH_HIP)
+#include <c10/cuda/CUDAFunctions.h>
+#include <c10/cuda/CUDAGuard.h>
+#endif
+#ifdef PADDLE_WITH_XPU
+#include "paddle/phi/core/platform/device/xpu/xpu_info.h"
+#endif
 
 #include "ATen/ATen.h"
 #include "gtest/gtest.h"
@@ -55,8 +62,6 @@ TEST(ATenEmptyTest, ExplicitArgsCpu) {
 // ======================== pin_memory tests ========================
 
 #if defined(PADDLE_WITH_CUDA) || defined(PADDLE_WITH_HIP)
-#include <c10/cuda/CUDAFunctions.h>
-#include <c10/cuda/CUDAGuard.h>
 
 // TensorOptions overload: pin_memory via options
 TEST(ATenEmptyTest, PinMemoryViaTensorOptions) {
@@ -154,3 +159,17 @@ TEST(ATenEmptyTest, EmptyCudaOptionsHelperDefaultDeviceUsesCurrentDevice) {
 }
 
 #endif  // PADDLE_WITH_CUDA || PADDLE_WITH_HIP
+
+#ifdef PADDLE_WITH_XPU
+TEST(ATenEmptyTest, DefaultXpuDeviceUsesCurrentDevice) {
+  if (paddle::platform::GetXPUDeviceCount() < 2) {
+    return;  // device 1 is required below
+  }
+  paddle::platform::XPUDeviceGuard device_one_scope(1);
+  auto opts = at::TensorOptions().dtype(at::kFloat).device(at::kXPU);
+  at::Tensor created = at::empty({8}, opts);
+  // Under XPUDeviceGuard(1), the index-less kXPU option must yield device 1.
+  ASSERT_EQ(created.device().type(), c10::DeviceType::XPU);
+  ASSERT_EQ(created.device().index(), 1);
+}
+#endif
diff --git a/test/cpp/compat/ATen_to_test.cc b/test/cpp/compat/ATen_to_test.cc
@@ -25,6 +25,9 @@
 #include <c10/cuda/CUDAFunctions.h>
 #include <c10/cuda/CUDAGuard.h>
 #endif
+#ifdef PADDLE_WITH_XPU
+#include "paddle/phi/core/platform/device/xpu/xpu_info.h"
+#endif
 #include "ATen/ATen.h"
 #include "gtest/gtest.h"
 #include "paddle/phi/common/float16.h"
@@ -150,9 +153,9 @@ TEST(TensorToTest, ToCopyAndUnsupportedDeviceBranches) {
                            std::nullopt);
   EXPECT_TRUE(pinned.equal(t));
 
-  EXPECT_THROW(
-      t.to(at::TensorOptions().device(c10::Device(c10::DeviceType::XPU, 0))),
-      ::std::exception);
+  EXPECT_THROW(t.to(at::TensorOptions().device(
+                   c10::Device(static_cast<c10::DeviceType>(-1), 0))),
+               ::std::exception);
 }
 
 // ---- Overload 3: to(Device, ScalarType) ----
@@ -244,3 +247,34 @@ TEST(TensorToTest, ToDeviceWithoutIndexUsesCurrentCudaDevice) {
   ASSERT_EQ(result.device().index(), 1);
 }
 #endif
+
+#ifdef PADDLE_WITH_XPU
+TEST(TensorToTest, ToDevice_CPUToXPU) {
+  if (paddle::platform::GetXPUDeviceCount() == 0) {
+    return;  // no XPU reported, nothing to check
+  }
+  at::Tensor host = at::tensor({5.0f}, at::kFloat);
+  at::Tensor on_xpu = host.to(c10::Device(c10::kXPU, 0),
+                              at::kFloat,
+                              /*non_blocking=*/false,
+                              /*copy=*/false);
+  // An explicit index 0 must come back as XPU device 0.
+  ASSERT_EQ(on_xpu.device().type(), c10::DeviceType::XPU);
+  ASSERT_EQ(on_xpu.device().index(), 0);
+}
+
+TEST(TensorToTest, ToDeviceWithoutIndexUsesCurrentXpuDevice) {
+  if (paddle::platform::GetXPUDeviceCount() < 2) {
+    return;  // device 1 is required below
+  }
+  paddle::platform::XPUDeviceGuard device_one_scope(1);
+  at::Tensor host = at::tensor({5.0f}, at::kFloat);
+  at::Tensor on_xpu = host.to(c10::Device(c10::kXPU),
+                              at::kFloat,
+                              /*non_blocking=*/false,
+                              /*copy=*/false);
+  // Under XPUDeviceGuard(1), the index-less target must report device 1.
+  ASSERT_EQ(on_xpu.device().type(), c10::DeviceType::XPU);
+  ASSERT_EQ(on_xpu.device().index(), 1);
+}
+#endif
diff --git a/test/cpp/compat/c10_Device_test.cc b/test/cpp/compat/c10_Device_test.cc
@@ -18,6 +18,9 @@
 #include <c10/cuda/CUDAFunctions.h>
 #include <c10/cuda/CUDAGuard.h>
 #endif
+#ifdef PADDLE_WITH_XPU
+#include "paddle/phi/core/platform/device/xpu/xpu_info.h"
+#endif
 
 #include <sstream>
 #include <unordered_map>
@@ -130,8 +133,22 @@ TEST(DeviceCompatTest, DeviceParseAndPlaceBranches) {
   EXPECT_EQ(cuda_no_index._PD_GetInner().GetDeviceId(), 0);
 #endif
   c10::Device xpu_no_index(c10::DeviceType::XPU);
+#ifdef PADDLE_WITH_XPU
+  auto xpu_device_count = paddle::platform::GetXPUDeviceCount();
+  if (xpu_device_count > 0) {
+    EXPECT_EQ(xpu_no_index._PD_GetInner().GetType(), phi::AllocationType::XPU);
+  }
+  if (xpu_device_count >= 2) {
+    paddle::platform::XPUDeviceGuard guard(1);
+    EXPECT_EQ(c10::Device(c10::DeviceType::XPU)._PD_GetInner().GetDeviceId(),
+              1);
+  } else if (xpu_device_count == 1) {
+    EXPECT_EQ(xpu_no_index._PD_GetInner().GetDeviceId(), 0);
+  }
+#else
   EXPECT_EQ(xpu_no_index._PD_GetInner().GetType(), phi::AllocationType::XPU);
   EXPECT_EQ(xpu_no_index._PD_GetInner().GetDeviceId(), 0);
+#endif
   c10::Device ipu_no_index(c10::DeviceType::IPU);
   EXPECT_EQ(ipu_no_index._PD_GetInner().GetType(), phi::AllocationType::IPU);
   EXPECT_EQ(ipu_no_index._PD_GetInner().GetDeviceId(), 0);