Gracefully handle mem_get_info's runtime error message (pytorch#146899)
# Motivation
Gracefully handle the runtime error message when the device doesn't support querying the available free memory. See intel/torch-xpu-ops#1352

Pull Request resolved: pytorch#146899
Approved by: https://github.com/EikanWang
guangyey authored and Ryo-not-rio committed Feb 24, 2025
1 parent 6f05cd2 commit 24532f8
Showing 1 changed file with 9 additions and 2 deletions.
11 changes: 9 additions & 2 deletions torch/csrc/xpu/Module.cpp
@@ -380,8 +380,15 @@ static void initXpuMethodBindings(PyObject* module) {
   m.def("_xpu_getMemoryInfo", [](c10::DeviceIndex device_index) {
 #if SYCL_COMPILER_VERSION >= 20250000
     auto total = at::xpu::getDeviceProperties(device_index)->global_mem_size;
-    auto free = c10::xpu::get_raw_device(device_index)
-                    .get_info<sycl::ext::intel::info::device::free_memory>();
+    auto& device = c10::xpu::get_raw_device(device_index);
+    TORCH_CHECK(
+        device.has(sycl::aspect::ext_intel_free_memory),
+        "The device (",
+        at::xpu::getDeviceProperties(device_index)->name,
+        ") doesn't support querying the available free memory. ",
+        "You can file an issue at https://github.com/pytorch/pytorch/issues ",
+        "to help us prioritize its implementation.");
+    auto free = device.get_info<sycl::ext::intel::info::device::free_memory>();
     return std::make_tuple(free, total);
 #else
     TORCH_CHECK_NOT_IMPLEMENTED(
