Skip to content

Commit 095faec

Browse files
authored
Error Handling: make XLATensor::Create() return status type. (#9544)
1 parent 8c1449f commit 095faec

File tree

5 files changed

+85
-50
lines changed

5 files changed

+85
-50
lines changed

test/cpp/test_tensor.cpp

Lines changed: 64 additions & 39 deletions
Original file line numberDiff line numberDiff line change
@@ -101,8 +101,8 @@ TEST_F(TensorTest, TestAdd) {
101101
at::Tensor c = a.add(b, 1.0);
102102

103103
ForEachDevice([&](const torch::lazy::BackendDevice& device) {
104-
XLATensorPtr dev_a = XLATensor::Create(a, device);
105-
XLATensorPtr dev_b = XLATensor::Create(b, device);
104+
XLATensorPtr dev_a = GetValueOrThrow(XLATensor::Create(a, device));
105+
XLATensorPtr dev_b = GetValueOrThrow(XLATensor::Create(b, device));
106106
XLATensorPtr dev_c = tensor_methods::add(dev_a, dev_b, 1.0);
107107

108108
AllClose(c, dev_c);
@@ -121,8 +121,8 @@ TEST_F(TensorTest, TestIntegerAdd) {
121121
at::isIntegralType(type) ? at::Scalar(int64_t(1)) : at::Scalar(1.0);
122122
at::Tensor c = a.add(b, one);
123123

124-
XLATensorPtr dev_a = XLATensor::Create(a, device);
125-
XLATensorPtr dev_b = XLATensor::Create(b, device);
124+
XLATensorPtr dev_a = GetValueOrThrow(XLATensor::Create(a, device));
125+
XLATensorPtr dev_b = GetValueOrThrow(XLATensor::Create(b, device));
126126
XLATensorPtr dev_c = tensor_methods::add(dev_a, dev_b, one);
127127

128128
EXPECT_TRUE(EqualValuesNoElementTypeCheck(
@@ -135,7 +135,7 @@ TEST_F(TensorTest, TestSize) {
135135
at::Tensor input = at::rand({2, 1, 4, 6}, at::TensorOptions(at::kFloat));
136136
int rank = input.dim();
137137
ForEachDevice([&](const torch::lazy::BackendDevice& device) {
138-
XLATensorPtr dev_input = XLATensor::Create(input, device);
138+
XLATensorPtr dev_input = GetValueOrThrow(XLATensor::Create(input, device));
139139
for (int dim = -rank; dim < rank; ++dim) {
140140
EXPECT_EQ(input.size(dim), dev_input->size(dim));
141141
}
@@ -151,8 +151,10 @@ TEST_F(TensorTest, TestRrelu) {
151151
at::Tensor noise = at::zeros_like(input);
152152
at::Tensor output =
153153
at::rrelu_with_noise(input, noise, lower, upper, training);
154-
XLATensorPtr dev_input = XLATensor::Create(input, device);
155-
XLATensorPtr dev_noise = XLATensor::Create(noise, device);
154+
XLATensorPtr dev_input =
155+
GetValueOrThrow(XLATensor::Create(input, device));
156+
XLATensorPtr dev_noise =
157+
GetValueOrThrow(XLATensor::Create(noise, device));
156158
XLATensorPtr dev_outputs = tensor_methods::rrelu_with_noise(
157159
dev_input, dev_noise, lower, upper, training);
158160
AllClose(output, dev_outputs);
@@ -167,7 +169,7 @@ TEST_F(TensorTest, TestThreshold) {
167169
float value = 20;
168170
at::Tensor output = at::threshold(input, threshold, value);
169171
ForEachDevice([&](const torch::lazy::BackendDevice& device) {
170-
XLATensorPtr dev_input = XLATensor::Create(input, device);
172+
XLATensorPtr dev_input = GetValueOrThrow(XLATensor::Create(input, device));
171173
XLATensorPtr dev_output =
172174
tensor_methods::threshold(dev_input, threshold, value);
173175
AllClose(output, dev_output);
@@ -185,9 +187,10 @@ TEST_F(TensorTest, TestAddMatMul) {
185187
at::Tensor bias = at::rand({labels}, at::TensorOptions(at::kFloat));
186188
at::Tensor output = at::addmm(bias, input, weight);
187189
ForEachDevice([&](const torch::lazy::BackendDevice& device) {
188-
XLATensorPtr dev_input = XLATensor::Create(input, device);
189-
XLATensorPtr dev_weight = XLATensor::Create(weight, device);
190-
XLATensorPtr dev_bias = XLATensor::Create(bias, device);
190+
XLATensorPtr dev_input = GetValueOrThrow(XLATensor::Create(input, device));
191+
XLATensorPtr dev_weight =
192+
GetValueOrThrow(XLATensor::Create(weight, device));
193+
XLATensorPtr dev_bias = GetValueOrThrow(XLATensor::Create(bias, device));
191194
XLATensorPtr dev_output =
192195
tensor_methods::addmm(dev_input, dev_weight, dev_bias);
193196
AllClose(output, dev_output);
@@ -198,7 +201,7 @@ TEST_F(TensorTest, TestTranspose) {
198201
at::Tensor input = at::rand({2, 3}, at::TensorOptions(at::kFloat));
199202
at::Tensor output = at::transpose(input, 0, 1);
200203
ForEachDevice([&](const torch::lazy::BackendDevice& device) {
201-
XLATensorPtr dev_input = XLATensor::Create(input, device);
204+
XLATensorPtr dev_input = GetValueOrThrow(XLATensor::Create(input, device));
202205
XLATensorPtr dev_output = tensor_methods::transpose(dev_input, 0, 1);
203206
AllClose(output, dev_output);
204207
});
@@ -208,7 +211,7 @@ TEST_F(TensorTest, TestView) {
208211
at::Tensor input = at::rand({32, 20, 4, 4}, at::TensorOptions(at::kFloat));
209212
at::Tensor output = input.view({-1, 320});
210213
ForEachDevice([&](const torch::lazy::BackendDevice& device) {
211-
XLATensorPtr dev_input = XLATensor::Create(input, device);
214+
XLATensorPtr dev_input = GetValueOrThrow(XLATensor::Create(input, device));
212215
XLATensorPtr dev_output = tensor_methods::view(dev_input, {-1, 320});
213216
AllClose(output, dev_output);
214217
});
@@ -289,7 +292,8 @@ TEST_F(TensorTest, TestMaxPool2D) {
289292
/*padding=*/{padding, padding}, /*dilation=*/{1, 1},
290293
/*ceil_mode=*/false);
291294
ForEachDevice([&](const torch::lazy::BackendDevice& device) {
292-
XLATensorPtr dev_input = XLATensor::Create(input, device);
295+
XLATensorPtr dev_input =
296+
GetValueOrThrow(XLATensor::Create(input, device));
293297
auto dev_output = tensor_methods::max_pool_nd(
294298
dev_input,
295299
/*spatial_dim_count=*/2,
@@ -313,7 +317,8 @@ TEST_F(TensorTest, TestMaxPool2DNonSquare) {
313317
/*padding=*/{padding, padding + 1}, /*dilation=*/{1, 1},
314318
/*ceil_mode=*/false);
315319
ForEachDevice([&](const torch::lazy::BackendDevice& device) {
316-
XLATensorPtr dev_input = XLATensor::Create(input, device);
320+
XLATensorPtr dev_input =
321+
GetValueOrThrow(XLATensor::Create(input, device));
317322
auto dev_output = tensor_methods::max_pool_nd(
318323
dev_input,
319324
/*spatial_dim_count=*/2,
@@ -341,7 +346,8 @@ TEST_F(TensorTest, TestAvgPool2D) {
341346
/*ceil_mode=*/false, count_include_pad,
342347
/*divisor_override=*/std::nullopt);
343348
ForEachDevice([&](const torch::lazy::BackendDevice& device) {
344-
XLATensorPtr dev_input = XLATensor::Create(input, device);
349+
XLATensorPtr dev_input =
350+
GetValueOrThrow(XLATensor::Create(input, device));
345351
XLATensorPtr dev_output = tensor_methods::avg_pool_nd(
346352
dev_input,
347353
/*spatial_dim_count=*/2,
@@ -371,7 +377,8 @@ TEST_F(TensorTest, TestAvgPool2DNonSquare) {
371377
/*count_include_pad=*/count_include_pad,
372378
/*divisor_override=*/std::nullopt);
373379
ForEachDevice([&](const torch::lazy::BackendDevice& device) {
374-
XLATensorPtr dev_input = XLATensor::Create(input, device);
380+
XLATensorPtr dev_input =
381+
GetValueOrThrow(XLATensor::Create(input, device));
375382
XLATensorPtr dev_output = tensor_methods::avg_pool_nd(
376383
dev_input,
377384
/*spatial_dim_count=*/2,
@@ -409,15 +416,20 @@ TEST_F(TensorTest, TestBatchNorm1D) {
409416
/*running_mean=*/running_mean, /*running_var=*/running_var,
410417
/*training=*/training, /*momentum=*/momentum, /*eps=*/eps);
411418
ForEachDevice([&](const torch::lazy::BackendDevice& device) {
412-
XLATensorPtr xla_input = XLATensor::Create(input, device);
413-
XLATensorPtr xla_weight = undef_weight_bias
414-
? XLATensorPtr()
415-
: XLATensor::Create(weight, device);
416-
XLATensorPtr xla_bias = undef_weight_bias
417-
? XLATensorPtr()
418-
: XLATensor::Create(bias, device);
419-
XLATensorPtr xla_running_mean = XLATensor::Create(running_mean, device);
420-
XLATensorPtr xla_running_var = XLATensor::Create(running_var, device);
419+
XLATensorPtr xla_input =
420+
GetValueOrThrow(XLATensor::Create(input, device));
421+
XLATensorPtr xla_weight =
422+
undef_weight_bias
423+
? XLATensorPtr()
424+
: GetValueOrThrow(XLATensor::Create(weight, device));
425+
XLATensorPtr xla_bias =
426+
undef_weight_bias
427+
? XLATensorPtr()
428+
: GetValueOrThrow(XLATensor::Create(bias, device));
429+
XLATensorPtr xla_running_mean =
430+
GetValueOrThrow(XLATensor::Create(running_mean, device));
431+
XLATensorPtr xla_running_var =
432+
GetValueOrThrow(XLATensor::Create(running_var, device));
421433
auto xla_output = tensor_methods::native_batch_norm(
422434
/*input=*/xla_input, /*weight=*/xla_weight, /*bias=*/xla_bias,
423435
/*running_mean=*/xla_running_mean, /*running_var=*/xla_running_var,
@@ -474,11 +486,14 @@ TEST_F(TensorTest, TestConv2D) {
474486
/*output_padding=*/{output_padding, output_padding},
475487
/*groups=*/groups, false, false, false);
476488
ForEachDevice([&](const torch::lazy::BackendDevice& device) {
477-
XLATensorPtr dev_input = XLATensor::Create(input, device);
478-
XLATensorPtr dev_weight = XLATensor::Create(weight, device);
489+
XLATensorPtr dev_input =
490+
GetValueOrThrow(XLATensor::Create(input, device));
491+
XLATensorPtr dev_weight =
492+
GetValueOrThrow(XLATensor::Create(weight, device));
479493
XLATensorPtr dev_output;
480494
if (with_bias) {
481-
XLATensorPtr dev_bias = XLATensor::Create(bias, device);
495+
XLATensorPtr dev_bias =
496+
GetValueOrThrow(XLATensor::Create(bias, device));
482497
dev_output = tensor_methods::convolution_overrideable(
483498
dev_input, dev_weight, dev_bias,
484499
/*stride=*/{stride, stride},
@@ -543,11 +558,14 @@ TEST_F(TensorTest, TestConv2DNonSquare) {
543558
/*groups=*/groups, false, false, false);
544559

545560
ForEachDevice([&](const torch::lazy::BackendDevice& device) {
546-
XLATensorPtr dev_input = XLATensor::Create(input, device);
547-
XLATensorPtr dev_weight = XLATensor::Create(weight, device);
561+
XLATensorPtr dev_input =
562+
GetValueOrThrow(XLATensor::Create(input, device));
563+
XLATensorPtr dev_weight =
564+
GetValueOrThrow(XLATensor::Create(weight, device));
548565
XLATensorPtr dev_output;
549566
if (with_bias) {
550-
XLATensorPtr dev_bias = XLATensor::Create(bias, device);
567+
XLATensorPtr dev_bias =
568+
GetValueOrThrow(XLATensor::Create(bias, device));
551569
dev_output = tensor_methods::convolution_overrideable(
552570
dev_input, dev_weight, dev_bias,
553571
/*stride=*/{stride, stride + 1},
@@ -616,11 +634,14 @@ TEST_F(TensorTest, TestConv3D) {
616634
{output_padding, output_padding, output_padding},
617635
/*groups=*/groups, false, false, false);
618636
ForEachDevice([&](const torch::lazy::BackendDevice& device) {
619-
XLATensorPtr dev_input = XLATensor::Create(input, device);
620-
XLATensorPtr dev_weight = XLATensor::Create(weight, device);
637+
XLATensorPtr dev_input =
638+
GetValueOrThrow(XLATensor::Create(input, device));
639+
XLATensorPtr dev_weight =
640+
GetValueOrThrow(XLATensor::Create(weight, device));
621641
XLATensorPtr dev_output;
622642
if (with_bias) {
623-
XLATensorPtr dev_bias = XLATensor::Create(bias, device);
643+
XLATensorPtr dev_bias =
644+
GetValueOrThrow(XLATensor::Create(bias, device));
624645
dev_output = tensor_methods::convolution_overrideable(
625646
dev_input, dev_weight, dev_bias,
626647
/*stride=*/{stride, stride, stride},
@@ -688,10 +709,14 @@ TEST_F(TensorTest, TestConv3D) {
688709
// {output_padding, output_padding + 1, output_padding},
689710
// /*groups=*/groups, false, false, false);
690711
// ForEachDevice([&](const torch::lazy::BackendDevice& device) {
691-
// XLATensorPtr dev_input = XLATensor::Create(input, device);
692-
// XLATensorPtr dev_weight = XLATensor::Create(weight,
693-
// device); XLATensorPtr dev_output; if (with_bias) {
694-
// XLATensorPtr dev_bias = XLATensor::Create(bias, device);
712+
// XLATensorPtr dev_input =
713+
// GetValueOrThrow(XLATensor::Create(input, device));
714+
// XLATensorPtr dev_weight =
715+
// GetValueOrThrow(XLATensor::Create(weight, device));
716+
// XLATensorPtr dev_output;
717+
// if (with_bias) {
718+
// XLATensorPtr dev_bias =
719+
// GetValueOrThrow(XLATensor::Create(bias, device));
695720
// dev_output = tensor_methods::convolution_overrideable(
696721
// dev_input, dev_weight, dev_bias,
697722
// /*stride=*/{stride, stride + 1, stride + 1},

torch_xla/csrc/aten_xla_bridge.cpp

Lines changed: 5 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -186,8 +186,9 @@ XLATensorPtr GetOrCreateXlaTensor(const at::Tensor& tensor,
186186
}
187187

188188
auto xtensor = GetXlaTensor(tensor);
189-
return xtensor.ok() ? xtensor.value()
190-
: XLATensor::Create(inner_tensor, device);
189+
return xtensor.ok()
190+
? xtensor.value()
191+
: GetValueOrThrow(XLATensor::Create(inner_tensor, device));
191192
}
192193

193194
XLATensorPtr GetOrCreateXlaTensor(const std::optional<at::Tensor>& tensor,
@@ -478,7 +479,8 @@ at::Tensor CreateXlaTensor(
478479
at::Tensor tensor,
479480
const std::optional<torch::lazy::BackendDevice>& device) {
480481
if (tensor.defined() && device) {
481-
XLATensorPtr xla_tensor = XLATensor::Create(std::move(tensor), *device);
482+
XLATensorPtr xla_tensor =
483+
GetValueOrThrow(XLATensor::Create(std::move(tensor), *device));
482484
tensor = AtenFromXlaTensor(xla_tensor);
483485
}
484486
return tensor;

torch_xla/csrc/tensor.cpp

Lines changed: 10 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -61,9 +61,15 @@ bool CanApplySharding(const XLATensor::ShardingSpecPtr sharding) {
6161

6262
XLATensor::Data::~Data() { XLAGraphExecutor::Get()->UnregisterTensor(this); }
6363

64-
XLATensorPtr XLATensor::Create(const at::Tensor& tensor,
65-
const torch::lazy::BackendDevice& device) {
66-
XLA_CHECK_EQ(tensor.device().type(), at::kCPU);
64+
absl::StatusOr<absl_nonnull XLATensorPtr> XLATensor::Create(
65+
const at::Tensor& tensor, const torch::lazy::BackendDevice& device) {
66+
if (!tensor.is_cpu()) {
67+
return XLA_ERROR_WITH_LOCATION(absl::InvalidArgumentError(absl::StrCat(
68+
"Could not create an XLATensor out of the provided tensor. Expected "
69+
"tensor data to be on CPU. Got: ",
70+
c10::DeviceTypeName(tensor.device().type()),
71+
". Consider moving the tensor to CPU.")));
72+
}
6773
XLATensorPtr xtensor =
6874
c10::make_intrusive<XLATensor>(XLATensor(tensor, device));
6975
XLAGraphExecutor::Get()->RegisterTensor(xtensor->data());
@@ -621,7 +627,7 @@ std::vector<XLATensorPtr> XLATensor::MakeOutputTensors(
621627
XLATensorPtr XLATensor::CopyTensorToDevice(
622628
const torch::lazy::BackendDevice& device) {
623629
// TODO: This can be optimized via proper XRT/XLA computation.
624-
return Create(ToTensor(/*detached=*/true), device);
630+
return GetValueOrThrow(Create(ToTensor(/*detached=*/true), device));
625631
}
626632

627633
torch::lazy::Value XLATensor::MaybeCastIrValue(

torch_xla/csrc/tensor.h

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -9,6 +9,7 @@
99
#include <memory>
1010
#include <string>
1111

12+
#include "absl/base/nullability.h"
1213
#include "torch_xla/csrc/runtime/util.h"
1314
#include "torch_xla/csrc/view.h"
1415

@@ -149,8 +150,8 @@ class XLATensor : public torch::lazy::LazyTensor {
149150
bool is_cloned = false;
150151
};
151152

152-
static XLATensorPtr Create(const at::Tensor& tensor,
153-
const torch::lazy::BackendDevice& device);
153+
static absl::StatusOr<absl_nonnull XLATensorPtr> Create(
154+
const at::Tensor& tensor, const torch::lazy::BackendDevice& device);
154155
static XLATensorPtr Create(
155156
torch::lazy::BackendDataPtr handle,
156157
std::optional<at::ScalarType> logical_element_type = std::nullopt);

torch_xla/csrc/tensor_methods.cpp

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1336,8 +1336,9 @@ std::tuple<XLATensorPtr, XLATensorPtr> cummax(const XLATensorPtr& input,
13361336
at::Tensor val =
13371337
at::empty(shape_, at::TensorOptions().dtype(input->dtype()));
13381338
at::Tensor idx = at::empty(shape_, at::TensorOptions().dtype(at::kLong));
1339-
return std::make_tuple(input->Create(val, input->GetDevice()),
1340-
input->Create(idx, input->GetDevice()));
1339+
return std::make_tuple(
1340+
GetValueOrThrow(XLATensor::Create(val, input->GetDevice())),
1341+
GetValueOrThrow(XLATensor::Create(idx, input->GetDevice())));
13411342
}
13421343
torch::lazy::NodePtr node =
13431344
torch_xla::MakeNode<CumMax>(input->GetIrValue(), canonical_dim);

0 commit comments

Comments
 (0)