Commit 10ed554

ErrorHandling: make GetComputationClient() return StatusOr<T> type. (#9384)
1 parent a36d3e5 commit 10ed554

22 files changed: +260 -179 lines
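
For reference, the runtime now exposes three accessors instead of the single fail-fast GetComputationClient(). The declarations below are a minimal sketch reconstructed from this diff and the new test; the use of absl::StatusOr as the status type is an assumption, not confirmed by this page:

namespace torch_xla::runtime {

// Returns the client, or an error status if initialization failed.
// (Assumed return type: absl::StatusOr<ComputationClient*>.)
absl::StatusOr<ComputationClient*> GetComputationClient();

// Returns the client, aborting the process on initialization failure.
// Existing call sites in this commit are migrated to this variant.
ComputationClient* GetComputationClientOrDie();

// Returns the client only if it is already initialized, else nullptr;
// per the new test, this never triggers initialization itself.
ComputationClient* GetComputationClientIfInitialized();

}  // namespace torch_xla::runtime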

.github/scripts/run_tests.sh

Lines changed: 1 addition & 0 deletions

@@ -53,6 +53,7 @@ function run_torch_xla_cpp_tests() {
       "test_lazy"
       "test_replication"
       "test_tensor"
+      "test_runtime"
       # disable test_xla_backend_intf since it is flaky on upstream
       #"test_xla_backend_intf"
       "test_xla_sharding")

BUILD

Lines changed: 1 addition & 0 deletions

@@ -77,6 +77,7 @@ test_suite(
         "//test/cpp:test_replication",
         "//test/cpp:test_tensor",
         "//test/cpp:test_xla_sharding",
+        "//test/cpp:test_runtime",
         "//torch_xla/csrc/runtime:pjrt_computation_client_test",
         # "//torch_xla/csrc/runtime:ifrt_computation_client_test",
     ],

test/cpp/BUILD

Lines changed: 9 additions & 0 deletions

@@ -149,3 +149,12 @@ ptxla_cc_test(
     )
     for test in glob(["test_aten_xla_tensor*cpp"])
 ]
+
+ptxla_cc_test(
+    name = "test_runtime",
+    srcs = ["test_runtime.cpp"],
+    deps = [
+        "//torch_xla/csrc/runtime:runtime",
+        "@com_google_googletest//:gtest_main",
+    ],
+)

test/cpp/cpp_test_util.cpp

Lines changed: 6 additions & 6 deletions

@@ -225,14 +225,14 @@ void WithAllDevices(
   std::vector<torch::lazy::BackendDevice> devices;
   std::vector<torch::lazy::BackendDevice> all_devices;
   for (const auto& device_str :
-       torch_xla::runtime::GetComputationClient()->GetLocalDevices()) {
+       torch_xla::runtime::GetComputationClientOrDie()->GetLocalDevices()) {
     torch::lazy::BackendDevice device = ParseDeviceString(device_str);
     if (device.type() == device_type.type) {
       devices.push_back(device);
     }
   }
   for (const auto& device_str :
-       torch_xla::runtime::GetComputationClient()->GetAllDevices()) {
+       torch_xla::runtime::GetComputationClientOrDie()->GetAllDevices()) {
     torch::lazy::BackendDevice device = ParseDeviceString(device_str);
     if (device.type() == device_type.type) {
       all_devices.push_back(device);
@@ -283,17 +283,17 @@ std::vector<torch_xla::runtime::ComputationClient::DataPtr> Execute(
   std::vector<torch_xla::runtime::ComputationClient::CompileInstance> instances;
   instances.push_back(
       {std::move(computation), device.toString(),
-       torch_xla::runtime::GetComputationClient()->GetCompilationDevices(
+       torch_xla::runtime::GetComputationClientOrDie()->GetCompilationDevices(
            device.toString(), {}),
        &shape});
 
   std::vector<
       std::shared_ptr<torch_xla::runtime::ComputationClient::Computation>>
-      computations = torch_xla::runtime::GetComputationClient()->Compile(
+      computations = torch_xla::runtime::GetComputationClientOrDie()->Compile(
           std::move(instances));
 
   torch_xla::runtime::ComputationClient::ExecuteComputationOptions options;
-  return torch_xla::runtime::GetComputationClient()->ExecuteComputation(
+  return torch_xla::runtime::GetComputationClientOrDie()->ExecuteComputation(
       *computations.front(), UnwrapXlaData(lowering_ctx.GetParametersData()),
       device.toString(), options);
 }
@@ -302,7 +302,7 @@ std::vector<at::Tensor> Fetch(
     absl::Span<const torch_xla::runtime::ComputationClient::DataPtr>
         device_data) {
   std::vector<xla::Literal> literals =
-      torch_xla::runtime::GetComputationClient()->TransferFromDevice(
+      torch_xla::runtime::GetComputationClientOrDie()->TransferFromDevice(
          device_data);
   std::vector<at::Tensor> tensors;
   for (auto& literal : literals) {

test/cpp/run_tests.sh

Lines changed: 2 additions & 1 deletion

@@ -99,7 +99,8 @@ if [[ "$RUN_CPP_TESTS" == "cpp_tests" ]]; then
       "test_tensor"
       # disable test_xla_backend_intf since it is flaky on upstream
       #"test_xla_backend_intf"
-      "test_xla_sharding")
+      "test_xla_sharding"
+      "test_runtime")
 fi
 for name in "${test_names[@]}"; do
   echo "Running $name cpp test..."

test/cpp/test_replication.cpp

Lines changed: 3 additions & 3 deletions

@@ -48,7 +48,7 @@ void TestSingleReplication(
   }
   std::vector<torch_xla::runtime::ComputationClient::ComputationPtr>
       compiled_computations =
-          torch_xla::runtime::GetComputationClient()->Compile(
+          torch_xla::runtime::GetComputationClientOrDie()->Compile(
              std::move(instances));
 
   std::vector<at::Tensor> tensors;
@@ -65,7 +65,7 @@ void TestSingleReplication(
   for (size_t i = 0; i < device_strings.size(); ++i) {
     auto executor = [&, i]() {
       results[i] =
-          torch_xla::runtime::GetComputationClient()->ExecuteComputation(
+          torch_xla::runtime::GetComputationClientOrDie()->ExecuteComputation(
              *compiled_computations[i],
              {std::dynamic_pointer_cast<
                  torch_xla::runtime::ComputationClient::Data>(
@@ -79,7 +79,7 @@ void TestSingleReplication(
 
   for (size_t i = 0; i < results.size(); ++i) {
     std::vector<xla::Literal> literals =
-        torch_xla::runtime::GetComputationClient()->TransferFromDevice(
+        torch_xla::runtime::GetComputationClientOrDie()->TransferFromDevice(
            results[i]);
     ASSERT_EQ(literals.size(), 1);
 

test/cpp/test_runtime.cpp

Lines changed: 26 additions & 0 deletions

@@ -0,0 +1,26 @@
+#include <gtest/gtest.h>
+
+#include "torch_xla/csrc/runtime/runtime.h"
+
+namespace torch_xla::runtime {
+
+TEST(RuntimeTest, ComputationClientInitialization) {
+  ComputationClient* client;
+
+  client = GetComputationClientIfInitialized();
+  EXPECT_EQ(client, nullptr);
+
+  // Initialize the ComputationClient.
+  // Check all the APIs return the same valid ComputationClient.
+
+  client = GetComputationClientOrDie();
+  ASSERT_NE(client, nullptr);
+
+  auto status = GetComputationClient();
+  ASSERT_TRUE(status.ok());
+
+  EXPECT_EQ(status.value(), client);
+  EXPECT_EQ(GetComputationClientIfInitialized(), client);
+}
+
+}  // namespace torch_xla::runtime
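
For callers that prefer to surface the error rather than crash, the StatusOr return of GetComputationClient() supports the usual propagation pattern. The sketch below is hypothetical (the function name TransferToServer and the absl::Status plumbing are illustrative, not part of this commit):

absl::Status TransferToServer(/* ... */) {
  // Propagate an initialization failure to the caller instead of aborting,
  // which is what GetComputationClientOrDie() would do.
  auto client_or = torch_xla::runtime::GetComputationClient();
  if (!client_or.ok()) {
    return client_or.status();
  }
  torch_xla::runtime::ComputationClient* client = client_or.value();
  // ... use `client` as before ...
  return absl::OkStatus();
}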

test/cpp/test_xla_sharding.cpp

Lines changed: 8 additions & 7 deletions

@@ -332,14 +332,15 @@ TEST_F(XLAShardingTest, CreateTensorsData) {
       CreateTensorsData(tensors, shardings, devices);
 
   int64_t n_devices =
-      torch_xla::runtime::GetComputationClient()->GetLocalDevices().size();
+      torch_xla::runtime::GetComputationClientOrDie()->GetLocalDevices().size();
   if (n_devices > 1) {
     // null sharding is treated as replicated.
     auto xla_data =
         std::dynamic_pointer_cast<torch_xla::runtime::ComputationClient::Data>(
             tensors_data[0]);
     std::vector<torch_xla::runtime::ComputationClient::DataPtr> shards =
-        torch_xla::runtime::GetComputationClient()->GetDataShards(xla_data);
+        torch_xla::runtime::GetComputationClientOrDie()->GetDataShards(
+            xla_data);
     EXPECT_EQ(shards.size(), n_devices);
     EXPECT_TRUE(xla::Shape::Equal().IgnoreLayout()(xla_data->shape(),
                                                    shards[0]->shape()));
@@ -349,7 +350,7 @@ TEST_F(XLAShardingTest, CreateTensorsData) {
     auto sharded_xla_data =
         std::dynamic_pointer_cast<torch_xla::runtime::ComputationClient::Data>(
            tensors_data[1]);
-    shards = torch_xla::runtime::GetComputationClient()->GetDataShards(
+    shards = torch_xla::runtime::GetComputationClientOrDie()->GetDataShards(
        sharded_xla_data);
     EXPECT_EQ(shards.size(), n_devices);
     EXPECT_TRUE(xla::Shape::Equal().IgnoreLayout()(sharded_xla_data->shape(),
@@ -360,7 +361,7 @@ TEST_F(XLAShardingTest, CreateTensorsData) {
     sharded_xla_data =
         std::dynamic_pointer_cast<torch_xla::runtime::ComputationClient::Data>(
            tensors_data[2]);
-    shards = torch_xla::runtime::GetComputationClient()->GetDataShards(
+    shards = torch_xla::runtime::GetComputationClientOrDie()->GetDataShards(
        sharded_xla_data);
     EXPECT_EQ(shards.size(), n_devices);
     EXPECT_TRUE(xla::Shape::Equal().IgnoreLayout()(sharded_xla_data->shape(),
@@ -372,7 +373,7 @@
 TEST_F(XLAShardingTest, PrepareOutputShardingPropagation) {
   xla::Shape shape = xla::ShapeUtil::MakeShape(xla::PrimitiveType::F32, {4, 4});
   int64_t n_devices =
-      torch_xla::runtime::GetComputationClient()->GetLocalDevices().size();
+      torch_xla::runtime::GetComputationClientOrDie()->GetLocalDevices().size();
   xla::Array<int64_t> tile_assignment({1, n_devices});
   tile_assignment.FillIota(0);
   xla::OpSharding tiled = xla::HloSharding::Tile(tile_assignment).ToProto();
@@ -395,15 +396,15 @@
 
   std::vector<
       std::shared_ptr<torch_xla::runtime::ComputationClient::Computation>>
-      computations = torch_xla::runtime::GetComputationClient()->Compile(
+      computations = torch_xla::runtime::GetComputationClientOrDie()->Compile(
          std::move(instances));
   torch_xla::runtime::ComputationClient::ComputationPtr computation =
       std::make_shared<torch_xla::runtime::ComputationClient::Computation>(
          "add", std::move(computations[0]->move_computation()));
 
   // Prepare output sharding propagation, expect a sharded output placeholder.
   std::vector<XLATensorPtr> tensors{XLATensor::Create(
-      torch_xla::runtime::GetComputationClient()->CreateDataPlaceholder(
+      torch_xla::runtime::GetComputationClientOrDie()->CreateDataPlaceholder(
          bridge::GetDefaultDevice()->toString(), std::move(shape)))};
   std::vector<torch::lazy::BackendDataPtr> data_placeholders;
   std::vector<XLATensor::ShardingSpecPtr> sharding_specs;

torch_xla/csrc/aten_fallback.cpp

Lines changed: 1 addition & 1 deletion

@@ -77,7 +77,7 @@ bool UseOpenXLAFallbackOnCUDA(const c10::OperatorHandle& op) {
   // support running OpenXLA fallback operations on CUDA if the current
   // PyTorch/XLA DeviceType is not CUDA.
   bool device_is_cuda =
-      runtime::GetComputationClient()->GetDeviceType().getType() ==
+      runtime::GetComputationClientOrDie()->GetDeviceType().getType() ==
       XlaDeviceType::CUDA;
 
   // 3. PyTorch must have been compiled with CUDA support. Otherwise, our

torch_xla/csrc/aten_xla_bridge.cpp

Lines changed: 4 additions & 3 deletions

@@ -56,7 +56,7 @@ class AtenXlaDeviceMapper {
       devices_ordinals_[devices_.back()] = 0;
     } else {
       for (auto& device_str :
-           torch_xla::runtime::GetComputationClient()->GetLocalDevices()) {
+           torch_xla::runtime::GetComputationClientOrDie()->GetLocalDevices()) {
         devices_.emplace_back(ParseDeviceString(device_str));
         devices_ordinals_[devices_.back()] = devices_.size() - 1;
       }
@@ -366,8 +366,9 @@ std::string ToXlaString(const c10::Device& device) {
 
 const torch::lazy::BackendDevice* GetDefaultDevice() {
   static std::string default_device_spec =
-      UseVirtualDevice() ? "SPMD:0"
-                         : runtime::GetComputationClient()->GetDefaultDevice();
+      UseVirtualDevice()
+          ? "SPMD:0"
+          : runtime::GetComputationClientOrDie()->GetDefaultDevice();
   XLA_CHECK(!default_device_spec.empty());
   static const torch::lazy::BackendDevice default_device =
       ParseDeviceString(default_device_spec);
