Add Jet Accelerator

terryheo · copybara-github · commit fda5ee989e81 · 2025-10-17T13:27:51.000-07:00
This is an experimental legacy TFLite Jet based GPU Accelerator.
It doesn't support GPU TensorBuffer binding like other GPU Accelerator but
uses CPU memory TensorBuffer.

Also added benchmark_jet, gpu_numerics_check_jet

LiteRT-PiperOrigin-RevId: 820808902
diff --git a/litert/cc/BUILD b/litert/cc/BUILD
@@ -602,6 +602,63 @@ litert_device_test(
 #     ],
 # )
 #
+# # Should use `--copt=-DCL_DELEGATE_NO_GL` to build for Desktop.
+# cc_test(
+#     name = "litert_compiled_model_jetgpu_test",
+#     srcs = [":litert_compiled_model_jetgpu_test.cc"],
+#     data = [
+#         "//litert/test:mlir_test_data",
+#         "//litert/test:tflite_test_data",
+#     ],
+#     tags = [
+#         "no_oss",
+#         "notap",
+#         "requires-gpu-nvidia",
+#     ],
+#     deps = [
+#         "@com_google_googletest//:gtest_main",
+#         "@com_google_absl//absl/container:flat_hash_map",
+#         "@com_google_absl//absl/debugging:leak_check",
+#         "@com_google_absl//absl/log:absl_log",
+#         "@com_google_absl//absl/strings:string_view",
+#         "@com_google_absl//absl/types:span",
+#         "//litert/c:litert_common",
+#         "//litert/c:litert_environment_options",
+#         "//litert/c:litert_event",
+#         "//litert/c:litert_event_type",
+#         "//litert/c:litert_profiler_event",
+#         "//litert/c:litert_tensor_buffer",
+#         "//litert/c:litert_tensor_buffer_types",
+#         "//litert/cc:litert_compiled_model",
+#         "//litert/cc:litert_element_type",
+#         "//litert/cc:litert_environment",
+#         "//litert/cc:litert_event",
+#         "//litert/cc:litert_expected",
+#         "//litert/cc:litert_layout",
+#         "//litert/cc:litert_macros",
+#         "//litert/cc:litert_model",
+#         "//litert/cc:litert_options",
+#         "//litert/cc:litert_profiler",
+#         "//litert/cc:litert_tensor_buffer",
+#         "//litert/cc/internal:litert_platform_support",
+#         "//litert/cc/options:litert_gpu_options",
+#         "//litert/cc/options:litert_runtime_options",
+#         "//litert/runtime/accelerators/gpu/google:jet_gpu_accelerator",  # buildcleaner: keep
+#         "//litert/test:common",
+#         "//litert/test:matchers",
+#         "//litert/test:simple_model",
+#         "@opencl_headers",
+#     ] + select({
+#         "@org_tensorflow//tensorflow:android": [
+#             "//tflite/delegates/gpu/cl:cl_device",
+#             "//tflite/delegates/gpu/cl:gl_interop",
+#             "//tflite/delegates/gpu/cl:opencl_wrapper",
+#             "//tflite/delegates/gpu/gl:egl_environment",
+#         ],
+#         "//conditions:default": [],
+#     }),
+# )
+#
 # copybara:uncomment_end
 
 cc_library(
diff --git a/litert/cc/litert_compiled_model_jetgpu_test.cc b/litert/cc/litert_compiled_model_jetgpu_test.cc
@@ -0,0 +1,131 @@
+// Copyright 2025 Google LLC.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//      http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include <cstring>
+#include <tuple>
+#include <utility>
+
+#include <gmock/gmock.h>
+#include <gtest/gtest.h>
+#include "absl/debugging/leak_check.h"  // from @com_google_absl
+#include "absl/log/absl_log.h"  // from @com_google_absl
+#include "absl/strings/string_view.h"  // from @com_google_absl
+#include "absl/types/span.h"  // from @com_google_absl
+#include "litert/c/litert_common.h"
+#include "litert/c/litert_tensor_buffer_types.h"
+#include "litert/cc/litert_compiled_model.h"
+#include "litert/cc/litert_environment.h"
+#include "litert/cc/litert_expected.h"
+#include "litert/cc/litert_macros.h"
+#include "litert/cc/litert_model.h"
+#include "litert/cc/litert_options.h"
+#include "litert/cc/litert_tensor_buffer.h"
+#include "litert/cc/options/litert_gpu_options.h"
+#include "litert/test/common.h"
+#include "litert/test/matchers.h"
+#include "litert/test/testdata/simple_model_test_vectors.h"
+
+using testing::FloatNear;
+using testing::Pointwise;
+
+namespace litert {
+namespace {
+
+using TestParams = std::tuple<LiteRtDelegatePrecision>;
+
+Expected<Options> CreateGpuOptions(const TestParams& params) {
+  LITERT_ASSIGN_OR_RETURN(auto gpu_options, GpuOptions::Create());
+  LITERT_RETURN_IF_ERROR(gpu_options.SetDelegatePrecision(std::get<0>(params)));
+
+  LITERT_ASSIGN_OR_RETURN(litert::Options options, Options::Create());
+  options.SetHardwareAccelerators(kLiteRtHwAcceleratorGpu);
+  options.AddOpaqueOptions(std::move(gpu_options));
+  return std::move(options);
+}
+
+class ParameterizedTest : public ::testing::TestWithParam<TestParams> {};
+
+TEST_P(ParameterizedTest, Basic) {
+  // To workaround the memory leak in Nvidia's driver
+  absl::LeakCheckDisabler disable_leak_check;
+
+  LITERT_ASSERT_OK_AND_ASSIGN(
+      auto model,
+      Model::CreateFromFile(testing::GetTestFilePath(kModelFileName)));
+
+  auto env = litert::Environment::Create({});
+  ASSERT_TRUE(env);
+
+  LITERT_ASSERT_OK_AND_ASSIGN(auto options, CreateGpuOptions(GetParam()));
+  LITERT_ASSERT_OK_AND_ASSIGN(auto compiled_model,
+                              CompiledModel::Create(*env, model, options));
+
+  LITERT_ASSERT_OK_AND_ASSIGN(auto signatures, model.GetSignatures());
+  EXPECT_EQ(signatures.size(), 1);
+
+  auto signature_key = signatures[0].Key();
+  EXPECT_EQ(signature_key, Model::DefaultSignatureKey());
+  size_t signature_index = 0;
+
+  LITERT_ASSERT_OK_AND_ASSIGN(
+      auto input_buffers, compiled_model.CreateInputBuffers(signature_index));
+
+  LITERT_ASSERT_OK_AND_ASSIGN(
+      auto output_buffers, compiled_model.CreateOutputBuffers(signature_index));
+
+  // Fill model inputs.
+  auto input_names = signatures[0].InputNames();
+  EXPECT_EQ(input_names.size(), 2);
+  EXPECT_EQ(input_names.at(0), "arg0");
+  EXPECT_EQ(input_names.at(1), "arg1");
+  LITERT_ASSERT_OK_AND_ASSIGN(auto buffer0_type, input_buffers[0].BufferType());
+  EXPECT_EQ(buffer0_type, kLiteRtTensorBufferTypeHostMemory);
+  ASSERT_TRUE(input_buffers[0].Write<float>(
+      absl::MakeConstSpan(kTestInput0Tensor, kTestInput0Size)));
+  LITERT_ASSERT_OK_AND_ASSIGN(auto buffer1_type, input_buffers[0].BufferType());
+  EXPECT_EQ(buffer1_type, kLiteRtTensorBufferTypeHostMemory);
+  ASSERT_TRUE(input_buffers[1].Write<float>(
+      absl::MakeConstSpan(kTestInput1Tensor, kTestInput1Size)));
+
+  // Execute model.
+  compiled_model.Run(signature_index, input_buffers, output_buffers);
+
+  // Check model output.
+  auto output_names = signatures[0].OutputNames();
+  EXPECT_EQ(output_names.size(), 1);
+  EXPECT_EQ(output_names.at(0), "tfl.add");
+  LITERT_ASSERT_OK_AND_ASSIGN(auto output_type, input_buffers[0].BufferType());
+  EXPECT_EQ(output_type, kLiteRtTensorBufferTypeHostMemory);
+  {
+    auto lock_and_addr = litert::TensorBufferScopedLock::Create<const float>(
+        output_buffers[0], TensorBuffer::LockMode::kRead);
+    ASSERT_TRUE(lock_and_addr);
+    auto output = absl::MakeSpan(lock_and_addr->second, kTestOutputSize);
+    for (auto i = 0; i < kTestOutputSize; ++i) {
+      ABSL_LOG(INFO) << "Result: " << output[i] << "\t" << kTestOutputTensor[i];
+    }
+    EXPECT_THAT(output, Pointwise(FloatNear(1e-5), kTestOutputTensor));
+  }
+}
+
+INSTANTIATE_TEST_SUITE_P(
+    CompiledModelWebGpuTest, ParameterizedTest,
+    ::testing::Combine(::testing::ValuesIn<LiteRtDelegatePrecision>({
+        kLiteRtDelegatePrecisionDefault,
+        kLiteRtDelegatePrecisionFp16,
+        kLiteRtDelegatePrecisionFp32,
+    })));
+
+}  // namespace
+}  // namespace litert
diff --git a/litert/tools/BUILD b/litert/tools/BUILD
@@ -534,6 +534,21 @@ cc_binary(
     ],
 )
 
+cc_binary(
+    name = "gpu_numerics_check_jet",
+    srcs = ["gpu_numerics_check.cc"],
+    tags = [
+        "notap",
+        "requires-gpu-nvidia",
+    ],
+    deps = NUMERICS_CHECK_DEPS + [
+        "//litert/cc/options:litert_gpu_options",
+        # copybara:uncomment_begin(google-only)
+        # "//litert/runtime/accelerators/gpu/google:jet_gpu_accelerator",  # buildcleaner: keep
+        # copybara:uncomment_end
+    ],
+)
+
 cc_binary(
     name = "analyze_model_main",
     srcs = ["analyze_model_main.cc"],
@@ -593,6 +608,20 @@ cc_binary(
     ],
 )
 
+cc_binary(
+    name = "benchmark_model_jet",
+    tags = [
+        "notap",
+        "requires-gpu-nvidia",
+    ],
+    deps = [
+        ":benchmark_model_main",
+        # copybara:uncomment_begin(google-only)
+        # "//litert/runtime/accelerators/gpu/google:jet_gpu_accelerator",  # buildcleaner: keep
+        # copybara:uncomment_end
+    ],
+)
+
 cc_library(
     name = "benchmark_stripped_litert_model",
     srcs = ["benchmark_stripped_litert_model.cc"],