Skip to content

Commit 73f19aa

Browse files
committed
Update on "gemma3 e2e runner on cuda"
This diff introduces an e2e runner for the gemma3 model on CUDA that delegates using the AOTI library and is guarded by CI. It also includes other necessary infrastructure updates for building and running the `gemma3 e2e runner` on CUDA devices. Differential Revision: [D85087532](https://our.internmc.facebook.com/intern/diff/D85087532/) [ghstack-poisoned]
2 parents 7f80aa0 + 1777ee8 commit 73f19aa

File tree

2 files changed

+6
-2
lines changed

2 files changed

+6
-2
lines changed

examples/models/gemma3/CMakeLists.txt

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -117,6 +117,8 @@ if(NOT CMAKE_BUILD_TYPE STREQUAL "Debug")
117117
endif()
118118
endif()
119119

120-
target_include_directories(gemma3_e2e_runner PUBLIC ${_common_include_directories})
120+
target_include_directories(
121+
gemma3_e2e_runner PUBLIC ${_common_include_directories}
122+
)
121123
target_link_libraries(gemma3_e2e_runner PUBLIC ${link_libraries})
122124
target_compile_options(gemma3_e2e_runner PUBLIC ${_common_compile_options})

extension/llm/runner/multimodal_prefiller.cpp

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -94,7 +94,9 @@ Result<uint64_t> MultimodalPrefiller::prefill(
9494
if (expected_dtype == ::executorch::aten::ScalarType::BFloat16) {
9595
// Convert to bfloat16 for model input
9696
auto image_tensor_return = convert_to_bfloat16(image_tensor);
97-
ET_CHECK_OK_OR_RETURN_ERROR(image_tensor_return.error(), "Failed to convert image tensor to bfloat16");
97+
ET_CHECK_OK_OR_RETURN_ERROR(
98+
image_tensor_return.error(),
99+
"Failed to convert image tensor to bfloat16");
98100
image_tensor = image_tensor_return.get();
99101
}
100102

0 commit comments

Comments
 (0)