Update on "Reuse GELU implementation from PyTorch core"

swolchok · swolchok · commit 03a87cc101b0 · 2025-01-15T11:15:19.000-08:00
kernels/optimized doesn't need to support embedded systems, so it can just take a header-only dep on PyTorch. Note that, because we will pick up Sleef internally and ignore it externally thanks to ATen vec, this PR gets to enable optimized GELU in OSS. Testing: CI to make sure this doesn't break mobile build modes; happy to take advice on anything not currently covered that might break. Differential Revision: [D66335522](https://our.internmc.facebook.com/intern/diff/D66335522/) [ghstack-poisoned]
diff --git a/build/Utils.cmake b/build/Utils.cmake
@@ -321,3 +321,26 @@ function(resolve_python_executable)
     )
   endif()
 endfunction()
+
+# find_package(Torch CONFIG REQUIRED) replacement for targets that
+# have a header-only Torch dependency. Because find_package sets its
+# result variables (e.g. TORCH_INCLUDE_DIRS) in the calling scope, we
+# use a macro to preserve this rather than maintaining our own list of
+# those variables.
+#
+# Takes no arguments. Temporarily forces
+# CMAKE_FIND_ROOT_PATH_MODE_PACKAGE to BOTH around the find_package
+# call, then restores the caller's previous value.
+macro(find_package_torch_headers)
+  # We cannot simply use CMAKE_FIND_ROOT_PATH_BOTH, because that does
+  # not propagate into TorchConfig.cmake.
+  set(OLD_CMAKE_FIND_ROOT_PATH_MODE_PACKAGE ${CMAKE_FIND_ROOT_PATH_MODE_PACKAGE})
+  set(CMAKE_FIND_ROOT_PATH_MODE_PACKAGE BOTH)
+  find_package(Torch CONFIG REQUIRED)
+  # If the mode was previously unset, this expands to set(<var>) with no
+  # value, which unsets it again.
+  set(CMAKE_FIND_ROOT_PATH_MODE_PACKAGE ${OLD_CMAKE_FIND_ROOT_PATH_MODE_PACKAGE})
+  # A macro shares the caller's scope, so drop the temporary rather than
+  # leaking it.
+  unset(OLD_CMAKE_FIND_ROOT_PATH_MODE_PACKAGE)
+endmacro()
diff --git a/kernels/optimized/CMakeLists.txt b/kernels/optimized/CMakeLists.txt
@@ -63,14 +63,7 @@ message("Generated files ${gen_command_sources}")
 
 list(TRANSFORM _optimized_kernels__srcs PREPEND "${EXECUTORCH_ROOT}/")
 add_library(optimized_kernels ${_optimized_kernels__srcs})
-# We require Torch headers, which setup.py puts in CMAKE_PREFIX_PATH
-# for us. Toolchains that we might be using for cross-compiling could
-# set CMAKE_FIND_ROOT_PATH, which prevents find_package from finding
-# headers not rooted under CMAKE_FIND_ROOT_PATH. This is reasonable
-# for binary dependencies because they probably aren't built for the
-# target platform, but for our header-only use case, we should just
-# ignore CMAKE_FIND_ROOT_PATH.
-find_package(Torch CONFIG REQUIRED NO_CMAKE_FIND_ROOT_PATH)
+find_package_torch_headers()
 target_include_directories(optimized_kernels PRIVATE ${TORCH_INCLUDE_DIRS})
 target_link_libraries(
   optimized_kernels PRIVATE executorch_core cpublas extension_threadpool