Schlep in Chromium Zlib

jart · jart · commit 2232b0ef49ee · 2024-08-18T09:21:35.000-07:00
Now that ggml-rocm.dll is 200mb we need a faster DEFLATE algorithm so it
gets self-extracted faster. This is provided by Cosmo Libc which favors
using Mark Adler's Puff library by default which saves 40kb of code size
diff --git a/llamafile/cuda.c b/llamafile/cuda.c
@@ -51,6 +51,11 @@ __static_yoink("llama.cpp/ggml-common.h");
 __static_yoink("llama.cpp/ggml-backend.h");
 __static_yoink("llama.cpp/ggml-backend-impl.h");
 
+// yoink the fastest zlib inflate (DEFLATE decompression) impl from cosmo libc
+__static_yoink("_Cz_inflateInit2");
+__static_yoink("_Cz_inflate");
+__static_yoink("_Cz_inflateEnd");
+
 #define THESTRING(x) #x
 #define STRINGIFY(x) THESTRING(x)
 #define ARMS_ONLY(x) (!IsAarch64() ? "-DIGNORE" STRINGIFY(__COUNTER__) : x)