From 0eab110fe2e4b3017c25c67a43b87952f45c31da Mon Sep 17 00:00:00 2001
From: Gilad S <giladgd@gmail.com>
Date: Tue, 29 Jul 2025 03:48:28 +0300
Subject: [PATCH 1/2] build: update CUDA version in the CI

---
 .github/workflows/build.yml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml
index 32605a11..61107652 100644
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@@ -113,7 +113,7 @@ jobs:
         if: matrix.config.name == 'Windows for x64'
         uses: Jimver/cuda-toolkit@v0.2.15
         with:
-          cuda: '12.2.0'
+          cuda: '12.4.0'
           method: 'network'
           sub-packages: '["nvcc", "cudart", "cublas", "cublas_dev", "thrust", "visual_studio_integration"]'
           use-local-cache: false
@@ -122,7 +122,7 @@ jobs:
         if: matrix.config.name == 'Ubuntu'
         uses: Jimver/cuda-toolkit@v0.2.15
         with:
-          cuda: '12.2.0'
+          cuda: '12.4.0'
           method: 'network'
 
       - name: Install Vulkan SDK on Windows for x64

From b399d5294a26ca10ae02f2d61c9a598a1c9a4f84 Mon Sep 17 00:00:00 2001
From: Gilad S <giladgd@gmail.com>
Date: Tue, 29 Jul 2025 03:48:48 +0300
Subject: [PATCH 2/2] fix: add missing GGUF types

---
 src/gguf/types/GgufMetadataTypes.ts | 10 ++++++++--
 1 file changed, 8 insertions(+), 2 deletions(-)

diff --git a/src/gguf/types/GgufMetadataTypes.ts b/src/gguf/types/GgufMetadataTypes.ts
index 5f8a48e1..85a67a93 100644
--- a/src/gguf/types/GgufMetadataTypes.ts
+++ b/src/gguf/types/GgufMetadataTypes.ts
@@ -35,6 +35,7 @@ export const enum GgufArchitectureType {
     gemma = "gemma",
     gemma2 = "gemma2",
     gemma3 = "gemma3",
+    gemma3n = "gemma3n",
     starcoder2 = "starcoder2",
     mamba = "mamba",
     xverse = "xverse",
@@ -56,6 +57,7 @@ export const enum GgufArchitectureType {
     jais = "jais",
     nemotron = "nemotron",
     exaone = "exaone",
+    exaone4 = "exaone4",
     rwkv6 = "rwkv6",
     rwkv6qwen2 = "rwkv6qwen2",
     rwkv7 = "rwkv7",
@@ -66,6 +68,10 @@ export const enum GgufArchitectureType {
     wavtokenizerDec = "wavtokenizer-dec",
     plm = "plm",
     bailingmoe = "bailingmoe",
+    dots1 = "dots1",
+    arcee = "arcee",
+    ernie4_5 = "ernie4_5",
+    clip = "clip",
     unknown = "(unknown)"
 }
 
@@ -244,8 +250,8 @@ export type GgufMetadataTokenizer = {
         readonly pre?: "default" | "llama3" | "llama-v3" | "llama-bpe" | "deepseek-llm" | "deepseek-coder" | "falcon" | "falcon3" |
             "pixtral" | "mpt" | "starcoder" | "gpt-2" | "phi-2" | "jina-es" | "jina-de" | "jina-v1-en" | "jina-v2-es" | "jina-v2-de" |
             "jina-v2-code" | "refact" | "command-r" | "qwen2" | "stablelm2" | "olmo" | "dbrx" | "smaug-bpe" | "poro-chat" | "chatglm-bpe" |
-            "viking" | "jais" | "tekken" | "smollm" | "codeshell" | "bloom" | "gpt3-finnish" | "exaone" | "chameleon" | "minerva-7b" |
-            "megrez" | "gpt-4o" | "superbpe" | "trillion" | "bailingmoe" | string,
+            "viking" | "jais" | "tekken" | "smollm" | "codeshell" | "bloom" | "gpt3-finnish" | "exaone" | "exaone4" | "chameleon" |
+            "minerva-7b" | "megrez" | "gpt-4o" | "superbpe" | "trillion" | "bailingmoe" | string,
         readonly tokens: readonly string[],
         readonly token_type: GgufMetadataTokenizerTokenType[],
         readonly token_type_count?: number,