From 0eab110fe2e4b3017c25c67a43b87952f45c31da Mon Sep 17 00:00:00 2001 From: Gilad S Date: Tue, 29 Jul 2025 03:48:28 +0300 Subject: [PATCH 1/2] build: update CUDA version in the CI --- .github/workflows/build.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml index 32605a11..61107652 100644 --- a/.github/workflows/build.yml +++ b/.github/workflows/build.yml @@ -113,7 +113,7 @@ jobs: if: matrix.config.name == 'Windows for x64' uses: Jimver/cuda-toolkit@v0.2.15 with: - cuda: '12.2.0' + cuda: '12.4.0' method: 'network' sub-packages: '["nvcc", "cudart", "cublas", "cublas_dev", "thrust", "visual_studio_integration"]' use-local-cache: false @@ -122,7 +122,7 @@ jobs: if: matrix.config.name == 'Ubuntu' uses: Jimver/cuda-toolkit@v0.2.15 with: - cuda: '12.2.0' + cuda: '12.4.0' method: 'network' - name: Install Vulkan SDK on Windows for x64 From b399d5294a26ca10ae02f2d61c9a598a1c9a4f84 Mon Sep 17 00:00:00 2001 From: Gilad S Date: Tue, 29 Jul 2025 03:48:48 +0300 Subject: [PATCH 2/2] fix: add missing GGUF types --- src/gguf/types/GgufMetadataTypes.ts | 10 ++++++++-- 1 file changed, 8 insertions(+), 2 deletions(-) diff --git a/src/gguf/types/GgufMetadataTypes.ts b/src/gguf/types/GgufMetadataTypes.ts index 5f8a48e1..85a67a93 100644 --- a/src/gguf/types/GgufMetadataTypes.ts +++ b/src/gguf/types/GgufMetadataTypes.ts @@ -35,6 +35,7 @@ export const enum GgufArchitectureType { gemma = "gemma", gemma2 = "gemma2", gemma3 = "gemma3", + gemma3n = "gemma3n", starcoder2 = "starcoder2", mamba = "mamba", xverse = "xverse", @@ -56,6 +57,7 @@ export const enum GgufArchitectureType { jais = "jais", nemotron = "nemotron", exaone = "exaone", + exaone4 = "exaone4", rwkv6 = "rwkv6", rwkv6qwen2 = "rwkv6qwen2", rwkv7 = "rwkv7", @@ -66,6 +68,10 @@ export const enum GgufArchitectureType { wavtokenizerDec = "wavtokenizer-dec", plm = "plm", bailingmoe = "bailingmoe", + dots1 = "dots1", + arcee = "arcee", + ernie4_5 = "ernie4_5", + clip = "clip", unknown = "(unknown)" } @@ -244,8 +250,8 @@ export type GgufMetadataTokenizer = { readonly pre?: "default" | "llama3" | "llama-v3" | "llama-bpe" | "deepseek-llm" | "deepseek-coder" | "falcon" | "falcon3" | "pixtral" | "mpt" | "starcoder" | "gpt-2" | "phi-2" | "jina-es" | "jina-de" | "jina-v1-en" | "jina-v2-es" | "jina-v2-de" | "jina-v2-code" | "refact" | "command-r" | "qwen2" | "stablelm2" | "olmo" | "dbrx" | "smaug-bpe" | "poro-chat" | "chatglm-bpe" | - "viking" | "jais" | "tekken" | "smollm" | "codeshell" | "bloom" | "gpt3-finnish" | "exaone" | "chameleon" | "minerva-7b" | - "megrez" | "gpt-4o" | "superbpe" | "trillion" | "bailingmoe" | string, + "viking" | "jais" | "tekken" | "smollm" | "codeshell" | "bloom" | "gpt3-finnish" | "exaone" | "exaone4" | "chameleon" | + "minerva-7b" | "megrez" | "gpt-4o" | "superbpe" | "trillion" | "bailingmoe" | string, readonly tokens: readonly string[], readonly token_type: GgufMetadataTokenizerTokenType[], readonly token_type_count?: number,