From e50b41ed77271f4eb657c4b38732cd59f0337c4a Mon Sep 17 00:00:00 2001
From: Anthony DePasquale <anthony@depasquale.org>
Date: Sat, 27 Dec 2025 16:49:52 +0100
Subject: [PATCH 1/6] Add revision option to embedding model ID

---
 Libraries/MLXEmbedders/Load.swift   |  5 +++--
 Libraries/MLXEmbedders/Models.swift | 10 +++++-----
 2 files changed, 8 insertions(+), 7 deletions(-)

diff --git a/Libraries/MLXEmbedders/Load.swift b/Libraries/MLXEmbedders/Load.swift
index 9e4955ce..4e1adbe5 100644
--- a/Libraries/MLXEmbedders/Load.swift
+++ b/Libraries/MLXEmbedders/Load.swift
@@ -87,11 +87,12 @@ func prepareModelDirectory(
 ) async throws -> URL {
     do {
         switch configuration.id {
-        case .id(let id):
+        case .id(let id, let revision):
             let repo = Hub.Repo(id: id)
             let modelFiles = ["*.safetensors", "config.json", "*/config.json"]
             return try await hub.snapshot(
-                from: repo, matching: modelFiles, progressHandler: progressHandler)
+                from: repo, revision: revision, matching: modelFiles,
+                progressHandler: progressHandler)
 
         case .directory(let directory):
             return directory
diff --git a/Libraries/MLXEmbedders/Models.swift b/Libraries/MLXEmbedders/Models.swift
index ac954b94..6cf1fe1e 100644
--- a/Libraries/MLXEmbedders/Models.swift
+++ b/Libraries/MLXEmbedders/Models.swift
@@ -22,7 +22,7 @@ public struct ModelConfiguration: Sendable {
     /// The backing storage for the model's location.
     public enum Identifier: Sendable {
         /// A Hugging Face Hub repository identifier (e.g., "BAAI/bge-small-en-v1.5").
-        case id(String)
+        case id(String, revision: String = "main")
         /// A file system URL pointing to a local model directory.
         case directory(URL)
     }
@@ -36,7 +36,7 @@ public struct ModelConfiguration: Sendable {
     /// it returns a path-based name (e.g., "ParentDir/ModelDir").
     public var name: String {
         switch id {
-        case .id(let string):
+        case .id(let string, _):
             string
         case .directory(let url):
             url.deletingLastPathComponent().lastPathComponent + "/" + url.lastPathComponent
@@ -60,11 +60,11 @@ public struct ModelConfiguration: Sendable {
     ///   - tokenizerId: Optional alternate repo for the tokenizer.
     ///   - overrideTokenizer: Optional specific tokenizer implementation name.
     public init(
-        id: String,
+        id: String, revision: String = "main",
         tokenizerId: String? = nil,
         overrideTokenizer: String? = nil
     ) {
-        self.id = .id(id)
+        self.id = .id(id, revision: revision)
         self.tokenizerId = tokenizerId
         self.overrideTokenizer = overrideTokenizer
     }
@@ -90,7 +90,7 @@ public struct ModelConfiguration: Sendable {
     /// - Returns: A `URL` pointing to the local directory.
     public func modelDirectory(hub: HubApi = HubApi()) -> URL {
         switch id {
-        case .id(let id):
+        case .id(let id, _):
             let repo = Hub.Repo(id: id)
             return hub.localRepoLocation(repo)
 

From 6909ad92b3af650c3c46ecc6bea66ccdb9f28c7d Mon Sep 17 00:00:00 2001
From: Anthony DePasquale <anthony@depasquale.org>
Date: Sat, 27 Dec 2025 16:28:55 +0100
Subject: [PATCH 2/6] Use `AutoTokenizer.from()` for faster tokenizer loading

---
 Libraries/MLXEmbedders/EmbeddingModel.swift | 10 +--
 Libraries/MLXEmbedders/Tokenizer.swift      | 66 ++----------------
 Libraries/MLXLMCommon/Tokenizer.swift       | 74 +++++++--------------
 3 files changed, 32 insertions(+), 118 deletions(-)

diff --git a/Libraries/MLXEmbedders/EmbeddingModel.swift b/Libraries/MLXEmbedders/EmbeddingModel.swift
index 3c7037b7..9c41e6f5 100644
--- a/Libraries/MLXEmbedders/EmbeddingModel.swift
+++ b/Libraries/MLXEmbedders/EmbeddingModel.swift
@@ -50,17 +50,11 @@ public actor ModelContainer {
         modelDirectory: URL,
         configuration: ModelConfiguration
     ) async throws {
-        // Load tokenizer config and model in parallel using async let.
-        async let tokenizerConfigTask = loadTokenizerConfig(
-            configuration: configuration, hub: hub)
-
+        async let tokenizerTask = loadTokenizer(configuration: configuration, hub: hub)
         self.model = try loadSynchronous(
             modelDirectory: modelDirectory, modelName: configuration.name)
         self.pooler = loadPooling(modelDirectory: modelDirectory)
-
-        let (tokenizerConfig, tokenizerData) = try await tokenizerConfigTask
-        self.tokenizer = try PreTrainedTokenizer(
-            tokenizerConfig: tokenizerConfig, tokenizerData: tokenizerData)
+        self.tokenizer = try await tokenizerTask
     }
 
     /// Perform an action on the model and/or tokenizer. Callers _must_ eval any `MLXArray` before returning as
diff --git a/Libraries/MLXEmbedders/Tokenizer.swift b/Libraries/MLXEmbedders/Tokenizer.swift
index e7300f22..ace094b9 100644
--- a/Libraries/MLXEmbedders/Tokenizer.swift
+++ b/Libraries/MLXEmbedders/Tokenizer.swift
@@ -18,66 +18,14 @@ import Tokenizers
 ///   or standard network/parsing errors.
 public func loadTokenizer(configuration: ModelConfiguration, hub: HubApi) async throws -> Tokenizer
 {
-    let (tokenizerConfig, tokenizerData) = try await loadTokenizerConfig(
-        configuration: configuration, hub: hub)
-
-    return try PreTrainedTokenizer(
-        tokenizerConfig: tokenizerConfig, tokenizerData: tokenizerData)
-}
-
-/// Retrieves the raw configuration and data files required to build a tokenizer.
-///
-/// This internal helper handles the logic of determining where to fetch files from.
-/// It includes a robust fallback: if a network request fails due to lack of internet
-/// connectivity, it attempts to load the files from the local model directory.
-///
-/// - Parameters:
-///   - configuration: The model configuration providing the `tokenizerId` or `modelDirectory`.
-///   - hub: The `HubApi` interface for remote or local file resolution.
-/// - Returns: A tuple containing the `tokenizerConfig` and `tokenizerData` configurations.
-/// - Throws: `NSURLError` for network issues (other than offline status).
-/// - Throws: `EmbedderError.missingTokenizerConfig` if the configuration files are
-///   successfully accessed but do not contain a valid `tokenizerConfig` payload.
-///   This typically occurs when the model repository or directory is missing a
-///   `tokenizer_config.json` file.
-func loadTokenizerConfig(
-    configuration: ModelConfiguration,
-    hub: HubApi
-) async throws -> (Config, Config) {
-    // from AutoTokenizer.from() -- this lets us override parts of the configuration
-    let config: LanguageModelConfigurationFromHub
-
     switch configuration.id {
-    case .id(let id):
-        do {
-            // Attempt to load from the remote Hub or Hub cache
-            let loaded = LanguageModelConfigurationFromHub(
-                modelName: configuration.tokenizerId ?? id, hubApi: hub)
-
-            // Trigger an async fetch to verify the config exists
-            _ = try await loaded.tokenizerConfig
-            config = loaded
-        } catch {
-            let nserror = error as NSError
-            if nserror.domain == NSURLErrorDomain
-                && nserror.code == NSURLErrorNotConnectedToInternet
-            {
-                // Fallback: Internet connection is offline, load from the local model directory
-                config = LanguageModelConfigurationFromHub(
-                    modelFolder: configuration.modelDirectory(hub: hub), hubApi: hub)
-            } else {
-                // Re-throw if it's a critical error (e.g., 404, parsing error)
-                throw error
-            }
-        }
+    case .id(let id, let revision):
+        return try await AutoTokenizer.from(
+            pretrained: configuration.tokenizerId ?? id,
+            hubApi: hub,
+            revision: revision
+        )
     case .directory(let directory):
-        // Load directly from a specified local directory
-        config = LanguageModelConfigurationFromHub(modelFolder: directory, hubApi: hub)
-    }
-
-    guard let tokenizerConfig = try await config.tokenizerConfig else {
-        throw EmbedderError.missingTokenizerConfig
+        return try await AutoTokenizer.from(modelFolder: directory, hubApi: hub)
     }
-    let tokenizerData = try await config.tokenizerData
-    return (tokenizerConfig, tokenizerData)
 }
diff --git a/Libraries/MLXLMCommon/Tokenizer.swift b/Libraries/MLXLMCommon/Tokenizer.swift
index 1d14fa1e..bd2a0f2f 100644
--- a/Libraries/MLXLMCommon/Tokenizer.swift
+++ b/Libraries/MLXLMCommon/Tokenizer.swift
@@ -10,13 +10,21 @@ struct TokenizerError: Error {
 
 public func loadTokenizer(configuration: ModelConfiguration, hub: HubApi) async throws -> Tokenizer
 {
-    let (tokenizerConfig, tokenizerData) = try await loadTokenizerConfig(
-        configuration: configuration, hub: hub)
-
-    return try PreTrainedTokenizer(
-        tokenizerConfig: tokenizerConfig, tokenizerData: tokenizerData)
+    switch configuration.id {
+    case .id(let id, let revision):
+        return try await AutoTokenizer.from(
+            pretrained: configuration.tokenizerId ?? id,
+            hubApi: hub,
+            revision: revision
+        )
+    case .directory(let directory):
+        return try await AutoTokenizer.from(modelFolder: directory, hubApi: hub)
+    }
 }
 
+@available(
+    *, deprecated, message: "Use LanguageModelConfigurationFromHub from swift-transformers directly"
+)
 public func loadTokenizerConfig(configuration: ModelConfiguration, hub: HubApi) async throws -> (
     Config, Config
 ) {
@@ -48,60 +56,24 @@ public func loadTokenizerConfig(configuration: ModelConfiguration, hub: HubApi)
         config = LanguageModelConfigurationFromHub(modelFolder: directory, hubApi: hub)
     }
 
-    guard var tokenizerConfig = try await config.tokenizerConfig else {
+    guard let tokenizerConfig = try await config.tokenizerConfig else {
         throw TokenizerError(message: "missing config")
     }
     let tokenizerData = try await config.tokenizerData
 
-    tokenizerConfig = updateTokenizerConfig(tokenizerConfig)
-
     return (tokenizerConfig, tokenizerData)
 }
 
-private func updateTokenizerConfig(_ tokenizerConfig: Config) -> Config {
-    // Workaround: replacement tokenizers for unhandled values in swift-transformers
-    if let tokenizerClass = tokenizerConfig.tokenizerClass?.string(),
-        let replacement = replacementTokenizers[tokenizerClass]
-    {
-        if var dictionary = tokenizerConfig.dictionary() {
-            dictionary["tokenizer_class"] = .init(replacement)
-            return Config(dictionary)
-        }
-    }
-    return tokenizerConfig
-}
-
-public class TokenizerReplacementRegistry: @unchecked Sendable {
-
-    // Note: using NSLock as we have very small (just dictionary get/set)
-    // critical sections and expect no contention. this allows the methods
-    // to remain synchronous.
-    private let lock = NSLock()
-
-    /// overrides for TokenizerModel/knownTokenizers
-    private var replacementTokenizers = [
-        "InternLM2Tokenizer": "PreTrainedTokenizer",
-        "Qwen2Tokenizer": "PreTrainedTokenizer",
-        "Qwen3Tokenizer": "PreTrainedTokenizer",
-        "CohereTokenizer": "PreTrainedTokenizer",
-        "GPTNeoXTokenizer": "PreTrainedTokenizer",
-        "TokenizersBackend": "PreTrainedTokenizer",
-    ]
-
-    public subscript(key: String) -> String? {
-        get {
-            lock.withLock {
-                replacementTokenizers[key]
-            }
-        }
-        set {
-            lock.withLock {
-                replacementTokenizers[key] = newValue
-            }
-        }
-    }
-}
+@available(
+    *, unavailable,
+    message: "Use AutoTokenizer.register(_:for:) from swift-transformers instead"
+)
+public class TokenizerReplacementRegistry: @unchecked Sendable {}
 
+@available(
+    *, unavailable,
+    message: "Use AutoTokenizer.register(_:for:) from swift-transformers instead"
+)
 public let replacementTokenizers = TokenizerReplacementRegistry()
 
 public protocol StreamingDetokenizer: IteratorProtocol<String> {

From 58faf2ffc4859b1a8bdf6820ceb0278fdf5f4ba4 Mon Sep 17 00:00:00 2001
From: Anthony DePasquale <anthony@depasquale.org>
Date: Tue, 6 Jan 2026 21:01:24 +0100
Subject: [PATCH 3/6] Deprecate overrideTokenizer (now handled by
 swift-transformers)

---
 Libraries/MLXLLM/LLMModelFactory.swift         | 5 -----
 Libraries/MLXLMCommon/ModelConfiguration.swift | 4 ++++
 2 files changed, 4 insertions(+), 5 deletions(-)

diff --git a/Libraries/MLXLLM/LLMModelFactory.swift b/Libraries/MLXLLM/LLMModelFactory.swift
index d23ef3e6..7840de9d 100644
--- a/Libraries/MLXLLM/LLMModelFactory.swift
+++ b/Libraries/MLXLLM/LLMModelFactory.swift
@@ -104,7 +104,6 @@ public class LLMRegistry: AbstractModelRegistry, @unchecked Sendable {
 
     static public let codeLlama13b4bit = ModelConfiguration(
         id: "mlx-community/CodeLlama-13b-Instruct-hf-4bit-MLX",
-        overrideTokenizer: "PreTrainedTokenizer",
         defaultPrompt: "func sortArray(_ array: [Int]) -> String { <FILL_ME> }"
     )
 
@@ -136,21 +135,18 @@ public class LLMRegistry: AbstractModelRegistry, @unchecked Sendable {
 
     static public let gemma2bQuantized = ModelConfiguration(
         id: "mlx-community/quantized-gemma-2b-it",
-        overrideTokenizer: "PreTrainedTokenizer",
         // https://www.promptingguide.ai/models/gemma
         defaultPrompt: "what is the difference between lettuce and cabbage?"
     )
 
     static public let gemma_2_9b_it_4bit = ModelConfiguration(
         id: "mlx-community/gemma-2-9b-it-4bit",
-        overrideTokenizer: "PreTrainedTokenizer",
         // https://www.promptingguide.ai/models/gemma
         defaultPrompt: "What is the difference between lettuce and cabbage?"
     )
 
     static public let gemma_2_2b_it_4bit = ModelConfiguration(
         id: "mlx-community/gemma-2-2b-it-4bit",
-        overrideTokenizer: "PreTrainedTokenizer",
         // https://www.promptingguide.ai/models/gemma
         defaultPrompt: "What is the difference between lettuce and cabbage?"
     )
@@ -191,7 +187,6 @@ public class LLMRegistry: AbstractModelRegistry, @unchecked Sendable {
 
     static public let qwen205b4bit = ModelConfiguration(
         id: "mlx-community/Qwen1.5-0.5B-Chat-4bit",
-        overrideTokenizer: "PreTrainedTokenizer",
         defaultPrompt: "why is the sky blue?"
     )
 
diff --git a/Libraries/MLXLMCommon/ModelConfiguration.swift b/Libraries/MLXLMCommon/ModelConfiguration.swift
index d4478d1d..21dcef2c 100644
--- a/Libraries/MLXLMCommon/ModelConfiguration.swift
+++ b/Libraries/MLXLMCommon/ModelConfiguration.swift
@@ -28,6 +28,10 @@ public struct ModelConfiguration: Sendable {
     public let tokenizerId: String?
 
     /// overrides for TokenizerModel/knownTokenizers -- useful before swift-transformers is updated
+    @available(
+        *, deprecated,
+        message: "No longer used. swift-transformers now handles tokenizer remapping internally."
+    )
     public let overrideTokenizer: String?
 
     /// A reasonable default prompt for the model

From 57043668fa796e267179011d532868b3fee4f427 Mon Sep 17 00:00:00 2001
From: Anthony DePasquale <anthony@depasquale.org>
Date: Tue, 6 Jan 2026 21:10:46 +0100
Subject: [PATCH 4/6] Temporary pin to swift-transformers (remove before
 merging)

---
 Package.swift | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/Package.swift b/Package.swift
index 0eb3dbf3..f93707f1 100644
--- a/Package.swift
+++ b/Package.swift
@@ -28,8 +28,8 @@ let package = Package(
     dependencies: [
         .package(url: "https://github.com/ml-explore/mlx-swift", .upToNextMinor(from: "0.30.6")),
         .package(
-            url: "https://github.com/huggingface/swift-transformers",
-            .upToNextMinor(from: "1.1.6")
+            url: "https://github.com/DePasqualeOrg/swift-transformers",
+            revision: "3faa2e45343054388073008cc3ac32c3dee9a85a"
         ),
     ],
     targets: [

From d4ffcdfb61703699a14cc8aa4d7f79db79b50223 Mon Sep 17 00:00:00 2001
From: Anthony DePasquale <anthony@depasquale.org>
Date: Tue, 17 Feb 2026 17:49:16 +0100
Subject: [PATCH 5/6] Remove overrideTokenizer (handled by swift-transformers)

---
 Libraries/MLXLMCommon/ModelConfiguration.swift | 16 +++-------------
 1 file changed, 3 insertions(+), 13 deletions(-)

diff --git a/Libraries/MLXLMCommon/ModelConfiguration.swift b/Libraries/MLXLMCommon/ModelConfiguration.swift
index 21dcef2c..f39157f2 100644
--- a/Libraries/MLXLMCommon/ModelConfiguration.swift
+++ b/Libraries/MLXLMCommon/ModelConfiguration.swift
@@ -27,13 +27,6 @@ public struct ModelConfiguration: Sendable {
     /// pull the tokenizer from an alternate id
     public let tokenizerId: String?
 
-    /// overrides for TokenizerModel/knownTokenizers -- useful before swift-transformers is updated
-    @available(
-        *, deprecated,
-        message: "No longer used. swift-transformers now handles tokenizer remapping internally."
-    )
-    public let overrideTokenizer: String?
-
     /// A reasonable default prompt for the model
     public var defaultPrompt: String
 
@@ -48,15 +41,13 @@ public struct ModelConfiguration: Sendable {
 
     public init(
         id: String, revision: String = "main",
-        tokenizerId: String? = nil, overrideTokenizer: String? = nil,
+        tokenizerId: String? = nil,
         defaultPrompt: String = "hello",
         extraEOSTokens: Set<String> = [],
-        toolCallFormat: ToolCallFormat? = nil,
-        preparePrompt: (@Sendable (String) -> String)? = nil
+        toolCallFormat: ToolCallFormat? = nil
     ) {
         self.id = .id(id, revision: revision)
         self.tokenizerId = tokenizerId
-        self.overrideTokenizer = overrideTokenizer
         self.defaultPrompt = defaultPrompt
         self.extraEOSTokens = extraEOSTokens
         self.toolCallFormat = toolCallFormat
@@ -64,7 +55,7 @@ public struct ModelConfiguration: Sendable {
 
     public init(
         directory: URL,
-        tokenizerId: String? = nil, overrideTokenizer: String? = nil,
+        tokenizerId: String? = nil,
         defaultPrompt: String = "hello",
         extraEOSTokens: Set<String> = [],
         eosTokenIds: Set<Int> = [],
@@ -72,7 +63,6 @@ public struct ModelConfiguration: Sendable {
     ) {
         self.id = .directory(directory)
         self.tokenizerId = tokenizerId
-        self.overrideTokenizer = overrideTokenizer
         self.defaultPrompt = defaultPrompt
         self.extraEOSTokens = extraEOSTokens
         self.eosTokenIds = eosTokenIds

From 70a6635a8d9931221c269dd3a3c483a21078d166 Mon Sep 17 00:00:00 2001
From: Anthony DePasquale <anthony@depasquale.org>
Date: Tue, 17 Feb 2026 17:51:30 +0100
Subject: [PATCH 6/6] Clean up

---
 Libraries/MLXLLM/LLMModelFactory.swift            |  5 +----
 Libraries/MLXLMCommon/ModelConfiguration.swift    |  4 ++--
 Libraries/MLXLMCommon/ModelFactory.swift          | 10 +++++-----
 Libraries/MLXVLM/README.md                        |  2 +-
 skills/mlx-swift-lm/references/embeddings.md      |  2 +-
 skills/mlx-swift-lm/references/model-container.md |  6 +++---
 6 files changed, 13 insertions(+), 16 deletions(-)

diff --git a/Libraries/MLXLLM/LLMModelFactory.swift b/Libraries/MLXLLM/LLMModelFactory.swift
index 7840de9d..03502eb9 100644
--- a/Libraries/MLXLLM/LLMModelFactory.swift
+++ b/Libraries/MLXLLM/LLMModelFactory.swift
@@ -128,10 +128,7 @@ public class LLMRegistry: AbstractModelRegistry, @unchecked Sendable {
         id: "mlx-community/Phi-3.5-MoE-instruct-4bit",
         defaultPrompt: "What is the gravity on Mars and the moon?",
         extraEOSTokens: ["<|end|>"]
-    ) {
-        prompt in
-        "<|user|>\n\(prompt)<|end|>\n<|assistant|>\n"
-    }
+    )
 
     static public let gemma2bQuantized = ModelConfiguration(
         id: "mlx-community/quantized-gemma-2b-it",
diff --git a/Libraries/MLXLMCommon/ModelConfiguration.swift b/Libraries/MLXLMCommon/ModelConfiguration.swift
index f39157f2..07393022 100644
--- a/Libraries/MLXLMCommon/ModelConfiguration.swift
+++ b/Libraries/MLXLMCommon/ModelConfiguration.swift
@@ -24,7 +24,7 @@ public struct ModelConfiguration: Sendable {
         }
     }
 
-    /// pull the tokenizer from an alternate id
+    /// Alternate repo ID to use for the tokenizer
     public let tokenizerId: String?
 
     /// A reasonable default prompt for the model
@@ -72,7 +72,7 @@ public struct ModelConfiguration: Sendable {
     public func modelDirectory(hub: HubApi = HubApi()) -> URL {
         switch id {
         case .id(let id, _):
-            // download the model weights and config
+            // Resolve where the Hub API stores this repo locally
             let repo = Hub.Repo(id: id)
             return hub.localRepoLocation(repo)
 
diff --git a/Libraries/MLXLMCommon/ModelFactory.swift b/Libraries/MLXLMCommon/ModelFactory.swift
index 5f77ac21..144e34e2 100644
--- a/Libraries/MLXLMCommon/ModelFactory.swift
+++ b/Libraries/MLXLMCommon/ModelFactory.swift
@@ -207,15 +207,15 @@ public func loadModelContainer(
     }
 }
 
-/// Load a model given a huggingface identifier.
+/// Load a model given a Hugging Face identifier.
 ///
-/// This will load and return a ``ModelContext``.  This holds the model and tokenzier without
+/// This will load and return a ``ModelContext``.  This holds the model and tokenizer without
 /// an `actor` providing an isolation context.  Use this call when you control the isolation context
 /// and can hold the ``ModelContext`` directly.
 ///
 /// - Parameters:
 ///   - hub: optional HubApi -- by default uses ``defaultHubApi``
-///   - id: huggingface model identifier, e.g "mlx-community/Qwen3-4B-4bit"
+///   - id: Hugging Face model identifier, e.g. "mlx-community/Qwen3-4B-4bit"
 ///   - progressHandler: optional callback for progress
 /// - Returns: a ``ModelContext``
 public func loadModel(
@@ -229,14 +229,14 @@ public func loadModel(
     }
 }
 
-/// Load a model given a huggingface identifier.
+/// Load a model given a Hugging Face identifier.
 ///
 /// This will load and return a ``ModelContainer``.  This holds a ``ModelContext``
 /// inside an actor providing isolation control for the values.
 ///
 /// - Parameters:
 ///   - hub: optional HubApi -- by default uses ``defaultHubApi``
-///   - id: huggingface model identifier, e.g "mlx-community/Qwen3-4B-4bit"
+///   - id: Hugging Face model identifier, e.g. "mlx-community/Qwen3-4B-4bit"
 ///   - progressHandler: optional callback for progress
 /// - Returns: a ``ModelContainer``
 public func loadModelContainer(
diff --git a/Libraries/MLXVLM/README.md b/Libraries/MLXVLM/README.md
index 83120543..63dd8532 100644
--- a/Libraries/MLXVLM/README.md
+++ b/Libraries/MLXVLM/README.md
@@ -298,7 +298,7 @@ media as needed. For example it might:
 - modify the prompt by injecting `<image>` tokens that the model expects
 
 In the python implementations, much of this code typically lives in the `transformers`
-package from huggingface -- inspection will be required to determine which code
+package from Hugging Face -- inspection will be required to determine which code
 is called and what it does. You can examine the processors in the `Models` directory:
 they reference the files and functions that they are based on.
 
diff --git a/skills/mlx-swift-lm/references/embeddings.md b/skills/mlx-swift-lm/references/embeddings.md
index 753c27e6..e7a0f850 100644
--- a/skills/mlx-swift-lm/references/embeddings.md
+++ b/skills/mlx-swift-lm/references/embeddings.md
@@ -248,7 +248,7 @@ print("Similarity: \(similarity)")  // ~0.85
 ```swift
 public struct ModelConfiguration: Sendable {
     public enum Identifier: Sendable {
-        case id(String)          // HuggingFace ID
+        case id(String, revision: String = "main")  // Hugging Face ID
         case directory(URL)      // Local path
     }
 
diff --git a/skills/mlx-swift-lm/references/model-container.md b/skills/mlx-swift-lm/references/model-container.md
index 11d19067..07a8f67d 100644
--- a/skills/mlx-swift-lm/references/model-container.md
+++ b/skills/mlx-swift-lm/references/model-container.md
@@ -2,7 +2,7 @@
 
 ## Overview
 
-`ModelContainer` is the thread-safe wrapper for language models, providing exclusive access to model resources during inference. `ModelConfiguration` describes model identity and settings. Factory classes handle model instantiation from HuggingFace or local directories.
+`ModelContainer` is the thread-safe wrapper for language models, providing exclusive access to model resources during inference. `ModelConfiguration` describes model identity and settings. Factory classes handle model instantiation from Hugging Face or local directories.
 
 ## Quick Reference
 
@@ -124,7 +124,7 @@ for await event in stream {
 ### Creating Configurations
 
 ```swift
-// From HuggingFace model ID
+// From Hugging Face model ID
 let config = ModelConfiguration(
     id: "mlx-community/Llama-3.2-3B-Instruct-4bit",
     defaultPrompt: "Hello",
@@ -227,7 +227,7 @@ Map `model_type` from config.json to model initializers:
 
 ## Loading Flow
 
-1. **Download**: Model weights fetched from HuggingFace (cached locally)
+1. **Download**: Model weights fetched from Hugging Face (cached locally)
 2. **Parse config.json**: Determine `model_type` and configuration
 3. **Create model**: TypeRegistry maps type to initializer
 4. **Load weights**: `.safetensors` files loaded into model