Clarify parallelism in comments

DePasqualeOrg · DePasqualeOrg · commit 12c48ac9ec97 · 2026-01-06T20:52:34.000+01:00
diff --git a/Libraries/Embedders/EmbeddingModel.swift b/Libraries/Embedders/EmbeddingModel.swift
@@ -46,8 +46,7 @@ public actor ModelContainer {
     public init(
         hub: HubApi, modelDirectory: URL, configuration: ModelConfiguration
     ) async throws {
-        // Start tokenizer config loading asynchronously, then load model synchronously.
-        // Both operations run in parallel because async let begins execution immediately.
+        // Load tokenizer config and model in parallel using async let.
         async let tokenizerConfigTask = loadTokenizerConfig(
             configuration: configuration, hub: hub)
 
diff --git a/Libraries/Embedders/Load.swift b/Libraries/Embedders/Load.swift
@@ -90,8 +90,7 @@ public func load(
     let modelDirectory = try await prepareModelDirectory(
         hub: hub, configuration: configuration, progressHandler: progressHandler)
 
-    // Start tokenizer loading asynchronously, then load model synchronously.
-    // Both operations run in parallel because async let begins execution immediately.
+    // Load tokenizer and model in parallel using async let.
     async let tokenizerTask = loadTokenizer(configuration: configuration, hub: hub)
     let model = try loadSynchronous(modelDirectory: modelDirectory, modelName: configuration.name)
     let tokenizer = try await tokenizerTask
diff --git a/Libraries/MLXLLM/LLMModelFactory.swift b/Libraries/MLXLLM/LLMModelFactory.swift
@@ -503,8 +503,7 @@ public final class LLMModelFactory: ModelFactory {
                 configurationURL.lastPathComponent, configuration.name, error)
         }
 
-        // Start tokenizer loading asynchronously, then load weights synchronously.
-        // Both operations run in parallel because async let begins execution immediately.
+        // Load tokenizer and weights in parallel using async let.
         async let tokenizerTask = loadTokenizer(configuration: configuration, hub: hub)
 
         try loadWeights(
diff --git a/Libraries/MLXVLM/VLMModelFactory.swift b/Libraries/MLXVLM/VLMModelFactory.swift
@@ -282,8 +282,10 @@ public final class VLMModelFactory: ModelFactory {
                 configurationURL.lastPathComponent, configuration.name, error)
         }
 
-        // Start tokenizer and processor config loading asynchronously, then load weights synchronously.
-        // All three operations run in parallel because async let begins execution immediately.
+        // Load tokenizer, processor config, and weights in parallel using async let.
+        // Note: loadProcessorConfig does synchronous I/O but is marked async to enable
+        // parallel scheduling. This may briefly block a cooperative thread pool thread,
+        // but the config file is small and model loading is not a high-concurrency path.
         async let tokenizerTask = loadTokenizer(configuration: configuration, hub: hub)
         async let processorConfigTask = loadProcessorConfig(from: modelDirectory)
 
@@ -331,6 +333,7 @@ private struct ProcessorConfigError: Error {
 }
 
 /// Loads processor configuration, preferring preprocessor_config.json over processor_config.json.
+/// Marked async to enable parallel scheduling via async let, though the underlying I/O is synchronous.
 /// Throws ProcessorConfigError wrapping any underlying error with the filename.
 private func loadProcessorConfig(from modelDirectory: URL) async throws -> (
     Data, BaseProcessorConfiguration

Original file line number	Diff line number	Diff line change
`@@ -503,8 +503,7 @@ public final class LLMModelFactory: ModelFactory {`
`503`	`503`	`configurationURL.lastPathComponent, configuration.name, error)`
`504`	`504`	`}`
`505`	`505`
`506`		`- // Start tokenizer loading asynchronously, then load weights synchronously.`
`507`		`- // Both operations run in parallel because async let begins execution immediately.`
	`506`	`+ // Load tokenizer and weights in parallel using async let.`
`508`	`507`	`async let tokenizerTask = loadTokenizer(configuration: configuration, hub: hub)`
`509`	`508`
`510`	`509`	`try loadWeights(`