Commit 2660bac

AI: Use OLLAMA_API_KEY as API auth token if specified photoprism#5361
Signed-off-by: Michael Mayer <michael@photoprism.app>
1 parent d4aef5c commit 2660bac

File tree: 14 files changed, +367 −199 lines
internal/ai/vision/README.md

Lines changed: 48 additions & 30 deletions
```diff
@@ -53,41 +53,59 @@ The `vision.yml` file is usually kept in the `storage/config` directory (overrid
 
 The model `Options` adjust model parameters such as temperature, top-p, and schema constraints when using [Ollama](ollama/README.md) or [OpenAI](openai/README.md):
 
-| Option | Default | Description |
-|--------|---------|-------------|
-| `Temperature` | engine default (`0.1` for Ollama) | Controls randomness with a value between `0.01` and `2.0`; not used for OpenAI's GPT-5. |
-| `TopK` | engine default (model-specific) | Limits sampling to the top K tokens to reduce rare or noisy outputs. |
-| `TopP` | engine default (`0.9` for some Ollama label defaults; unset for OpenAI) | Nucleus sampling; keeps the smallest token set whose cumulative probability ≥ `p`. |
-| `MinP` | engine default (unset unless provided) | Drops tokens whose probability mass is below `p`, trimming the long tail. |
-| `TypicalP` | engine default (unset unless provided) | Keeps tokens with typicality under the threshold; combine with TopP/MinP for flow. |
-| `Seed` | random per run (unless set) | Fix for reproducible outputs; unset for more variety between runs. |
-| `RepeatLastN` | engine default (model-specific) | Number of recent tokens considered for repetition penalties. |
-| `RepeatPenalty` | engine default (model-specific) | Multiplier >1 discourages repeating the same tokens or phrases. |
-| `NumPredict` | engine default (Ollama only) | Ollama-specific max output tokens; synonymous intent with `MaxOutputTokens`. |
-| `MaxOutputTokens` | engine default (OpenAI caption 512, labels 1024) | Upper bound on generated tokens; adapters raise low values to defaults. |
-| `ForceJson` | engine-specific (`true` for OpenAI labels; `false` for Ollama labels; captions `false`) | Forces structured output when enabled. |
-| `SchemaVersion` | derived from schema name | Override when coordinating schema migrations. |
-| `Stop` | engine default | Array of stop sequences (e.g., `["\\n\\n"]`). |
-| `NumThread` | runtime auto | Caps CPU threads for local engines. |
-| `NumCtx` | engine default | Context window length (tokens). |
+| Option | Default | Description |
+|--------|---------|-------------|
+| `Temperature` | engine default (`0.1` for Ollama) | Controls randomness with a value between `0.01` and `2.0`; not used for OpenAI's GPT-5. |
+| `TopK` | engine default (model-specific) | Limits sampling to the top K tokens to reduce rare or noisy outputs. |
+| `TopP` | engine default (`0.9` for some Ollama label defaults; unset for OpenAI) | Nucleus sampling; keeps the smallest token set whose cumulative probability ≥ `p`. |
+| `MinP` | engine default (unset unless provided) | Drops tokens whose probability mass is below `p`, trimming the long tail. |
+| `TypicalP` | engine default (unset unless provided) | Keeps tokens with typicality under the threshold; combine with TopP/MinP for flow. |
+| `Seed` | random per run (unless set) | Fix for reproducible outputs; unset for more variety between runs. |
+| `RepeatLastN` | engine default (model-specific) | Number of recent tokens considered for repetition penalties. |
+| `RepeatPenalty` | engine default (model-specific) | Multiplier >1 discourages repeating the same tokens or phrases. |
+| `PenalizeNewline` | engine default | Whether to apply repetition penalties to newline tokens. |
+| `PresencePenalty` | engine default (OpenAI-style) | Increases the likelihood of introducing new tokens by penalizing existing ones. |
+| `FrequencyPenalty` | engine default (OpenAI-style) | Penalizes tokens in proportion to their frequency so far. |
+| `TfsZ` | engine default | Tail free sampling parameter; lower values reduce repetition. |
+| `NumKeep` | engine default (Ollama) | How many tokens to keep from the prompt before sampling starts. |
+| `NumPredict` | engine default (Ollama only) | Ollama-specific max output tokens; synonymous intent with `MaxOutputTokens`. |
+| `MaxOutputTokens` | engine default (OpenAI caption 512, labels 1024) | Upper bound on generated tokens; adapters raise low values to defaults. |
+| `ForceJson` | engine-specific (`true` for OpenAI labels; `false` for Ollama labels; captions `false`) | Forces structured output when enabled. |
+| `SchemaVersion` | derived from schema name | Override when coordinating schema migrations. |
+| `Stop` | engine default | Array of stop sequences (e.g., `["\\n\\n"]`). |
+| `NumThread` | runtime auto | Caps CPU threads for local engines. |
+| `NumCtx` | engine default | Context window length (tokens). |
+| `Mirostat` | engine default (Ollama) | Enables Mirostat sampling (`0` off, `1/2` modes). |
+| `MirostatTau` | engine default | Controls surprise target for Mirostat sampling. |
+| `MirostatEta` | engine default | Learning rate for Mirostat adaptation. |
+| `NumBatch` | engine default (Ollama) | Batch size for prompt processing. |
+| `NumGpu` | engine default (Ollama) | Number of GPUs to distribute work across. |
+| `MainGpu` | engine default (Ollama) | Primary GPU index when multiple GPUs are present. |
+| `LowVram` | engine default (Ollama) | Enable VRAM-saving mode; may reduce performance. |
+| `VocabOnly` | engine default (Ollama) | Load vocabulary only for quick metadata inspection. |
+| `UseMmap` | engine default (Ollama) | Memory map model weights instead of fully loading them. |
+| `UseMlock` | engine default (Ollama) | Lock model weights in RAM to reduce paging. |
+| `Numa` | engine default (Ollama) | Enable NUMA-aware allocations when available. |
+| `Detail` | engine default (OpenAI) | Controls OpenAI vision detail level (`low`, `high`, `auto`). |
+| `CombineOutputs` | engine default (OpenAI multi-output) | Controls whether multi-output models combine results automatically. |
 
 #### Model Service
 
 Configures the endpoint URL, method, format, and authentication for [Ollama](ollama/README.md), [OpenAI](openai/README.md), and other engines that perform remote HTTP requests:
 
-| Field | Default | Notes |
-|-------|---------|-------|
-| `Uri` | required for remote | Endpoint base. Empty keeps model local (TensorFlow). |
-| `Method` | `POST` | Override verb if provider needs it. |
-| `Key` | `""` | Bearer token; prefer env expansion. |
-| `Username` / `Password` | `""` | Injected as basic auth when URI lacks userinfo. |
-| `Model` | `""` | Endpoint-specific override; wins over model/name. |
-| `Org` / `Project` | `""` | OpenAI headers (org/proj IDs) |
-| `RequestFormat` / `ResponseFormat` | set by engine alias | Explicit values win over alias defaults. |
-| `FileScheme` | set by engine alias (`data` or `base64`) | Controls image transport. |
-| `Disabled` | `false` | Disable the endpoint without removing the model. |
-
-> **Authentication:** All credentials and identifiers support `${ENV_VAR}` expansion. `Service.Key` sets `Authorization: Bearer <token>`; `Username`/`Password` injects HTTP basic authentication into the service URI when it is not already present.
+| Field | Default | Notes |
+|-------|---------|-------|
+| `Uri` | required for remote | Endpoint base. Empty keeps model local (TensorFlow). |
+| `Method` | `POST` | Override verb if provider needs it. |
+| `Key` | `""` | Bearer token; prefer env expansion (OpenAI: `OPENAI_API_KEY`, Ollama: `OLLAMA_API_KEY`). |
+| `Username` / `Password` | `""` | Injected as basic auth when URI lacks userinfo. |
+| `Model` | `""` | Endpoint-specific override; wins over model/name. |
+| `Org` / `Project` | `""` | OpenAI headers (org/proj IDs) |
+| `RequestFormat` / `ResponseFormat` | set by engine alias | Explicit values win over alias defaults. |
+| `FileScheme` | set by engine alias (`data` or `base64`) | Controls image transport. |
+| `Disabled` | `false` | Disable the endpoint without removing the model. |
+
+> **Authentication:** All credentials and identifiers support `${ENV_VAR}` expansion. `Service.Key` sets `Authorization: Bearer <token>`; `Username`/`Password` injects HTTP basic authentication into the service URI when it is not already present. When `Service.Key` is empty, PhotoPrism defaults to `OPENAI_API_KEY` (OpenAI engine) or `OLLAMA_API_KEY` (Ollama engine), also honoring their `_FILE` counterparts.
 
 ### Field Behavior & Precedence
```
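Taken together, the tables above describe per-model settings in `vision.yml`. As a minimal sketch of how they fit together (the list layout, endpoint URL, and all values here are illustrative assumptions, not taken from this commit):

```yaml
# Hypothetical vision.yml fragment; field names come from the README
# tables, but the structure and values are illustrative only.
Models:
  - Type: caption
    Engine: ollama
    Options:
      Temperature: 0.1   # low randomness for stable captions
      NumCtx: 8192       # context window length in tokens
    Service:
      Uri: http://ollama:11434/api/chat
      # Supports ${ENV_VAR} expansion; with this commit, leaving Key
      # empty falls back to ${OLLAMA_API_KEY} for the Ollama engine.
      Key: ${OLLAMA_API_KEY}
```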

internal/ai/vision/engine.go

Lines changed: 1 addition & 9 deletions
```diff
@@ -5,7 +5,6 @@ import (
 	"strings"
 	"sync"
 
-	"github.com/photoprism/photoprism/internal/ai/vision/openai"
 	"github.com/photoprism/photoprism/pkg/http/scheme"
 )
 
@@ -61,14 +60,6 @@ func init() {
 		FileScheme:        scheme.Data,
 		DefaultResolution: DefaultResolution,
 	})
-
-	RegisterEngineAlias(openai.EngineName, EngineInfo{
-		Uri:               "https://api.openai.com/v1/responses",
-		RequestFormat:     ApiFormatOpenAI,
-		ResponseFormat:    ApiFormatOpenAI,
-		FileScheme:        scheme.Data,
-		DefaultResolution: openai.DefaultResolution,
-	})
 }
 
 // RegisterEngine adds/overrides an engine implementation for a specific API format.
@@ -85,6 +76,7 @@ type EngineInfo struct {
 	ResponseFormat    ApiFormat
 	FileScheme        string
 	DefaultResolution int
+	DefaultKey        string // Optional placeholder key (e.g., ${OPENAI_API_KEY}); applied only when Service.Key is empty.
 }
 
 // RegisterEngineAlias maps a logical engine name (e.g., "ollama") to a
```

internal/ai/vision/engine_ollama.go

Lines changed: 1 addition & 0 deletions
```diff
@@ -30,6 +30,7 @@ func init() {
 		ResponseFormat:    ApiFormatOllama,
 		FileScheme:        scheme.Base64,
 		DefaultResolution: ollama.DefaultResolution,
+		DefaultKey:        ollama.APIKeyPlaceholder,
 	})
 
 	CaptionModel.Engine = ollama.EngineName
```

internal/ai/vision/engine_openai.go

Lines changed: 9 additions & 0 deletions
```diff
@@ -28,6 +28,15 @@ func init() {
 		Parser:   openaiParser{},
 		Defaults: openaiDefaults{},
 	})
+
+	RegisterEngineAlias(openai.EngineName, EngineInfo{
+		Uri:               "https://api.openai.com/v1/responses",
+		RequestFormat:     ApiFormatOpenAI,
+		ResponseFormat:    ApiFormatOpenAI,
+		FileScheme:        scheme.Data,
+		DefaultResolution: openai.DefaultResolution,
+		DefaultKey:        openai.APIKeyPlaceholder,
+	})
 }
 
 // SystemPrompt returns the default OpenAI system prompt for the specified model type.
```

internal/ai/vision/model.go

Lines changed: 3 additions & 3 deletions
```diff
@@ -491,10 +491,10 @@ func (m *Model) ApplyEngineDefaults() {
 		if info.DefaultResolution > 0 && m.Resolution <= 0 {
 			m.Resolution = info.DefaultResolution
 		}
-	}
 
-	if engine == openai.EngineName && strings.TrimSpace(m.Service.Key) == "" {
-		m.Service.Key = "${OPENAI_API_KEY}"
+		if strings.TrimSpace(m.Service.Key) == "" && strings.TrimSpace(info.DefaultKey) != "" {
+			m.Service.Key = info.DefaultKey
+		}
 	}
 
 	m.Engine = engine
```
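The `model.go` change replaces the OpenAI-only special case with a generic fallback driven by `EngineInfo.DefaultKey`, so any engine alias can declare a placeholder key. A standalone sketch of that logic (simplified types and names, not the actual PhotoPrism code):

```go
package main

import (
	"fmt"
	"strings"
)

// EngineInfo mirrors the idea of the commit: each engine alias can carry
// an optional placeholder key such as "${OLLAMA_API_KEY}".
type EngineInfo struct {
	DefaultKey string
}

// applyDefaultKey returns the configured key, or the engine's placeholder
// when no key is set, matching the fallback added to ApplyEngineDefaults.
func applyDefaultKey(key string, info EngineInfo) string {
	if strings.TrimSpace(key) == "" && strings.TrimSpace(info.DefaultKey) != "" {
		return info.DefaultKey
	}
	return key
}

func main() {
	ollama := EngineInfo{DefaultKey: "${OLLAMA_API_KEY}"}
	fmt.Println(applyDefaultKey("", ollama))      // empty key falls back to the placeholder
	fmt.Println(applyDefaultKey("token", ollama)) // an explicit key always wins
}
```

The placeholder string itself is presumably resolved later through the `${ENV_VAR}` expansion described in the README, so the actual token is only read from the environment, not stored in the config.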
