chore: v0.4.1

av · av · commit b3be20743341 · 2026-02-09T21:30:17.000+01:00
diff --git a/.scripts/docs.ts b/.scripts/docs.ts
@@ -116,6 +116,12 @@ async function copyWithProcessor(
   const sourceContent = await Deno.readTextFile(source);
   const destContent = await processor(sourceContent);
 
+  // Ensure destination directory exists before writing
+  const dir = dest.split('/').slice(0, -1).join('/');
+  if (dir && !Array.from(Deno.readDirSync('.')).some(d => d.name === dir && d.isDirectory)) {
+    await Deno.mkdir(dir, { recursive: true });
+  }
+
   await Deno.writeTextFile(dest, destContent);
 }
 
diff --git a/.scripts/release.sh b/.scripts/release.sh
@@ -12,9 +12,14 @@ harbor dev docs
 
 # cd to wiki and push the docs
 cd ../harbor.wiki
-git add .
-git commit -m "chore: docs"
-git push origin master
+git add . || true
+# Commit only if there are changes
+if git diff-index --quiet HEAD --; then
+  echo "No docs changes to commit"
+else
+  git commit -m "chore: docs"
+  git push origin master || true
+fi
 cd ../harbor
 
 # echo "NPM Publish..."
diff --git a/.scripts/seed.ts b/.scripts/seed.ts
@@ -6,7 +6,7 @@ import * as toml from 'jsr:@std/toml';
 import * as path from 'jsr:@std/path';
 import * as collections from "jsr:@std/collections/deep-merge";
 
-const VERSION = "0.4.0";
+const VERSION = "0.4.1";
 
 type ValueSeed = {
   // Path relative to the project root
@@ -26,7 +26,7 @@ const targets: ValueSeed[] = [{
     },
   },
 }, {
-  target: 'boost/pyproject.toml',
+  target: 'services/boost/pyproject.toml',
   value: {
     project: {
       version: VERSION,
diff --git a/app/package.json b/app/package.json
@@ -1,7 +1,7 @@
 {
   "name": "@avcodes/harbor-app",
   "private": true,
-  "version": "0.3.41",
+  "version": "0.4.1",
   "type": "module",
   "scripts": {
     "dev": "vite",
diff --git a/app/src-tauri/Cargo.toml b/app/src-tauri/Cargo.toml
@@ -1,7 +1,7 @@
 
 [package]
 name = "harbor-app"
-version = "0.3.41"
+version = "0.4.1"
 description = "A companion app for Harbor LLM toolkit"
 authors = ["av"]
 edition = "2021"
diff --git a/app/src-tauri/tauri.conf.json b/app/src-tauri/tauri.conf.json
@@ -1,7 +1,7 @@
 {
   "$schema": "https://schema.tauri.app/config/2.4.0",
   "productName": "Harbor",
-  "version": "0.3.41",
+  "version": "0.4.1",
   "identifier": "com.harbor.app",
   "build": {
     "beforeDevCommand": "bun run dev",
diff --git a/boost/README.md b/boost/README.md
@@ -0,0 +1,296 @@
+> Handle: `boost`<br/>
+> URL: [http://localhost:34131/](http://localhost:34131/)
+
+![splash](../docs/harbor-boost.png)
+
+`boost` is an optimising LLM proxy with OpenAI-compatible API.
+
+### Documentation
+
+- [Features](#features)
+- [Starting](#starting)
+- [Configuration](#configuration)
+- [API](#api)
+- [Environment Variables Reference](../docs/5.2.2-Harbor-Boost-Configuration)
+- [Built-in Modules Reference](../docs/5.2.3-Harbor-Boost-Modules)
+- [Custom Modules Guide](../docs/5.2.1.-Harbor-Boost-Custom-Modules)
+- [Standalone Usage Guide](#standalone-usage)
+- [Boost Starter repo](https://github.com/av/boost-starter)
+
+***
+
+### Features
+
+#### OpenAI-compatible API
+
+Acts as a drop-in proxy for OpenAI APIs, compatible with most LLM providers and clients. Boost can be used as a "plain" proxy to combine multiple LLM backends behind a single endpoint with a single API key.
+
+![Short overview of boost behavior](../docs/boost-behavior.png)
+
+```bash
+POST http://localhost:34131/v1/chat/completions
+
+{
+  "model": "llama3.1",
+  "messages": [{ "role": "user", "content": "Tell me about LLMs" }]
+}
+```
+
+#### Modules
+
+Run custom code inside or instead of a chat completion, to fetch external data, improve reasoning, perform trace inference, and more.
+
+```bash
+POST http://localhost:34131/v1/chat/completions
+
+{
+  "model": "klmbr-llama3.1",
+  "messages": [{ "role": "user", "content": "Suggest me a random color" }]
+}
+```
+
+Boost comes with [a lot of built-in modules](../docs/5.2.3-Harbor-Boost-Modules) with various functions. You can use them directly or as a base for your own creations.
+
+| [`markov`](../docs/5.2.3-Harbor-Boost-Modules#markov) | [`concept`](../docs/5.2.3-Harbor-Boost-Modules#concept) |
+|-|-|
+| ![](../docs/boost-markov.png) | ![](../docs/boost-concept.png) |
+
+| [`nbs`](../docs/5.2.3-Harbor-Boost-Modules#nbs) |
+|-|
+| ![](../docs/boost-nbs.png) |
+
+| [`dnd`](../docs/5.2.3-Harbor-Boost-Modules#dnd) | [`promx`](../docs/5.2.3-Harbor-Boost-Modules#promx) |
+|-|-|
+| ![](../docs/boost-dnd.png) | ![](../docs/boost-promx.png) |
+
+| [`dot`](../docs/5.2.3-Harbor-Boost-Modules#dot) | [`klmbr`](../docs/5.2.3-Harbor-Boost-Modules#klmbr) | [`r0`](../docs/5.2.3-Harbor-Boost-Modules#r0) |
+|-|-|-|
+| ![](../docs/boost-dot.png) | ![](../docs/boost-klmbr.png) | ![](../docs/boost-r0.png) |
+
+#### Scripting
+
+Creating custom modules is a first-class feature and one of the main use-cases for Harbor Boost.
+
+```python
+# Simplest echo module replies back
+# with the last message from the input
+async def apply(llm, chat):
+  await llm.emit_message(prompt=chat.tail.content)
+```
+
+See the [Custom Modules](../docs/5.2.1.-Harbor-Boost-Custom-Modules) guide for more information on how to create your own modules and for an overview of the available interfaces.
+
+### Starting
+
+#### Start with Harbor
+
+```bash
+# [Optional] pre-build the image
+harbor build boost
+
+# Start the service
+harbor up boost
+```
+
+- Harbor connects `boost` with:
+  - all included LLM backends (`ollama`, `llamacpp`, `vllm`, etc.)
+  - [`optillm`](../docs/2.3.33-Satellite\&colon-OptiLLM) as a backend
+  - `webui` and `dify` frontends
+
+```bash
+# Get the URL for the boost service
+harbor url boost
+
+# Open default boost endpoint in the browser
+harbor open boost
+```
+
+#### Start standalone
+
+```bash
+docker run \
+  -e "HARBOR_BOOST_OPENAI_URLS=http://172.17.0.1:11434/v1" \
+  -e "HARBOR_BOOST_OPENAI_KEYS=sk-ollama" \
+  -e "HARBOR_BOOST_MODULES=dot;klmbr;promx;autotemp;markov;" \
+  -e "HARBOR_BOOST_BASE_MODELS=true" \
+  -e "HARBOR_BOOST_API_KEY=sk-boost" \
+  -p 34131:8000 \
+  ghcr.io/av/harbor-boost:latest
+```
+
+See the [standalone usage](#standalone-usage) guide below.
+
+### Configuration
+
+[Configuration](../docs/1.-Harbor-User-Guide#configuring-services) can be performed via Harbor CLI, [`harbor config`](../docs/3.-Harbor-CLI-Reference#harbor-config), [`harbor env`](../docs/3.-Harbor-CLI-Reference#harbor-env) or the `.env` file.
+
+All of the above ways are interchangeable and result in setting environment variables for the service.
+
+#### Harbor CLI
+
+Specific options can be set using `harbor` CLI:
+
+```bash
+# Enable/Disable a module
+harbor boost modules add <module>
+harbor boost modules rm <module>
+
+# Set a parameter
+harbor boost <module> <parameter>
+harbor boost <module> <parameter> <value>
+
+# See boost/module help entries
+# for more info
+harbor boost --help
+harbor boost klmbr --help
+harbor boost rcn --help
+harbor boost g1 --help
+
+# Additional OpenAI-compatible APIs to boost
+harbor boost urls add http://localhost:11434/v1
+harbor boost urls rm http://localhost:11434/v1
+harbor boost urls rm 0 # by index
+harbor boost urls ls
+
+# Keys for the OpenAI-compatible APIs to boost. Semicolon-separated list.
+# ⚠️ These are index-matched with the URLs. Even if the API doesn't require a key,
+# you still need to provide a placeholder for it.
+harbor boost keys add sk-ollama
+harbor boost keys rm sk-ollama
+harbor boost keys rm 0 # by index
+harbor boost keys ls
+```
+
+#### Harbor Config
+
+More options are available via [`harbor config`](../docs/3.-Harbor-CLI-Reference#harbor-config).
+
+```bash
+# See all available options
+harbor config ls boost
+
+# Some of the available options
+harbor config set boost.host.port 34131
+harbor config set boost.api.key sk-boost
+harbor config set boost.api.keys "sk-user1;sk-user2;sk-user3"
+```
+
+Below are additional configuration options that do not have an alias in the Harbor CLI (so you need to use [`harbor config`](../docs/3.-Harbor-CLI-Reference#harbor-config) directly). For example `harbor config set boost.intermediate_output true`.
+
+#### Environment Variables
+
+The most comprehensive way to configure `boost` is to use environment variables. You can set them in the `.env` file or via [`harbor env`](../docs/3.-Harbor-CLI-Reference#harbor-env).
+
+```bash
+# Using harbor env
+harbor env boost HARBOR_BOOST_API_KEY_MISTRAL sk-mistral
+
+# Or open one of these in your text editor
+open $(harbor home)/.env
+open $(harbor home)/services/boost/override.env
+```
+
+See all supported environment variables in the [Environment Variables Reference](../docs/5.2.2-Harbor-Boost-Configuration).
+
+There's no configuration for this module yet.
+
+### API
+
+`boost` works as an OpenAI-compatible API proxy. It'll query configured downstream services for which models they serve and provide "boosted" wrappers in its own API.
+
+See the [http catalog](https://github.com/av/harbor/blob/main/http-catalog/boost.http) entry for some sample requests.
+
+**Authorization**
+
+When [configured](#configuration) to require an API key, you can provide the API key in the `Authorization` header.
+
+```http
+<!-- All three versions are accepted -->
+Authorization: sk-boost
+Authorization: bearer sk-boost
+Authorization: Bearer sk-boost
+```
+
+**`GET /v1/models`**
+
+List boosted models. `boost` will serve additional models as per enabled modules. For example:
+
+```jsonc
+[
+  {
+    // Original, unmodified model proxy
+    "id": "llama3.1:8b"
+    // ...
+  },
+  {
+    // LLM with klmbr technique applied
+    "id": "klmbr-llama3.1:8b"
+    // ...
+  },
+  {
+    // LLM with rcn technique applied
+    "id": "rcn-llama3.1:8b"
+    // ...
+  }
+]
+```
+
+**`POST /v1/chat/completions`**
+
+Chat completions endpoint.
+
+- Proxies all parameters to the downstream API, so custom payloads are supported out of the box, for example `json` format for Ollama
+- Supports streaming completions and tool calls
+
+```bash
+POST http://localhost:34131/v1/chat/completions
+
+{
+  "model": "llama3.1:8b",
+  "messages": [
+    { "role": "user", "content": "Suggest me a random color" }
+  ],
+  "stream": true
+}
+```
+
+**`GET /events/:stream_id`**
+
+Listen to a specific stream of events (associated with a single completion workflow). The stream ID is a unique identifier of the LLM instance processing the request (you may decide to advertise/pass it to the client in the workflow's code).
+
+**`GET /health`**
+
+Health check endpoint. Returns `{ status: 'ok' }` if the service is running.
+
+### Standalone usage
+
+You can run boost as a standalone Docker container. See the [harbor-boost](https://github.com/av/harbor/pkgs/container/harbor-boost) package in the GitHub Container Registry.
+
+```bash
+# [Optional] pre-pull the image
+docker pull ghcr.io/av/harbor-boost:latest
+
+# Start the container
+# - 172.17.0.1 is the default IP of the host, when running on Linux,
+#   so the HARBOR_BOOST_OPENAI_URLS example below is for local ollama
+# - HARBOR_BOOST_MODULES and HARBOR_BOOST_KLMBR_PERCENTAGE are
+#   configuration for the boost modules
+# - [Optional] the -v flag mounts a folder with custom modules
+docker run \
+  -e "HARBOR_BOOST_OPENAI_URLS=http://172.17.0.1:11434/v1" \
+  -e "HARBOR_BOOST_OPENAI_KEYS=sk-ollama" \
+  -e "HARBOR_BOOST_MODULES=klmbr;rcn;g1" \
+  -e "HARBOR_BOOST_KLMBR_PERCENTAGE=60" \
+  -v /path/to/custom_modules/folder:/app/custom_modules \
+  -p 8004:8000 \
+  ghcr.io/av/harbor-boost:latest
+
+# In a separate terminal (or after detaching the container)
+curl http://localhost:8004/health
+curl http://localhost:8004/v1/models
+```
+
+You can take a look at the [`boost-starter`](https://github.com/av/boost-starter) repo for a minimal example repository to get started.
+
+**Configuration**
+
+See [Environment Variables Reference](../docs/5.2.2-Harbor-Boost-Configuration).
diff --git a/docs/2.-Services.md b/docs/2.-Services.md
@@ -78,7 +78,7 @@ A Flexible Framework for Experiencing Cutting-edge LLM Inference Optimizations
 - <a href="https://github.com/av/harbor/wiki/2.2.2-Backend:-llama.cpp"><img src="https://github.com/ggerganov.png?size=200" alt="llama.cpp logo" width="12" height="12" /> llama.cpp</a> <span style="opacity: 0.5;">`Backend`</span><br/>
 LLM inference in C/C++
 
-- <a href="https://github.com/av/harbor/wiki/2.2.10-Backend:-lmdeploy">lmdeploy</a> <span style="opacity: 0.5;">`Backend`, `Partial Support`</span><br/>
+- <a href="https://github.com/av/harbor/wiki/2.2.10-Backend:-lmdeploy"><img src="https://www.google.com/s2/favicons?domain=lmdeploy.readthedocs.io&sz=128" alt="lmdeploy logo" width="12" height="12" /> lmdeploy</a> <span style="opacity: 0.5;">`Backend`, `Partial Support`</span><br/>
 
 
 - <a href="https://github.com/av/harbor/wiki/2.2.6-Backend:-mistral.rs"><img src="https://github.com/EricLBuehler.png?size=200" alt="mistral.rs logo" width="12" height="12" /> mistral.rs</a> <span style="opacity: 0.5;">`Backend`</span><br/>
diff --git a/harbor.sh b/harbor.sh
@@ -4775,7 +4775,7 @@ run_modularmax_command() {
 # ========================================================================
 
 # Globals
-version="0.3.41"
+version="0.4.1"
 harbor_repo_url="https://github.com/av/harbor.git"
 harbor_release_url="https://api.github.com/repos/av/harbor/releases/latest"
 delimiter="|"
diff --git a/package.json b/package.json
@@ -1,6 +1,6 @@
 {
   "name": "@avcodes/harbor",
-  "version": "0.3.41",
+  "version": "0.4.1",
   "description": "Effortlessly run LLM backends, APIs, frontends, and services with one command.",
   "private": false,
   "author": "av <av@av.codes> (https://av.codes)",
diff --git a/promptfoo/README.md b/promptfoo/README.md
diff --git a/pyproject.toml b/pyproject.toml
diff --git a/services/boost/pyproject.toml b/services/boost/pyproject.toml

Original file line number	Diff line number	Diff line change
`@@ -1,7 +1,7 @@`
`1`	`1`	`{`
`2`	`2`	`"name": "@avcodes/harbor-app",`
`3`	`3`	`"private": true,`
`4`		`- "version": "0.3.41",`
	`4`	`+ "version": "0.4.1",`
`5`	`5`	`"type": "module",`
`6`	`6`	`"scripts": {`
`7`	`7`	`"dev": "vite",`
Original file line number	Diff line number	Diff line change
`@@ -1,7 +1,7 @@`
`1`	`1`	`{`
`2`	`2`	`"$schema": "https://schema.tauri.app/config/2.4.0",`
`3`	`3`	`"productName": "Harbor",`
`4`		`- "version": "0.3.41",`
	`4`	`+ "version": "0.4.1",`
`5`	`5`	`"identifier": "com.harbor.app",`
`6`	`6`	`"build": {`
`7`	`7`	`"beforeDevCommand": "bun run dev",`
Original file line number	Diff line number	Diff line change
`@@ -1,6 +1,6 @@`
`1`	`1`	`{`
`2`	`2`	`"name": "@avcodes/harbor",`
`3`		`- "version": "0.3.41",`
	`3`	`+ "version": "0.4.1",`
`4`	`4`	`"description": "Effortlessly run LLM backends, APIs, frontends, and services with one command.",`
`5`	`5`	`"private": false,`
`6`	`6`	`"author": "av <av@av.codes> (https://av.codes)",`