Skip to content

Commit 073a6da

Browse files
author
jinxuesong
committed
Improve LLM diagnostics and timeout configuration
1 parent 2ebba8e commit 073a6da

File tree

8 files changed

+236
-25
lines changed

8 files changed

+236
-25
lines changed

README.md

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -199,7 +199,7 @@ If you already have your own OpenAI-compatible services, just replace the releva
199199

200200
- `embedding`: change `apiKey` / `model` / `baseURL` / `dimensions`
201201
- `retrieval`: change `rerankProvider` / `rerankEndpoint` / `rerankModel` / `rerankApiKey`
202-
- `llm`: change `apiKey` / `model` / `baseURL`
202+
- `llm`: change `apiKey` / `model` / `baseURL` / `timeoutMs`
203203

204204
For example, to replace only the LLM:
205205

@@ -535,6 +535,7 @@ When `smartExtraction` is enabled (default: `true`), the plugin uses an LLM to i
535535
| `llm.apiKey` | string | *(falls back to `embedding.apiKey`)* | API key for the LLM provider |
536536
| `llm.model` | string | `openai/gpt-oss-120b` | LLM model name |
537537
| `llm.baseURL` | string | *(falls back to `embedding.baseURL`)* | LLM API endpoint |
538+
| `llm.timeoutMs` | number | `30000` | LLM request timeout in milliseconds |
538539
| `extractMinMessages` | number | `2` | Minimum messages before extraction triggers |
539540
| `extractMaxChars` | number | `8000` | Maximum characters sent to the LLM |
540541

@@ -551,7 +552,7 @@ Full config (separate LLM endpoint):
551552
{
552553
"embedding": { "apiKey": "${OPENAI_API_KEY}", "model": "text-embedding-3-small" },
553554
"smartExtraction": true,
554-
"llm": { "apiKey": "${OPENAI_API_KEY}", "model": "gpt-4o-mini", "baseURL": "https://api.openai.com/v1" },
555+
"llm": { "apiKey": "${OPENAI_API_KEY}", "model": "gpt-4o-mini", "baseURL": "https://api.openai.com/v1", "timeoutMs": 30000 },
555556
"extractMinMessages": 2,
556557
"extractMaxChars": 8000
557558
}

README_CN.md

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -199,7 +199,7 @@ openclaw logs --follow --plain | rg "memory-lancedb-pro"
199199

200200
- `embedding`:改 `apiKey` / `model` / `baseURL` / `dimensions`
201201
- `retrieval`:改 `rerankProvider` / `rerankEndpoint` / `rerankModel` / `rerankApiKey`
202-
- `llm`:改 `apiKey` / `model` / `baseURL`
202+
- `llm`:改 `apiKey` / `model` / `baseURL` / `timeoutMs`
203203

204204
例如只替换 LLM:
205205

@@ -535,6 +535,7 @@ OpenClaw 默认行为:
535535
| `llm.apiKey` | string | *(复用 `embedding.apiKey`)* | LLM 提供商 API Key |
536536
| `llm.model` | string | `openai/gpt-oss-120b` | LLM 模型名称 |
537537
| `llm.baseURL` | string | *(复用 `embedding.baseURL`)* | LLM API 端点 |
538+
| `llm.timeoutMs` | number | `30000` | LLM 请求超时(毫秒) |
538539
| `extractMinMessages` | number | `2` | 触发提取所需最少消息数 |
539540
| `extractMaxChars` | number | `8000` | 发送给 LLM 的最大字符数 |
540541

@@ -551,7 +552,7 @@ OpenClaw 默认行为:
551552
{
552553
"embedding": { "apiKey": "${OPENAI_API_KEY}", "model": "text-embedding-3-small" },
553554
"smartExtraction": true,
554-
"llm": { "apiKey": "${OPENAI_API_KEY}", "model": "gpt-4o-mini", "baseURL": "https://api.openai.com/v1" },
555+
"llm": { "apiKey": "${OPENAI_API_KEY}", "model": "gpt-4o-mini", "baseURL": "https://api.openai.com/v1", "timeoutMs": 30000 },
555556
"extractMinMessages": 2,
556557
"extractMaxChars": 8000
557558
}

index.ts

Lines changed: 17 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -131,6 +131,7 @@ interface PluginConfig {
131131
apiKey?: string;
132132
model?: string;
133133
baseURL?: string;
134+
timeoutMs?: number;
134135
};
135136
extractMinMessages?: number;
136137
extractMaxChars?: number;
@@ -211,6 +212,10 @@ function parsePositiveInt(value: unknown): number | undefined {
211212
return undefined;
212213
}
213214

215+
function resolveLlmTimeoutMs(config: PluginConfig): number {
216+
return parsePositiveInt(config.llm?.timeoutMs) ?? 30000;
217+
}
218+
214219
function resolveHookAgentId(
215220
explicitAgentId: string | undefined,
216221
sessionKey: string | undefined,
@@ -1654,12 +1659,13 @@ const memoryLanceDBProPlugin = {
16541659
? resolveEnvVars(config.llm.baseURL)
16551660
: config.embedding.baseURL;
16561661
const llmModel = config.llm?.model || "openai/gpt-oss-120b";
1662+
const llmTimeoutMs = resolveLlmTimeoutMs(config);
16571663

16581664
const llmClient = createLlmClient({
16591665
apiKey: llmApiKey,
16601666
model: llmModel,
16611667
baseURL: llmBaseURL,
1662-
timeoutMs: 30000,
1668+
timeoutMs: llmTimeoutMs,
16631669
log: (msg: string) => api.logger.debug(msg),
16641670
});
16651671

@@ -1681,7 +1687,13 @@ const memoryLanceDBProPlugin = {
16811687
noiseBank,
16821688
});
16831689

1684-
api.logger.info("memory-lancedb-pro: smart extraction enabled (LLM model: " + llmModel + ", noise bank: ON)");
1690+
api.logger.info(
1691+
"memory-lancedb-pro: smart extraction enabled (LLM model: "
1692+
+ llmModel
1693+
+ ", timeoutMs: "
1694+
+ llmTimeoutMs
1695+
+ ", noise bank: ON)",
1696+
);
16851697
} catch (err) {
16861698
api.logger.warn(`memory-lancedb-pro: smart extraction init failed, falling back to regex: ${String(err)}`);
16871699
}
@@ -1971,11 +1983,13 @@ const memoryLanceDBProPlugin = {
19711983
const llmBaseURL = config.llm?.baseURL
19721984
? resolveEnvVars(config.llm.baseURL)
19731985
: config.embedding.baseURL;
1986+
const llmTimeoutMs = resolveLlmTimeoutMs(config);
19741987
return createLlmClient({
19751988
apiKey: llmApiKey,
19761989
model: config.llm?.model || "openai/gpt-oss-120b",
19771990
baseURL: llmBaseURL,
1978-
timeoutMs: 30000,
1991+
timeoutMs: llmTimeoutMs,
1992+
log: (msg: string) => api.logger.debug(msg),
19791993
});
19801994
} catch { return undefined; }
19811995
})() : undefined,

openclaw.plugin.json

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -436,6 +436,11 @@
436436
},
437437
"baseURL": {
438438
"type": "string"
439+
},
440+
"timeoutMs": {
441+
"type": "integer",
442+
"minimum": 1,
443+
"default": 30000
439444
}
440445
}
441446
},
@@ -812,6 +817,12 @@
812817
"placeholder": "https://api.groq.com/openai/v1",
813818
"help": "OpenAI-compatible base URL for LLM (defaults to embedding.baseURL if omitted)",
814819
"advanced": true
820+
},
821+
"llm.timeoutMs": {
822+
"label": "LLM Timeout (ms)",
823+
"placeholder": "30000",
824+
"help": "Request timeout for the smart-extraction / upgrade LLM in milliseconds",
825+
"advanced": true
815826
}
816827
}
817828
}

package.json

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -36,7 +36,7 @@
3636
]
3737
},
3838
"scripts": {
39-
"test": "node test/embedder-error-hints.test.mjs && node test/migrate-legacy-schema.test.mjs && node --test test/config-session-strategy-migration.test.mjs && node --test test/recall-text-cleanup.test.mjs && node test/update-consistency-lancedb.test.mjs && node test/cli-smoke.mjs && node test/functional-e2e.mjs && node test/retriever-rerank-regression.mjs && node test/smart-memory-lifecycle.mjs && node test/smart-extractor-branches.mjs && node test/plugin-manifest-regression.mjs && node --test test/sync-plugin-version.test.mjs && node test/smart-metadata-v2.mjs && node test/vector-search-cosine.test.mjs && node test/context-support-e2e.mjs && node test/temporal-facts.test.mjs && node test/memory-update-supersede.test.mjs && node --test test/workflow-fork-guards.test.mjs",
39+
"test": "node test/embedder-error-hints.test.mjs && node test/migrate-legacy-schema.test.mjs && node --test test/config-session-strategy-migration.test.mjs && node --test test/recall-text-cleanup.test.mjs && node test/update-consistency-lancedb.test.mjs && node test/cli-smoke.mjs && node test/functional-e2e.mjs && node test/retriever-rerank-regression.mjs && node test/smart-memory-lifecycle.mjs && node test/smart-extractor-branches.mjs && node test/plugin-manifest-regression.mjs && node --test test/sync-plugin-version.test.mjs && node test/smart-metadata-v2.mjs && node test/vector-search-cosine.test.mjs && node test/context-support-e2e.mjs && node test/temporal-facts.test.mjs && node test/memory-update-supersede.test.mjs && node test/memory-upgrader-diagnostics.test.mjs && node --test test/workflow-fork-guards.test.mjs",
4040
"test:openclaw-host": "node test/openclaw-host-functional.mjs",
4141
"version": "node scripts/sync-plugin-version.mjs openclaw.plugin.json package.json && git add openclaw.plugin.json"
4242
},

src/llm-client.ts

Lines changed: 128 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -16,6 +16,8 @@ export interface LlmClientConfig {
1616
export interface LlmClient {
1717
/** Send a prompt and parse the JSON response. Returns null on failure. */
1818
completeJson<T>(prompt: string, label?: string): Promise<T | null>;
19+
/** Best-effort diagnostics for the most recent failure, if any. */
20+
getLastError(): string | null;
1921
}
2022

2123
/**
@@ -56,16 +58,108 @@ function previewText(value: string, maxLen = 200): string {
5658
return `${normalized.slice(0, maxLen - 3)}...`;
5759
}
5860

61+
function nextNonWhitespaceChar(text: string, start: number): string | undefined {
62+
for (let i = start; i < text.length; i++) {
63+
const ch = text[i];
64+
if (!/\s/.test(ch)) return ch;
65+
}
66+
return undefined;
67+
}
68+
69+
/**
70+
* Best-effort repair for common LLM JSON issues:
71+
* - unescaped quotes inside string values
72+
* - raw newlines / tabs inside strings
73+
* - trailing commas before } or ]
74+
*/
75+
function repairCommonJson(text: string): string {
76+
let result = "";
77+
let inString = false;
78+
let escaped = false;
79+
80+
for (let i = 0; i < text.length; i++) {
81+
const ch = text[i];
82+
83+
if (escaped) {
84+
result += ch;
85+
escaped = false;
86+
continue;
87+
}
88+
89+
if (inString) {
90+
if (ch === "\\") {
91+
result += ch;
92+
escaped = true;
93+
continue;
94+
}
95+
96+
if (ch === "\"") {
97+
const nextCh = nextNonWhitespaceChar(text, i + 1);
98+
// A string may legally end before object/array delimiters or a key colon.
99+
if (
100+
nextCh === undefined ||
101+
nextCh === "," ||
102+
nextCh === "}" ||
103+
nextCh === "]" ||
104+
nextCh === ":"
105+
) {
106+
result += ch;
107+
inString = false;
108+
} else {
109+
// Treat stray quotes inside a string as literal content.
110+
result += "\\\"";
111+
}
112+
continue;
113+
}
114+
115+
if (ch === "\n") {
116+
result += "\\n";
117+
continue;
118+
}
119+
if (ch === "\r") {
120+
result += "\\r";
121+
continue;
122+
}
123+
if (ch === "\t") {
124+
result += "\\t";
125+
continue;
126+
}
127+
128+
result += ch;
129+
continue;
130+
}
131+
132+
if (ch === "\"") {
133+
result += ch;
134+
inString = true;
135+
continue;
136+
}
137+
138+
if (ch === ",") {
139+
const nextCh = nextNonWhitespaceChar(text, i + 1);
140+
if (nextCh === "}" || nextCh === "]") {
141+
continue;
142+
}
143+
}
144+
145+
result += ch;
146+
}
147+
148+
return result;
149+
}
150+
59151
export function createLlmClient(config: LlmClientConfig): LlmClient {
60152
const client = new OpenAI({
61153
apiKey: config.apiKey,
62154
baseURL: config.baseURL,
63155
timeout: config.timeoutMs ?? 30000,
64156
});
65157
const log = config.log ?? (() => {});
158+
let lastError: string | null = null;
66159

67160
return {
68161
async completeJson<T>(prompt: string, label = "generic"): Promise<T | null> {
162+
lastError = null;
69163
try {
70164
const response = await client.chat.completions.create({
71165
model: config.model,
@@ -82,43 +176,61 @@ export function createLlmClient(config: LlmClientConfig): LlmClient {
82176

83177
const raw = response.choices?.[0]?.message?.content;
84178
if (!raw) {
85-
log(
86-
`memory-lancedb-pro: llm-client [${label}] empty response content from model ${config.model}`,
87-
);
179+
lastError =
180+
`memory-lancedb-pro: llm-client [${label}] empty response content from model ${config.model}`;
181+
log(lastError);
88182
return null;
89183
}
90184
if (typeof raw !== "string") {
91-
log(
92-
`memory-lancedb-pro: llm-client [${label}] non-string response content type=${Array.isArray(raw) ? "array" : typeof raw} from model ${config.model}`,
93-
);
185+
lastError =
186+
`memory-lancedb-pro: llm-client [${label}] non-string response content type=${Array.isArray(raw) ? "array" : typeof raw} from model ${config.model}`;
187+
log(lastError);
94188
return null;
95189
}
96190

97191
const jsonStr = extractJsonFromResponse(raw);
98192
if (!jsonStr) {
99-
log(
100-
`memory-lancedb-pro: llm-client [${label}] no JSON object found (chars=${raw.length}, preview=${JSON.stringify(previewText(raw))})`,
101-
);
193+
lastError =
194+
`memory-lancedb-pro: llm-client [${label}] no JSON object found (chars=${raw.length}, preview=${JSON.stringify(previewText(raw))})`;
195+
log(lastError);
102196
return null;
103197
}
104198

105199
try {
106200
return JSON.parse(jsonStr) as T;
107201
} catch (err) {
108-
log(
109-
`memory-lancedb-pro: llm-client [${label}] JSON.parse failed: ${err instanceof Error ? err.message : String(err)} (jsonChars=${jsonStr.length}, jsonPreview=${JSON.stringify(previewText(jsonStr))})`,
110-
);
202+
const repairedJsonStr = repairCommonJson(jsonStr);
203+
if (repairedJsonStr !== jsonStr) {
204+
try {
205+
const repaired = JSON.parse(repairedJsonStr) as T;
206+
log(
207+
`memory-lancedb-pro: llm-client [${label}] recovered malformed JSON via heuristic repair (jsonChars=${jsonStr.length})`,
208+
);
209+
return repaired;
210+
} catch (repairErr) {
211+
lastError =
212+
`memory-lancedb-pro: llm-client [${label}] JSON.parse failed: ${err instanceof Error ? err.message : String(err)}; repair failed: ${repairErr instanceof Error ? repairErr.message : String(repairErr)} (jsonChars=${jsonStr.length}, jsonPreview=${JSON.stringify(previewText(jsonStr))})`;
213+
log(lastError);
214+
return null;
215+
}
216+
}
217+
lastError =
218+
`memory-lancedb-pro: llm-client [${label}] JSON.parse failed: ${err instanceof Error ? err.message : String(err)} (jsonChars=${jsonStr.length}, jsonPreview=${JSON.stringify(previewText(jsonStr))})`;
219+
log(lastError);
111220
return null;
112221
}
113222
} catch (err) {
114223
// Graceful degradation — return null so caller can fall back
115-
log(
116-
`memory-lancedb-pro: llm-client [${label}] request failed for model ${config.model}: ${err instanceof Error ? err.message : String(err)}`,
117-
);
224+
lastError =
225+
`memory-lancedb-pro: llm-client [${label}] request failed for model ${config.model}: ${err instanceof Error ? err.message : String(err)}`;
226+
log(lastError);
118227
return null;
119228
}
120229
},
230+
getLastError(): string | null {
231+
return lastError;
232+
},
121233
};
122234
}
123235

124-
export { extractJsonFromResponse };
236+
export { extractJsonFromResponse, repairCommonJson };

src/memory-upgrader.ts

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -315,7 +315,8 @@ export class MemoryUpgrader {
315315
}>(prompt);
316316

317317
if (!llmResult) {
318-
throw new Error("LLM returned null");
318+
const detail = this.llm.getLastError();
319+
throw new Error(detail || "LLM returned null");
319320
}
320321

321322
enriched = {

0 commit comments

Comments
 (0)