🐛 Memory error caused by embedding model name containing /

Jasonxia007 · Jasonxia007 · commit e0ddfeae004f · 2025-12-22T17:54:14.000+08:00
diff --git a/backend/utils/memory_utils.py b/backend/utils/memory_utils.py
@@ -29,10 +29,14 @@ def build_memory_config(tenant_id: str) -> Dict[str, Any]:
         raise ValueError("ES_HOST must include scheme, host and port, e.g. http://host:9200")
     es_host = f"{parsed.scheme}://{parsed.hostname}"
     es_port = parsed.port
+    # Normalize repo/name to avoid problematic characters in index names
+    safe_repo = embed_raw["model_repo"].lower().replace(
+        "/", "_") if embed_raw["model_repo"] else ""
+    safe_name = embed_raw["model_name"].lower().replace("/", "_")
     index_name = (
-        f"mem0_{embed_raw['model_repo'].lower()}_{embed_raw['model_name'].lower()}_{embed_raw['max_tokens']}"
+        f"mem0_{safe_repo}_{safe_name}_{embed_raw['max_tokens']}"
         if embed_raw["model_repo"]
-        else f"mem0_{embed_raw['model_name'].lower()}_{embed_raw['max_tokens']}"
+        else f"mem0_{safe_name}_{embed_raw['max_tokens']}"
     )
 
     # 3. Assemble final configuration
diff --git a/frontend/app/[locale]/knowledges/components/document/DocumentChunk.tsx b/frontend/app/[locale]/knowledges/components/document/DocumentChunk.tsx
@@ -781,6 +781,10 @@ const DocumentChunk: React.FC<DocumentChunkProps> = ({
               onChange={handlePaginationChange}
               disabled={loading}
               showQuickJumper
+              locale={{
+                jump_to: t("document.chunk.pagination.jumpTo"),
+                page: t("document.chunk.pagination.page"),
+              }}
               showTotal={(pageTotal, range) =>
                 t("document.chunk.pagination.range", {
                   defaultValue: "{{start}}-{{end}} of {{total}}",
diff --git a/frontend/public/locales/en/common.json b/frontend/public/locales/en/common.json
@@ -583,6 +583,8 @@
   "document.chunk.search.document": "Docs",
   "document.chunk.search.chunk": "Chunk",
   "document.chunk.pagination.range": "{{start}}-{{end}} of {{total}}",
+  "document.chunk.pagination.jumpTo": "Go to",
+  "document.chunk.pagination.page": "Page",
 
   "model.dialog.title": "Add Model",
   "model.dialog.label.type": "Model Type",
diff --git a/frontend/public/locales/zh/common.json b/frontend/public/locales/zh/common.json
@@ -584,6 +584,8 @@
   "document.chunk.search.document": "文档",
   "document.chunk.search.chunk": "分片",
   "document.chunk.pagination.range": "{{start}}-{{end}} / 共 {{total}}",
+  "document.chunk.pagination.jumpTo": "跳转到",
+  "document.chunk.pagination.page": "页",
 
   "model.dialog.title": "添加模型",
   "model.dialog.label.type": "模型类型",
diff --git a/test/backend/utils/test_memory_utils.py b/test/backend/utils/test_memory_utils.py
@@ -318,6 +318,36 @@ def test_build_memory_config_with_custom_port(self):
             self.assertEqual(result["vector_store"]["config"]
                              ["collection_name"], "mem0_openai_test-embed_1536")
 
+    def test_build_memory_config_sanitizes_slashes_in_repo_and_name(self):
+        """Slash characters in repo/name are replaced with underscores in collection name"""
+        mock_tenant_config_manager = MagicMock()
+        mock_tenant_config_manager.get_model_config.side_effect = [
+            {"model_name": "gpt-4", "model_repo": "azure/openai", "base_url": "https://api.example.com/v1", "api_key": "llm-key"},
+            {"model_name": "text-embed/ada-002", "model_repo": "azure/openai", "base_url": "https://api.example.com/v1", "api_key": "embed-key", "max_tokens": 1536}
+        ]
+
+        mock_const = MagicMock()
+        mock_const.ES_HOST = "http://localhost:9200"
+        mock_const.ES_API_KEY = "test-es-key"
+        mock_const.ES_USERNAME = "elastic"
+        mock_const.ES_PASSWORD = "test-password"
+
+        model_mapping = {"llm": "llm", "embedding": "embedding"}
+        mock_get_model_name = MagicMock()
+        mock_get_model_name.side_effect = ["azure/openai/gpt-4", "azure/openai/text-embed/ada-002"]
+
+        with patch('backend.utils.memory_utils.tenant_config_manager', mock_tenant_config_manager), \
+            patch('backend.utils.memory_utils._c', mock_const), \
+                patch('backend.utils.memory_utils.get_model_name_from_config', mock_get_model_name), \
+                patch('backend.utils.memory_utils.MODEL_CONFIG_MAPPING', model_mapping):
+
+            result = self.build_memory_config("tenant-with-slash")
+
+            self.assertEqual(
+                result["vector_store"]["config"]["collection_name"],
+                "mem0_azure_openai_text-embed_ada-002_1536",
+            )
+
     def test_build_memory_config_with_empty_model_repo(self):
         """Empty model_repo yields collection name without repo segment"""
         mock_tenant_config_manager = MagicMock()