4 changes: 2 additions & 2 deletions README.md
@@ -13,7 +13,7 @@ A memory layer for AI agents.
- **Dual Interface**: REST API and Model Context Protocol (MCP) server
- **Two-Tier Memory**: Working memory (session-scoped) and long-term memory (persistent)
- **Configurable Memory Strategies**: Customize how memories are extracted (discrete, summary, preferences, custom)
- **Semantic Search**: Vector-based similarity search with metadata filtering
- **Semantic, Keyword & Hybrid Search**: Vector-based similarity, full-text keyword, and combined hybrid search with metadata filtering
- **Flexible Backends**: Pluggable memory vector database factory system
- **Multi-Provider LLM Support**: OpenAI, Anthropic, AWS Bedrock, Ollama, Azure, Gemini via [LiteLLM](https://docs.litellm.ai/)
- **AI Integration**: Automatic topic extraction, entity recognition, and conversation summarization
@@ -268,7 +268,7 @@ See **[LLM Providers](https://redis.github.io/agent-memory-server/llm-providers/
```
Working Memory (Session-scoped) → Long-term Memory (Persistent)
↓ ↓
- Messages - Semantic search
- Messages - Semantic, keyword & hybrid search
- Structured memories - Topic modeling
- Summary of past messages - Entity recognition
- Metadata - Deduplication
23 changes: 19 additions & 4 deletions agent-memory-client/README.md
@@ -165,7 +165,7 @@ working_memory = WorkingMemory(
response = await client.put_working_memory("user-session-123", working_memory)

# Retrieve working memory
memory = await client.get_working_memory("user-session-123")
created, memory = await client.get_or_create_working_memory("user-session-123")

# Convenience method for data storage
await client.set_working_memory_data(
@@ -201,6 +201,21 @@ results = await client.search_long_term_memory(
user_id=UserId(eq="user-123"),
limit=20
)

# Keyword search - exact term matching
results = await client.search_long_term_memory(
text="science fiction",
search_mode="keyword",
limit=20
)

# Hybrid search - combines semantic and keyword matching
results = await client.search_long_term_memory(
text="science fiction",
search_mode="hybrid",
hybrid_alpha=0.7, # 0.0=keyword, 1.0=semantic
limit=20
)
```
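The `hybrid_alpha` dial can be read as a weighting between the two scoring signals. As an illustration only (the server's actual fusion formula is not shown here and may differ), a linear blend matches the documented endpoints of 0.0 = keyword and 1.0 = semantic:

```python
def hybrid_score(semantic_score: float, keyword_score: float, alpha: float = 0.7) -> float:
    """Linearly blend a semantic (vector) score with a keyword (full-text) score.

    alpha=1.0 reduces to pure semantic similarity and alpha=0.0 to pure
    keyword relevance, mirroring the documented ends of hybrid_alpha.
    """
    return alpha * semantic_score + (1.0 - alpha) * keyword_score

# With the default alpha=0.7, semantic similarity dominates the blend.
blended = hybrid_score(semantic_score=0.9, keyword_score=0.4)
print(round(blended, 2))  # 0.75
```

This is a sketch of the parameter's semantics, not the library's scoring code.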

## Enhanced Features
@@ -333,9 +348,9 @@ from agent_memory_client.exceptions import (
)

try:
memory = await client.get_working_memory("nonexistent-session")
except MemoryNotFoundError:
print("Session not found")
created, memory = await client.get_or_create_working_memory("nonexistent-session")
if created:
print("New session created")
except MemoryServerError as e:
print(f"Server error {e.status_code}: {e}")
except MemoryClientError as e:
17 changes: 16 additions & 1 deletion agent-memory-client/agent-memory-client-js/README.md
@@ -90,14 +90,29 @@ await client.createLongTermMemory([
},
]);

// Search with filters
// Search with filters (default: semantic search)
const results = await client.searchLongTermMemory({
text: "science fiction",
topics: new Topics({ any: ["books", "entertainment"] }),
userId: new UserId({ eq: "user-123" }),
limit: 20,
});

// Keyword search - exact term matching
const keywordResults = await client.searchLongTermMemory({
text: "science fiction",
searchMode: "keyword",
limit: 20,
});

// Hybrid search - combines semantic and keyword matching
const hybridResults = await client.searchLongTermMemory({
text: "science fiction",
searchMode: "hybrid",
hybridAlpha: 0.7, // 0.0=keyword, 1.0=semantic
limit: 20,
});

// Get by ID
const memory = await client.getLongTermMemory("memory-id");

14 changes: 7 additions & 7 deletions agent-memory-client/agent_memory_client/client.py
@@ -1386,7 +1386,7 @@ async def handle_tool_calls(client, tool_calls):
"type": "function",
"function": {
"name": "search_memory",
"description": "Search long-term memory for relevant information using semantic vector search. Use this when you need to find previously stored information about the user, such as their preferences, past conversations, or important facts. Examples: 'Find information about user food preferences', 'What did they say about their job?', 'Look for travel preferences'. This searches only long-term memory, not current working memory - use get_working_memory for current session info. IMPORTANT: The result includes 'memories' with an 'id' field; use these IDs when calling edit_long_term_memory or delete_long_term_memories.",
"description": "Search long-term memory for relevant information using semantic, keyword, or hybrid search. Use this when you need to find previously stored information about the user, such as their preferences, past conversations, or important facts. Examples: 'Find information about user food preferences', 'What did they say about their job?', 'Look for travel preferences'. This searches only long-term memory, not current working memory - use get_or_create_working_memory for current session info. IMPORTANT: The result includes 'memories' with an 'id' field; use these IDs when calling edit_long_term_memory or delete_long_term_memories.",
"parameters": {
"type": "object",
"properties": {
@@ -1875,7 +1875,7 @@ def get_update_memory_data_tool_schema(cls) -> ToolSchema:
"type": "function",
"function": {
"name": "update_working_memory_data",
"description": "Store or update structured session data (JSON objects) in working memory. Use this for complex session-specific information that needs to be accessed and modified during the conversation. Examples: Travel itinerary {'destination': 'Paris', 'dates': ['2024-03-15', '2024-03-20']}, project details {'name': 'Website Redesign', 'deadline': '2024-04-01', 'status': 'in_progress'}. Different from add_memory_to_working_memory which stores simple text facts.",
"description": "Store or update structured session data (JSON objects) in working memory. Use this for complex session-specific information that needs to be accessed and modified during the conversation. Examples: Travel itinerary {'destination': 'Paris', 'dates': ['2024-03-15', '2024-03-20']}, project details {'name': 'Website Redesign', 'deadline': '2024-04-01', 'status': 'in_progress'}. Different from lazily_create_long_term_memory which stores simple text facts for later promotion to long-term storage.",
"parameters": {
"type": "object",
"properties": {
@@ -2706,7 +2706,7 @@ async def _resolve_search_memory(self, args: dict[str, Any]) -> dict[str, Any]:
async def _resolve_get_working_memory(
self, session_id: str, namespace: str | None, user_id: str | None = None
) -> dict[str, Any]:
"""Resolve get_working_memory function call."""
"""Resolve get_working_memory (deprecated) function call."""
return await self.get_working_memory_tool(
session_id=session_id,
namespace=namespace,
@@ -2731,7 +2731,7 @@ async def _resolve_add_memory(
namespace: str | None,
user_id: str | None = None,
) -> dict[str, Any]:
"""Resolve add_memory_to_working_memory function call."""
"""Resolve lazily_create_long_term_memory (formerly add_memory_to_working_memory) function call."""
text = args.get("text", "")
if not text:
raise ValueError("Text parameter is required for adding memory")
@@ -2790,11 +2790,11 @@ async def _resolve_get_long_term_memory(
async def _resolve_create_long_term_memory(
self, args: dict[str, Any], namespace: str | None, user_id: str | None = None
) -> dict[str, Any]:
"""Resolve create_long_term_memory function call."""
"""Resolve eagerly_create_long_term_memory (and deprecated create_long_term_memory alias) function call."""
memories_data = args.get("memories")
if not memories_data:
raise ValueError(
"memories parameter is required for create_long_term_memory"
"memories parameter is required for eagerly_create_long_term_memory"
)
Copilot AI commented (Mar 27, 2026): The resolver explicitly supports the deprecated `create_long_term_memory` alias, but the error message only references `eagerly_create_long_term_memory`. This can be confusing when the caller invoked the deprecated name. Consider making the error message function-name-agnostic (e.g., just "memories parameter is required") or mentioning both names.

# Convert dict memories to ClientMemoryRecord objects
@@ -2907,7 +2907,7 @@ async def resolve_function_calls(
# Handle multiple function calls
calls = [
{"name": "search_memory", "arguments": {"query": "user preferences"}},
{"name": "get_working_memory", "arguments": {}},
{"name": "get_or_create_working_memory", "arguments": {}},
]

results = await client.resolve_function_calls(calls, "session123")
@@ -127,7 +127,7 @@ def get_memory_tools(
tool_configs = {
"search_memory": {
"name": "search_memory",
"description": "Search long-term memory for relevant information using semantic search. Use this to recall past conversations, user preferences, or stored facts. Returns memories ranked by relevance with scores.",
"description": "Search long-term memory for relevant information using semantic, keyword, or hybrid search. Use this to recall past conversations, user preferences, or stored facts. Returns memories ranked by relevance with scores.",
"func": _create_search_memory_func(memory_client),
},
"get_or_create_working_memory": {
@@ -224,6 +224,9 @@ def _create_search_memory_func(client: MemoryAPIClient) -> Any:

async def search_memory(
query: str,
search_mode: str = "semantic",
hybrid_alpha: float | None = None,
text_scorer: str | None = None,
topics: list[str] | None = None,
entities: list[str] | None = None,
memory_type: str | None = None,
@@ -234,6 +237,9 @@ async def search_memory(
"""Search long-term memory for relevant information."""
result = await client.search_memory_tool(
query=query,
search_mode=search_mode,
hybrid_alpha=hybrid_alpha,
text_scorer=text_scorer,
topics=topics,
entities=entities,
memory_type=memory_type,
2 changes: 1 addition & 1 deletion docs/README.md
@@ -75,7 +75,7 @@ For contributors and advanced users:

| Feature | REST API | MCP Server | CLI | Documentation |
|---------|----------|------------|-----|---------------|
| **Memory Search** | ✅ `/v1/long-term-memory/search` | ✅ `search_long_term_memory` | ❌ | [REST API](api.md), [MCP](mcp.md) |
| **Memory Search** (semantic, keyword, hybrid) | ✅ `/v1/long-term-memory/search` | ✅ `search_long_term_memory` | ❌ | [REST API](api.md), [MCP](mcp.md) |
| **Memory Editing** | ✅ `PATCH /v1/long-term-memory/{id}` | ✅ `edit_long_term_memory` | ❌ | [Memory Editing](memory-lifecycle.md#memory-editing) |
| **Query Optimization** | ✅ `optimize_query` param | ✅ `optimize_query` param | ❌ | [Query Optimization](query-optimization.md) |
| **Recency Boost** | ✅ Default enabled | ✅ Available | ❌ | [Recency Boost](recency-boost.md) |
4 changes: 2 additions & 2 deletions docs/agent-examples.md
@@ -93,7 +93,7 @@ A comprehensive travel assistant that demonstrates the most complete integration
- **Automatic Tool Discovery**: Uses `MemoryAPIClient.get_all_memory_tool_schemas()` to automatically discover and integrate all available memory tools
- **Unified Tool Resolution**: Leverages `client.resolve_tool_call()` to handle all memory tool calls uniformly across different LLM providers
- **Working Memory Management**: Session-based conversation state and structured memory storage
- **Long-term Memory**: Persistent memory storage and semantic search capabilities
- **Long-term Memory**: Persistent memory storage with semantic, keyword, and hybrid search capabilities
- **Optional Web Search**: Cached web search using Tavily API with Redis caching

### Available Tools
@@ -402,7 +402,7 @@ from agent_memory_client import create_memory_client
client = await create_memory_client(base_url="http://localhost:8000")

# Get only the 3 most recent messages
memory = await client.get_working_memory(
created, memory = await client.get_or_create_working_memory(
session_id="my-session",
namespace="demo",
context_window_max=3
6 changes: 3 additions & 3 deletions docs/index.md
@@ -38,7 +38,7 @@ Transform your AI agents from goldfish 🐠 into elephants 🐘 with Redis-power
Redis Agent Memory Server is a production-ready memory system for AI agents and applications that:

- **🧠 Remembers everything**: Stores conversation history, user preferences, and important facts across sessions
- **🔍 Finds relevant context**: Uses semantic search to surface the right information at the right time
- **🔍 Finds relevant context**: Uses semantic, keyword, and hybrid search to surface the right information at the right time
- **📈 Gets smarter over time**: Automatically extracts, organizes, and deduplicates memories from interactions
- **🔌 Works with any AI model**: REST API and MCP interfaces compatible with OpenAI, Anthropic, and others
- **🌐 Multi-provider support**: Use [100+ LLM providers](llm-providers.md) via LiteLLM (OpenAI, Anthropic, AWS Bedrock, Ollama, Azure, Gemini, and more)
@@ -95,11 +95,11 @@ print(f"Found: {results.memories[0].text}")

!!! success "Long-Term Memory (Persistent)"
- User preferences, facts, and important information
- Semantic search with vector embeddings
- Flexible search: semantic (vector embeddings), keyword (full-text), and hybrid (combined)
- Advanced filtering by time, topics, entities, users

### 🔍 Intelligent Search
- **Semantic similarity**: Find memories by meaning, not just keywords
- **Multiple search modes**: Semantic (vector similarity), keyword (full-text), and hybrid (combined) search
- **Advanced filters**: Search by user, session, time, topics, entities
- **Query optimization**: AI-powered query refinement for better results
- **Recency boost**: Time-aware ranking that surfaces relevant recent information
15 changes: 15 additions & 0 deletions docs/java-sdk.md
@@ -144,6 +144,21 @@ MemoryRecordResults results = client.longTermMemory().searchLongTermMemories(req
// Simple text search
MemoryRecordResults simpleResults = client.longTermMemory()
.searchLongTermMemories("user preferences");

// Keyword search - exact term matching
SearchRequest keywordRequest = SearchRequest.builder()
.text("TechCorp engineer")
.searchMode("keyword")
.limit(10)
.build();

// Hybrid search - combines semantic and keyword matching
SearchRequest hybridRequest = SearchRequest.builder()
.text("user preferences")
.searchMode("hybrid")
.hybridAlpha(0.7) // 0.0=keyword, 1.0=semantic
.limit(10)
.build();
```

### Get, Edit, and Delete
29 changes: 25 additions & 4 deletions docs/long-term-memory.md
@@ -4,14 +4,14 @@ Long-term memory is **persistent**, **cross-session** storage designed for knowl

## Overview

Long-term memory provides persistent storage that survives server restarts and session expiration. It's optimized for semantic search, deduplication, and rich metadata to enable intelligent retrieval of relevant information.
Long-term memory provides persistent storage that survives server restarts and session expiration. It's optimized for semantic, keyword, and hybrid search, deduplication, and rich metadata to enable intelligent retrieval of relevant information.

| Feature | Details |
|---------|---------|
| **Scope** | Cross-session, persistent |
| **Lifespan** | Permanent until manually deleted |
| **Storage** | Redis with vector indexing |
| **Search** | Semantic vector search |
| **Search** | Semantic, keyword, and hybrid search |
| **Capacity** | Unlimited (with compaction) |
| **Use Case** | Knowledge base, user preferences |
| **Indexing** | Vector embeddings + metadata |
Copilot AI commented (Mar 27, 2026): This page now advertises keyword/full-text and hybrid search, but the "Storage" and "Indexing" rows still only mention vector indexing/embeddings. Update these rows to reflect that keyword/hybrid require full-text indexing as well (so the capability description matches the underlying implementation expectations).

@@ -126,17 +126,38 @@ POST /v1/long-term-memory/search

## Search Capabilities

Long-term memory provides powerful search features:
Long-term memory supports three search modes: **semantic** (vector similarity), **keyword** (full-text matching), and **hybrid** (combined).

### Semantic Vector Search
### Semantic Search (Default)
```json
{
"text": "python programming help",
"search_mode": "semantic",
"limit": 10,
"distance_threshold": 0.8
}
```

### Keyword Search
```json
{
"text": "TechCorp engineer",
"search_mode": "keyword",
"limit": 10
}
```

### Hybrid Search
Combines vector similarity with full-text keyword matching. Use `hybrid_alpha` to control the balance (0.0 = pure keyword, 1.0 = pure semantic, default 0.7).
```json
{
"text": "python programming help",
"search_mode": "hybrid",
"hybrid_alpha": 0.7,
"limit": 10
}
```

### Advanced Filtering
```json
{
4 changes: 2 additions & 2 deletions docs/mcp.md
@@ -4,7 +4,7 @@ Agent Memory Server offers an MCP (Model Context Protocol) server interface powe

- **set_working_memory**: Set working memory for a session (like `PUT /v1/working-memory/{session_id}` in the REST API). Stores structured memory records and JSON data in working memory with automatic promotion to long-term storage.
- **create_long_term_memories**: Create long-term memories directly, bypassing working memory. Useful for bulk memory creation.
- **search_long_term_memory**: Perform semantic search across long-term memories with advanced filtering options.
- **search_long_term_memory**: Search across long-term memories using semantic, keyword, or hybrid search modes with advanced filtering options.
- **edit_long_term_memory**: Update existing long-term memories with new or corrected information. Allows partial updates to specific fields while preserving other data.
- **delete_long_term_memories**: Remove specific long-term memories by ID. Useful for cleaning up outdated or incorrect information.
- **get_long_term_memory**: Retrieve specific memories by ID for detailed inspection or verification before editing.
@@ -17,7 +17,7 @@ The MCP server provides the following tools that AI agents can use to manage mem
### Memory Search and Retrieval

**search_long_term_memory**
- Search for memories using semantic similarity
- Search for memories using semantic (vector), keyword (full-text), or hybrid (combined) search
- Supports advanced filtering by user, session, namespace, topics, entities, and timestamps
- Configurable query optimization and recency boost
- Returns ranked results with relevance scores
6 changes: 3 additions & 3 deletions docs/quick-start.md
@@ -178,7 +178,7 @@ await memory_client.create_long_term_memory([

## Step 7: Search Your Memories

Search across all stored memories with semantic similarity:
Search across all stored memories using semantic similarity, keyword matching, or hybrid search:

```python
# Search for work-related information
@@ -331,7 +331,7 @@ You've just worked with both types of memory:
- **Scope**: Cross-session, persistent
- **Lifetime**: Permanent until deleted
- **Use case**: User preferences, facts, knowledge
- **Search**: Semantic vector search with advanced filtering
- **Search**: Semantic, keyword, and hybrid search with advanced filtering

## Next Steps

@@ -537,7 +537,7 @@ redis-cli -h localhost -p 6379

You now have a working AI agent memory system! Your memories will:
- ✅ Persist across sessions
- ✅ Be searchable with semantic similarity
- ✅ Be searchable with semantic, keyword, or hybrid search
- ✅ Automatically extract context from conversations
- ✅ Provide relevant context to AI responses

17 changes: 16 additions & 1 deletion docs/typescript-sdk.md
@@ -106,12 +106,27 @@ import {
MemoryType,
} from "agent-memory-client";

// Basic search
// Basic semantic search (default)
const results = await client.searchLongTermMemory({
text: "user preferences",
limit: 10,
});

// Keyword search - exact term matching
const keywordResults = await client.searchLongTermMemory({
text: "TechCorp engineer",
searchMode: "keyword",
limit: 10,
});

// Hybrid search - combines semantic and keyword matching
const hybridResults = await client.searchLongTermMemory({
text: "user preferences",
searchMode: "hybrid",
hybridAlpha: 0.7, // 0.0=keyword, 1.0=semantic
limit: 10,
});

// With filters
const filtered = await client.searchLongTermMemory({
text: "programming languages",