brianf-aws
diff --git a/‎common/src/main/java/org/opensearch/ml/common/memorycontainer/MLMemory.java‎
Lines changed: 269 additions & 0 deletions b/‎common/src/main/java/org/opensearch/ml/common/memorycontainer/MLMemory.java‎
Lines changed: 269 additions & 0 deletions
diff --git a/‎common/src/main/java/org/opensearch/ml/common/memorycontainer/MemoryContainerConstants.java‎
Lines changed: 24 additions & 0 deletions b/‎common/src/main/java/org/opensearch/ml/common/memorycontainer/MemoryContainerConstants.java‎
Lines changed: 24 additions & 0 deletions
@@ -0,0 +1,269 @@
+/*
+ * Copyright OpenSearch Contributors
+ * SPDX-License-Identifier: Apache-2.0
+ */
+
+package org.opensearch.ml.common.memorycontainer;
+
+import static org.opensearch.core.xcontent.XContentParserUtils.ensureExpectedToken;
+import static org.opensearch.ml.common.memorycontainer.MemoryContainerConstants.AGENT_ID_FIELD;
+import static org.opensearch.ml.common.memorycontainer.MemoryContainerConstants.CREATED_TIME_FIELD;
+import static org.opensearch.ml.common.memorycontainer.MemoryContainerConstants.LAST_UPDATED_TIME_FIELD;
+import static org.opensearch.ml.common.memorycontainer.MemoryContainerConstants.MEMORY_EMBEDDING_FIELD;
+import static org.opensearch.ml.common.memorycontainer.MemoryContainerConstants.MEMORY_FIELD;
+import static org.opensearch.ml.common.memorycontainer.MemoryContainerConstants.MEMORY_TYPE_FIELD;
+import static org.opensearch.ml.common.memorycontainer.MemoryContainerConstants.ROLE_FIELD;
+import static org.opensearch.ml.common.memorycontainer.MemoryContainerConstants.SESSION_ID_FIELD;
+import static org.opensearch.ml.common.memorycontainer.MemoryContainerConstants.TAGS_FIELD;
+import static org.opensearch.ml.common.memorycontainer.MemoryContainerConstants.USER_ID_FIELD;
+
+import java.io.IOException;
+import java.time.Instant;
+import java.util.HashMap;
+import java.util.Map;
+
+import org.opensearch.core.common.io.stream.StreamInput;
+import org.opensearch.core.common.io.stream.StreamOutput;
+import org.opensearch.core.common.io.stream.Writeable;
+import org.opensearch.core.xcontent.ToXContentObject;
+import org.opensearch.core.xcontent.XContentBuilder;
+import org.opensearch.core.xcontent.XContentParser;
+
+import lombok.Builder;
+import lombok.Getter;
+import lombok.Setter;
+
+/**
+ * A single memory entry stored in a memory container.
+ *
+ * <p>An instance can be rendered three ways: over the transport stream ({@link #writeTo}),
+ * as XContent ({@link #toXContent}) and as a plain map for indexing ({@link #toIndexMap}).
+ * {@code memoryEmbedding} is carried by the XContent and map forms only; it is not part of
+ * the stream format.
+ *
+ * <p>{@link #parse} performs no validation, so it may return an instance whose
+ * {@code memoryType}, {@code createdTime} or {@code lastUpdatedTime} is {@code null}. The
+ * serializers dereference those fields unconditionally, so callers must populate them
+ * before serializing.
+ */
+@Getter
+@Setter
+@Builder
+public class MLMemory implements ToXContentObject, Writeable {
+
+    // Core fields
+    private String sessionId;
+    private String memory;
+    private MemoryType memoryType;
+
+    // Optional fields
+    private String userId;
+    private String agentId;
+    private String role;
+    private Map<String, String> tags;
+
+    // System fields
+    private Instant createdTime;
+    private Instant lastUpdatedTime;
+
+    // Vector/embedding field (optional, for semantic storage)
+    private Object memoryEmbedding;
+
+    /**
+     * Creates a memory entry from explicit field values; no value is validated or copied.
+     *
+     * @param sessionId       session the memory belongs to
+     * @param memory          memory text
+     * @param memoryType      type of the memory
+     * @param userId          optional user id
+     * @param agentId         optional agent id
+     * @param role            optional role
+     * @param tags            optional tags; the map reference is stored as given
+     * @param createdTime     creation timestamp
+     * @param lastUpdatedTime last update timestamp
+     * @param memoryEmbedding optional embedding (array-like or map-like), stored as given
+     */
+    @Builder
+    public MLMemory(
+        String sessionId,
+        String memory,
+        MemoryType memoryType,
+        String userId,
+        String agentId,
+        String role,
+        Map<String, String> tags,
+        Instant createdTime,
+        Instant lastUpdatedTime,
+        Object memoryEmbedding
+    ) {
+        this.sessionId = sessionId;
+        this.memory = memory;
+        this.memoryType = memoryType;
+        this.userId = userId;
+        this.agentId = agentId;
+        this.role = role;
+        this.tags = tags;
+        this.createdTime = createdTime;
+        this.lastUpdatedTime = lastUpdatedTime;
+        this.memoryEmbedding = memoryEmbedding;
+    }
+
+    /**
+     * Reads a memory entry from the transport stream, in the field order used by
+     * {@link #writeTo(StreamOutput)}.
+     *
+     * @param in stream positioned at a serialized entry
+     * @throws IOException if reading from the stream fails
+     */
+    public MLMemory(StreamInput in) throws IOException {
+        this.sessionId = in.readString();
+        this.memory = in.readString();
+        this.memoryType = in.readEnum(MemoryType.class);
+        this.userId = in.readOptionalString();
+        this.agentId = in.readOptionalString();
+        this.role = in.readOptionalString();
+        // A leading boolean says whether a tags map follows; when absent, tags stays null
+        if (in.readBoolean()) {
+            this.tags = in.readMap(StreamInput::readString, StreamInput::readString);
+        }
+        this.createdTime = in.readInstant();
+        this.lastUpdatedTime = in.readInstant();
+        // Note: memoryEmbedding is not serialized in StreamInput/Output as it's typically handled separately
+    }
+
+    /**
+     * Writes this entry to the transport stream.
+     *
+     * <p>{@code sessionId}, {@code memory}, {@code memoryType}, {@code createdTime} and
+     * {@code lastUpdatedTime} are written with the non-optional writers. A null or empty
+     * tags map is written as "absent", so an empty map is read back as {@code null}.
+     *
+     * @param out destination stream
+     * @throws IOException if writing to the stream fails
+     */
+    @Override
+    public void writeTo(StreamOutput out) throws IOException {
+        out.writeString(sessionId);
+        out.writeString(memory);
+        out.writeEnum(memoryType);
+        out.writeOptionalString(userId);
+        out.writeOptionalString(agentId);
+        out.writeOptionalString(role);
+        if (tags != null && !tags.isEmpty()) {
+            out.writeBoolean(true);
+            out.writeMap(tags, StreamOutput::writeString, StreamOutput::writeString);
+        } else {
+            out.writeBoolean(false);
+        }
+        out.writeInstant(createdTime);
+        out.writeInstant(lastUpdatedTime);
+        // Note: memoryEmbedding is not serialized in StreamInput/Output as it's typically handled separately
+    }
+
+    /**
+     * Renders this entry as one XContent object.
+     *
+     * <p>Optional fields are emitted only when set (tags only when non-empty); timestamps
+     * are emitted as epoch milliseconds. {@code memoryType}, {@code createdTime} and
+     * {@code lastUpdatedTime} must be non-null.
+     *
+     * @param builder builder to write into
+     * @param params  rendering parameters (not consulted here)
+     * @return the same builder, for chaining
+     * @throws IOException if the builder fails to write
+     */
+    @Override
+    public XContentBuilder toXContent(XContentBuilder builder, Params params) throws IOException {
+        builder.startObject();
+        builder.field(SESSION_ID_FIELD, sessionId);
+        builder.field(MEMORY_FIELD, memory);
+        builder.field(MEMORY_TYPE_FIELD, memoryType.getValue());
+
+        if (userId != null) {
+            builder.field(USER_ID_FIELD, userId);
+        }
+        if (agentId != null) {
+            builder.field(AGENT_ID_FIELD, agentId);
+        }
+        if (role != null) {
+            builder.field(ROLE_FIELD, role);
+        }
+        if (tags != null && !tags.isEmpty()) {
+            builder.field(TAGS_FIELD, tags);
+        }
+
+        builder.field(CREATED_TIME_FIELD, createdTime.toEpochMilli());
+        builder.field(LAST_UPDATED_TIME_FIELD, lastUpdatedTime.toEpochMilli());
+
+        if (memoryEmbedding != null) {
+            builder.field(MEMORY_EMBEDDING_FIELD, memoryEmbedding);
+        }
+
+        builder.endObject();
+        return builder;
+    }
+
+    /**
+     * Parses a memory entry from XContent. The parser must be positioned on the object's
+     * START_OBJECT token.
+     *
+     * <p>Unknown fields are skipped. Fields missing from the input stay {@code null}; no
+     * required-field validation is performed here. Tag values are converted with
+     * {@code toString()} and tags whose value is null are dropped.
+     *
+     * @param parser parser positioned at the start of the object
+     * @return the parsed entry
+     * @throws IOException if the underlying parser fails
+     */
+    public static MLMemory parse(XContentParser parser) throws IOException {
+        String sessionId = null;
+        String memory = null;
+        MemoryType memoryType = null;
+        String userId = null;
+        String agentId = null;
+        String role = null;
+        Map<String, String> tags = null;
+        Instant createdTime = null;
+        Instant lastUpdatedTime = null;
+        Object memoryEmbedding = null;
+
+        ensureExpectedToken(XContentParser.Token.START_OBJECT, parser.currentToken(), parser);
+        while (parser.nextToken() != XContentParser.Token.END_OBJECT) {
+            String fieldName = parser.currentName();
+            parser.nextToken();
+
+            switch (fieldName) {
+                case SESSION_ID_FIELD:
+                    sessionId = parser.text();
+                    break;
+                case MEMORY_FIELD:
+                    memory = parser.text();
+                    break;
+                case MEMORY_TYPE_FIELD:
+                    memoryType = MemoryType.fromString(parser.text());
+                    break;
+                case USER_ID_FIELD:
+                    userId = parser.text();
+                    break;
+                case AGENT_ID_FIELD:
+                    agentId = parser.text();
+                    break;
+                case ROLE_FIELD:
+                    role = parser.text();
+                    break;
+                case TAGS_FIELD:
+                    Map<String, Object> tagsMap = parser.map();
+                    if (tagsMap != null) {
+                        tags = new HashMap<>();
+                        for (Map.Entry<String, Object> entry : tagsMap.entrySet()) {
+                            if (entry.getValue() != null) {
+                                tags.put(entry.getKey(), entry.getValue().toString());
+                            }
+                        }
+                    }
+                    break;
+                case CREATED_TIME_FIELD:
+                    createdTime = Instant.ofEpochMilli(parser.longValue());
+                    break;
+                case LAST_UPDATED_TIME_FIELD:
+                    lastUpdatedTime = Instant.ofEpochMilli(parser.longValue());
+                    break;
+                case MEMORY_EMBEDDING_FIELD:
+                    // The embedding may be an array (dense vector) or an object (sparse map).
+                    // map() only handles the object form, so pick the reader from the token.
+                    XContentParser.Token embeddingToken = parser.currentToken();
+                    if (embeddingToken == XContentParser.Token.START_ARRAY) {
+                        memoryEmbedding = parser.list();
+                    } else if (embeddingToken == XContentParser.Token.START_OBJECT) {
+                        memoryEmbedding = parser.map();
+                    } else {
+                        // Scalar or null: nothing usable as an embedding
+                        parser.skipChildren();
+                    }
+                    break;
+                default:
+                    parser.skipChildren();
+                    break;
+            }
+        }
+
+        return MLMemory
+            .builder()
+            .sessionId(sessionId)
+            .memory(memory)
+            .memoryType(memoryType)
+            .userId(userId)
+            .agentId(agentId)
+            .role(role)
+            .tags(tags)
+            .createdTime(createdTime)
+            .lastUpdatedTime(lastUpdatedTime)
+            .memoryEmbedding(memoryEmbedding)
+            .build();
+    }
+
+    /**
+     * Converts this entry to a mutable map for indexing, using the same field names and
+     * the same inclusion rules as {@link #toXContent}.
+     *
+     * <p>{@code memoryType}, {@code createdTime} and {@code lastUpdatedTime} must be
+     * non-null; optional fields are added only when set (tags only when non-empty).
+     *
+     * @return a new {@link HashMap} owned by the caller
+     */
+    public Map<String, Object> toIndexMap() {
+        // Fill one mutable map directly instead of copying an immutable Map.of(...) snapshot
+        Map<String, Object> result = new HashMap<>();
+        result.put(SESSION_ID_FIELD, sessionId);
+        result.put(MEMORY_FIELD, memory);
+        result.put(MEMORY_TYPE_FIELD, memoryType.getValue());
+        result.put(CREATED_TIME_FIELD, createdTime.toEpochMilli());
+        result.put(LAST_UPDATED_TIME_FIELD, lastUpdatedTime.toEpochMilli());
+
+        if (userId != null) {
+            result.put(USER_ID_FIELD, userId);
+        }
+        if (agentId != null) {
+            result.put(AGENT_ID_FIELD, agentId);
+        }
+        if (role != null) {
+            result.put(ROLE_FIELD, role);
+        }
+        if (tags != null && !tags.isEmpty()) {
+            result.put(TAGS_FIELD, tags);
+        }
+        if (memoryEmbedding != null) {
+            result.put(MEMORY_EMBEDDING_FIELD, memoryEmbedding);
+        }
+
+        return result;
+    }
+}
@@ -52,6 +52,8 @@ public class MemoryContainerConstants {
     public static final String MESSAGES_FIELD = "messages";
     public static final String CONTENT_FIELD = "content";
     public static final String INFER_FIELD = "infer";
+    public static final String QUERY_FIELD = "query";
+    public static final String TEXT_FIELD = "text";
 
     // KNN index settings
     public static final String KNN_ENGINE = "lucene";
@@ -65,7 +67,11 @@ public class MemoryContainerConstants {
     public static final String BASE_MEMORY_CONTAINERS_PATH = "/_plugins/_ml/memory_containers";
     public static final String CREATE_MEMORY_CONTAINER_PATH = BASE_MEMORY_CONTAINERS_PATH + "/_create";
     public static final String PARAMETER_MEMORY_CONTAINER_ID = "memory_container_id";
+    public static final String PARAMETER_MEMORY_ID = "memory_id";
     public static final String MEMORIES_PATH = BASE_MEMORY_CONTAINERS_PATH + "/{" + PARAMETER_MEMORY_CONTAINER_ID + "}/memories";
+    public static final String SEARCH_MEMORIES_PATH = MEMORIES_PATH + "/_search";
+    public static final String DELETE_MEMORY_PATH = MEMORIES_PATH + "/{" + PARAMETER_MEMORY_ID + "}";
+    public static final String UPDATE_MEMORY_PATH = MEMORIES_PATH + "/{" + PARAMETER_MEMORY_ID + "}"; // same template as DELETE_MEMORY_PATH; presumably told apart by HTTP method - confirm in the REST handlers
 
     // Memory types are defined in MemoryType enum
 
@@ -89,4 +95,22 @@ public class MemoryContainerConstants {
     public static final String EMBEDDING_MODEL_NOT_FOUND_ERROR = "Embedding model with ID %s not found";
     public static final String EMBEDDING_MODEL_TYPE_MISMATCH_ERROR = "Embedding model must be of type %s or REMOTE, found: %s";                                                                                                          // instead
     public static final String INFER_REQUIRES_LLM_MODEL_ERROR = "infer=true requires llm_model_id to be configured in memory storage";
+
+    // Memory API limits
+    public static final int MAX_MESSAGES_PER_REQUEST = 10;
+    // Derived from MAX_MESSAGES_PER_REQUEST so the text cannot drift from the enforced limit
+    public static final String MAX_MESSAGES_EXCEEDED_ERROR = "Cannot process more than "
+        + MAX_MESSAGES_PER_REQUEST
+        + " messages in a single request";
+
+    // Memory decision fields: the JSON keys that DEFAULT_UPDATE_MEMORY_PROMPT names in its input/output examples
+    public static final String MEMORY_DECISION_FIELD = "memory_decision";
+    public static final String OLD_MEMORY_FIELD = "old_memory";
+    public static final String RETRIEVED_FACTS_FIELD = "retrieved_facts";
+    public static final String EVENT_FIELD = "event";
+    public static final String SCORE_FIELD = "score";
+
+    // LLM system prompts; each instructs the model to reply with a JSON object only ("facts" / "memory_decision")
+    public static final String PERSONAL_INFORMATION_ORGANIZER_PROMPT =
+        "<system_prompt>\n<role>Personal Information Organizer</role>\n<objective>Extract and organize personal information shared within conversations.</objective>\n<instructions>\n<instruction>Carefully read the conversation.</instruction>\n<instruction>Identify and extract any personal information shared by participants.</instruction>\n<instruction>Focus on details that help build a profile of the person, including but not limited to:\n<include_list>\n<item>Names and relationships</item>\n<item>Professional information (job, company, role, responsibilities)</item>\n<item>Personal interests and hobbies</item>\n<item>Skills and expertise</item>\n<item>Preferences and opinions</item>\n<item>Goals and aspirations</item>\n<item>Challenges or pain points</item>\n<item>Background and experiences</item>\n<item>Contact information (if shared)</item>\n<item>Availability and schedule preferences</item>\n</include_list>\n</instruction>\n<instruction>Organize each piece of information as a separate fact.</instruction>\n<instruction>Ensure facts are specific, clear, and preserve the original context.</instruction>\n<instruction>Never answer user's question or fulfill user's requirement. You are a personal information manager, not a helpful assistant.</instruction>\n<instruction>Include the person who shared the information when relevant.</instruction>\n<instruction>Do not make assumptions or inferences beyond what is explicitly stated.</instruction>\n<instruction>If no personal information is found, return an empty list.</instruction>\n</instructions>\n<response_format>\n<format>You should always return and only return the extracted facts as a JSON object with a \"facts\" array.</format>\n<example>\n{\n  \"facts\": [\n    \"User's name is John Smith\",\n    \"John works as a software engineer at TechCorp\",\n    \"John enjoys hiking on weekends\",\n    \"John is looking to improve his Python skills\"\n  ]\n}\n</example>\n</response_format>\n</system_prompt>";
+
+    // System prompt asking the LLM to reconcile old_memory with retrieved_facts into ADD/UPDATE/DELETE/NONE decisions.
+    // The literal must stay on a single line: a raw line break inside it leaves the string unterminated.
+    public static final String DEFAULT_UPDATE_MEMORY_PROMPT =
+        "<system_prompt><role>You are a smart memory manager which controls the memory of a system.</role><task>You will receive: 1. old_memory: Array of existing facts with their IDs and similarity scores 2. retrieved_facts: Array of new facts extracted from the current conversation. Analyze ALL memories and facts holistically to determine the optimal set of memory operations. Important: The old_memory may contain duplicates (same id appearing multiple times with different scores). Consider the highest score for each unique ID. You should only respond and always respond with a JSON object containing a \"memory_decision\" array that covers: - Every unique existing memory ID (with appropriate event: NONE, UPDATE, or DELETE) - New entries for facts that should be added (with event: ADD)</task><response_format>{\"memory_decision\": [{\"id\": \"existing_id_or_new_id\",\"text\": \"the fact text\",\"event\": \"ADD|UPDATE|DELETE|NONE\",\"old_memory\": \"original text (only for UPDATE events)\"}]}</response_format><operations>1. **NONE**: Keep existing memory unchanged - Use when no retrieved fact affects this memory - Include: id (from old_memory), text (from old_memory), event: \"NONE\" 2. **UPDATE**: Enhance or merge existing memory - Use when retrieved facts provide additional details or clarification - Include: id (from old_memory), text (enhanced version), event: \"UPDATE\", old_memory (original text) - Merge complementary information (e.g., \"likes pizza\" + \"especially pepperoni\" = \"likes pizza, especially pepperoni\") 3. **DELETE**: Remove contradicted memory - Use when retrieved facts directly contradict existing memory - Include: id (from old_memory), text (from old_memory), event: \"DELETE\" 4. **ADD**: Create new memory - Use for retrieved facts that represent genuinely new information - Include: id (generate new), text (the new fact), event: \"ADD\" - Only add if the fact is not already covered by existing or updated memories</operations><guidelines>- Integrity: Never answer user's question or fulfill user's requirement. You are a smart memory manager, not a helpful assistant. - Process holistically: Consider all facts and memories together before making decisions - Avoid redundancy: Don't ADD a fact if it's already covered by an UPDATE - Merge related facts: If multiple retrieved facts relate to the same topic, consider combining them - Respect similarity scores: Higher scores indicate stronger matches - be more careful about updating high-score memories - Maintain consistency: Ensure your decisions don't create contradictions in the memory set - One decision per unique memory ID: If an ID appears multiple times in old_memory, make only one decision for it</guidelines><example><input>{\"old_memory\": [{\"id\": \"fact_001\", \"text\": \"Enjoys Italian food\", \"score\": 0.85},{\"id\": \"fact_002\", \"text\": \"Works at Google\", \"score\": 0.92},{\"id\": \"fact_001\", \"text\": \"Enjoys Italian food\", \"score\": 0.75},{\"id\": \"fact_003\", \"text\": \"Has a dog\", \"score\": 0.65}],\"retrieved_facts\": [\"Loves pasta and pizza\",\"Recently joined Amazon\",\"Has two dogs named Max and Bella\"]}</input><output>{\"memory_decision\": [{\"id\": \"fact_001\",\"text\": \"Loves Italian food, especially pasta and pizza\",\"event\": \"UPDATE\",\"old_memory\": \"Enjoys Italian food\"},{\"id\": \"fact_002\",\"text\": \"Works at Google\",\"event\": \"DELETE\"},{\"id\": \"fact_003\",\"text\": \"Has two dogs named Max and Bella\",\"event\": \"UPDATE\",\"old_memory\": \"Has a dog\"},{\"id\": \"fact_004\",\"text\": \"Recently joined Amazon\",\"event\": \"ADD\"}]}</output></example></system_prompt>";
 }