Fix: Ensure consistent response format for PER agent (#4110) (#4117)

opensearch-trigger-bot[bot] · pyek-bot · web-flow · commit ccf9d6b4803a · 2025-08-13T19:05:35.000-07:00
(cherry picked from commit 1f28c21) Co-authored-by: Pavan Yekbote <pybot@amazon.com>
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/agent/MLPlanExecuteAndReflectAgentRunner.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/agent/MLPlanExecuteAndReflectAgentRunner.java
@@ -610,15 +610,15 @@ String extractJsonFromMarkdown(String response) {
     @VisibleForTesting
     void addToolsToPrompt(Map<String, Tool> tools, Map<String, String> allParams) {
         StringBuilder toolsPrompt = new StringBuilder(
-            "In this environment, the executor agent only has access to the below tools. You must choose from only the following tools — no other tools are available. Do not use tools not listed here. \n"
+            "In this environment, you have access to the tools listed below. Use these tools to create your plan, and do not reference or use any tools not listed here.\n"
         );
         int toolNumber = 0;
         for (Map.Entry<String, Tool> entry : tools.entrySet()) {
             String toolName = entry.getKey();
             String toolDescription = entry.getValue().getDescription();
             toolsPrompt.append(String.format("Tool %d - %s: %s\n\n", ++toolNumber, toolName, toolDescription));
         }
-        toolsPrompt.append("No other tools are available. Do not invent tools.\n\n");
+        toolsPrompt.append("No other tools are available. Do not invent tools. Only use tools to create the plan.\n\n");
         allParams.put(DEFAULT_PROMPT_TOOLS_FIELD, toolsPrompt.toString());
         populatePrompt(allParams);
         cleanUpResource(tools);
@@ -677,25 +677,20 @@ static List<ModelTensors> createModelTensors(
         String reactParentInteractionId
     ) {
         List<ModelTensors> modelTensors = new ArrayList<>();
-        modelTensors
-            .add(
-                ModelTensors
-                    .builder()
-                    .mlModelTensors(
-                        List
-                            .of(
-                                ModelTensor.builder().name(MLAgentExecutor.MEMORY_ID).result(sessionId).build(),
-                                ModelTensor.builder().name(MLAgentExecutor.PARENT_INTERACTION_ID).result(parentInteractionId).build(),
-                                ModelTensor.builder().name(EXECUTOR_AGENT_MEMORY_ID_FIELD).result(reactAgentMemoryId).build(),
-                                ModelTensor
-                                    .builder()
-                                    .name(EXECUTOR_AGENT_PARENT_INTERACTION_ID_FIELD)
-                                    .result(reactParentInteractionId)
-                                    .build()
-                            )
-                    )
-                    .build()
-            );
+        List<ModelTensor> tensors = new ArrayList<>();
+
+        tensors.add(ModelTensor.builder().name(MLAgentExecutor.MEMORY_ID).result(sessionId).build());
+        tensors.add(ModelTensor.builder().name(MLAgentExecutor.PARENT_INTERACTION_ID).result(parentInteractionId).build());
+
+        if (reactAgentMemoryId != null && !reactAgentMemoryId.isEmpty()) {
+            tensors.add(ModelTensor.builder().name(EXECUTOR_AGENT_MEMORY_ID_FIELD).result(reactAgentMemoryId).build());
+        }
+
+        if (reactParentInteractionId != null && !reactParentInteractionId.isEmpty()) {
+            tensors.add(ModelTensor.builder().name(EXECUTOR_AGENT_PARENT_INTERACTION_ID_FIELD).result(reactParentInteractionId).build());
+        }
+
+        modelTensors.add(ModelTensors.builder().mlModelTensors(tensors).build());
         return modelTensors;
     }
 
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/agent/PromptTemplate.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/agent/PromptTemplate.java
@@ -30,7 +30,7 @@ public class PromptTemplate {
         + "} \n"
         + "Objective: ${parameters."
         + USER_PROMPT_FIELD
-        + "} \n\n";
+        + "} \n\nRemember: Respond only in JSON format following the required schema.";
 
     public static final String DEFAULT_REFLECT_PROMPT_TEMPLATE = "${parameters."
         + DEFAULT_PROMPT_TOOLS_FIELD
@@ -49,7 +49,7 @@ public class PromptTemplate {
         + "}] \n\n"
         + "${parameters."
         + REFLECT_PROMPT_FIELD
-        + "} \n\n.";
+        + "} \n\n.Remember: Respond only in JSON format following the required schema.";
 
     public static final String DEFAULT_PLANNER_WITH_HISTORY_PROMPT_TEMPLATE = "${parameters."
         + DEFAULT_PROMPT_TOOLS_FIELD
@@ -62,27 +62,23 @@ public class PromptTemplate {
         + "}``` \n\n"
         + "You have currently executed the following steps: \n[${parameters."
         + COMPLETED_STEPS_FIELD
-        + "}] \n\n";
+        + "}] \n\nRemember: Respond only in JSON format following the required schema.";
 
-    // modify these -- ensure that it breaks down steps simpler
     public static final String DEFAULT_PLANNER_PROMPT =
-        "For the given objective, generate a step-by-step plan composed of simple, self-contained tasks. The final step should directly yield the final answer. Avoid unnecessary steps.";
+        "For the given objective, generate a step-by-step plan composed of simple, self-contained steps. The final step should directly yield the final answer. Avoid unnecessary steps.";
 
-    // modify these -- update your plan based on completed steps
     public static final String DEFAULT_REFLECT_PROMPT =
-        "Update your plan based on the latest results. If the task is complete, return the final answer. Otherwise, include only the remaining steps — do not repeat previously completed ones.";
+        "Update your plan based on the latest step results. If the task is complete, return the final answer. Otherwise, include only the remaining steps. Do not repeat previously completed steps.";
 
     public static final String FINAL_RESULT_RESPONSE_INSTRUCTIONS =
         """
-            When you deliver your final result, include a comprehensive report. This report must:
-
-            1. List every analysis or step you performed.
-            2. Summarize the inputs, methods, tools, and data used at each step.
-            3. Include key findings from all intermediate steps — do NOT omit them.
-            4. Clearly explain how the steps led to your final conclusion. Only mention the completed steps.
-            5. Return the full analysis and conclusion in the 'result' field, even if some of this was mentioned earlier.
-
-            The final response should be fully self-contained and detailed, allowing a user to understand the full investigation without needing to reference prior messages and steps.
+                When you deliver your final result, include a comprehensive report. This report must:
+                1. List every analysis or step you performed.
+                2. Summarize the inputs, methods, tools, and data used at each step.
+                3. Include key findings from all intermediate steps — do NOT omit them.
+                4. Clearly explain how the steps led to your final conclusion. Only mention the completed steps.
+                5. Return the full analysis and conclusion in the 'result' field, even if some of this was mentioned earlier. Ensure that special characters are escaped in the 'result' field.
+                6. The final response should be fully self-contained and detailed, allowing a user to understand the full investigation without needing to reference prior messages and steps.
             """;
 
     public static final String PLAN_EXECUTE_REFLECT_RESPONSE_FORMAT = "Response Instructions: \n"
@@ -93,7 +89,7 @@ public class PromptTemplate {
         + "\t\"result\": string \n"
         + "}\n"
         + "Use \"steps\" to return an array of strings where each string is a step to complete the objective, leave it empty if you know the final result. Please wrap each step in quotes and escape any special characters within the string. \n"
-        + "Use \"result\" return the final response when you have enough information, leave it empty if you want to execute more steps \n"
+        + "Use \"result\" return the final response when you have enough information, leave it empty if you want to execute more steps. Please escape any special characters within the result. \n"
         + "Here are examples of valid responses following the required JSON schema:\n\n"
         + "Example 1 - When you need to execute steps:\n"
         + "{\n"
@@ -103,7 +99,7 @@ public class PromptTemplate {
         + "Example 2 - When you have the final result:\n"
         + "{\n"
         + "\t\"steps\": [],\n"
-        + "\t\"result\": \"This is an example result\"\n"
+        + "\t\"result\": \"This is an example result\\n with escaped special characters\"\n"
         + "}\n"
         + "Important rules for the response:\n"
         + "1. Do not use commas within individual steps \n"
@@ -112,67 +108,36 @@ public class PromptTemplate {
 
     public static final String PLANNER_RESPONSIBILITY =
         """
-            You are a thoughtful and analytical agent working as the `Planner & Reflector Agent` in a Plan–Execute–Reflect framework. You collaborate with a separate `Executor Agent`, whose sole responsibility is to carry out specific Steps that you generate.
-
-            ## Core Responsibilities
-            - Receive a high-level objective or user goal and generate a clear, ordered sequence of simple executable Steps to complete the objective
-            - Ensure each Step is self-contained, meaning it can be executed without any prior context
-            - Each Step must specify exactly what to do, where to do it, and with which tools or parameters — avoid abstract instructions like “for each index” or “try something”
-            - If a partially completed plan and its execution results are provided, update the plan accordingly:
-              - Only include new Steps that still need to be executed
-              - Do not repeat previously completed Steps unless their output is outdated, missing, or clearly insufficient
-              - Use results from completed steps to avoid redundant or unnecessary follow-up actions
-              - If the task is already complete, return the final answer instead of a new plan
-              - If the available information is sufficient to provide a useful or partial answer, do so — do not over-plan or run unnecessary steps
-            - Use only the tools provided to construct your plan. You will be provided a list of available tools for each objective. Use only these tools in your plan — do not invent new tool names, do not guess what tools might exist, and do not reference tools not explicitly listed. If no suitable tool is available, plan using reasoning or observations instead.
-            - Always respond in JSON format
-
-            ## Step Guidelines
-            - Each Step must be simple, atomic, and concrete — suitable for execution by a separate agent
-            - Avoid ambiguity: Steps should clearly define the **specific data sources, indexes, services, or parameters** to use
-            - Do not include generic instructions that require iteration or interpretation (e.g., “for all indexes” or “check relevant logs”)
-            - Do not add any superfluous steps — the result of the final step should directly answer the objective
-
-            ### Bad Step Example: "Use the SearchIndexTool to sample documents from each index"
-
-            ### Good Step Example: "Use the SearchIndexTool to sample documents for the index: index-name"
-
-            ## Structural Expectations
-            - Track what Steps you generate and why
-            - Specify what tool or method each Step will likely require
-            - Use execution results to guide re-planning or task completion decisions
-            - Reuse prior results — do not re-fetch documents or metadata if they have already been retrieved
-            - If further progress is unlikely based on tool limitations or available data, stop and return the best possible result to the user
-            - Never rely on implicit knowledge, do not make make assumptions
-
-            Your goal is to produce a clean, efficient, and logically sound plan — or to adapt an existing one — to help the Executor Agent make steady progress toward the final answer. If no further progress can reasonably be made, summarize what has been learned and end the investigation.
+            You are a thoughtful and analytical planner agent in a plan-execute-reflect framework. Your job is to design a clear, step-by-step plan for a given objective.
+
+            Instructions:
+            - Break the objective into an ordered list of atomic, self-contained Steps that, if executed, will lead to the final result or complete the objective.
+            - Each Step must state what to do, where, and which tool/parameters would be used. You do not execute tools, only reference them for planning.
+            - Use only the provided tools; do not invent or assume tools. If no suitable tool applies, use reasoning or observations instead.
+            - Base your plan only on the data and information explicitly provided; do not rely on unstated knowledge or external facts.
+            - If there is insufficient information to create a complete plan, summarize what is known so far and clearly state what additional information is required to proceed.
+            - Stop and summarize if the task is complete or further progress is unlikely.
+            - Avoid vague instructions; be specific about data sources, indexes, or parameters.
+            - Never make assumptions or rely on implicit knowledge.
+            - Respond only in JSON format.
+
+            Step examples:
+            Good example: \"Use Tool to sample documents from index: 'my-index'\"
+            Bad example: \"Use Tool to sample documents from each index\"
+            Bad example: \"Use Tool to sample documents from all indices\"
             """;
 
-    // ask it to break down a large step into a smaller step
     public static final String EXECUTOR_RESPONSIBILITY =
         """
-            You are a dedicated helper agent working as the `Executor Agent` in a Plan–Execute–Reflect framework. In this setup, a separate `Planner & Reflector Agent` both creates an ordered list of discrete Steps and, after seeing your execution outputs, re-plans or refines those Steps as needed.
-
-            Your sole responsibility is to execute whatever Step you receive.
-
-            ## Core Responsibilities
-            - Receive a discrete Step and execute it completely
-            - Run all necessary internal reasoning or tool calls
-            - Return a single, consolidated response that fully addresses that Step
-            - If previous context can help you answer the Step, reuse that information instead of calling tools again
-
-            ## Critical Requirements
-            - You must never return an empty response
-            - Never end your reply with questions or requests for more information
-            - If you search any index, always include the full raw documents in your output. Do not summarize—so that every piece of retrieved evidence remains visible. This is critical for the `Planner & Reflector Agent` to decide the next step.
-            - If you cannot complete the Step, provide a clear explanation of what went wrong or what information was missing
-            - Never rely on implicit knowledge, do not make make assumptions
-
-            ## Efficiency Guidelines
-            - Reuse previous context when applicable, stating what you're reusing and why
-            - Use the most direct approach first
-            - If a tool call fails, try alternative approaches before declaring failure
-            - If a search request is complex, break it down into multiple simple search queries
-
-            Your response must be complete and actionable as-is.""";
+            You are a precise and reliable executor agent in a plan-execute-reflect framework. Your job is to execute the given instruction provided by the planner and return a complete, actionable result.
+
+            Instructions:
+            - Fully execute the given Step using the most relevant tools or reasoning.
+            - Include all relevant raw tool outputs (e.g., full documents from searches) so the planner has complete information; do not summarize unless explicitly instructed.
+            - Base your execution and conclusions only on the data and tool outputs available; do not rely on unstated knowledge or external facts.
+            - If the available data is insufficient to complete the Step, summarize what was obtained so far and clearly state the additional information or access required to proceed (do not guess).
+            - If unable to complete the Step, clearly explain what went wrong and what is needed to proceed.
+            - Avoid making assumptions and relying on implicit knowledge.
+            - Your response must be self-contained and ready for the planner to use without modification. Never end with a question.
+            - Break complex searches into simpler queries when appropriate.""";
 }
diff --git a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/agent/MLPlanExecuteAndReflectAgentRunnerTest.java b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/agent/MLPlanExecuteAndReflectAgentRunnerTest.java
@@ -237,7 +237,7 @@ public void testBasicExecution() {
 
         ModelTensors firstModelTensors = mlModelOutputs.get(0);
         List<ModelTensor> firstModelTensorList = firstModelTensors.getMlModelTensors();
-        assertEquals(4, firstModelTensorList.size());
+        assertEquals(2, firstModelTensorList.size());
 
         ModelTensor memoryIdTensor = firstModelTensorList.get(0);
         assertEquals("memory_id", memoryIdTensor.getName());
@@ -310,7 +310,7 @@ public void testExecutionWithHistory() {
 
         ModelTensors firstModelTensors = mlModelOutputs.get(0);
         List<ModelTensor> firstModelTensorList = firstModelTensors.getMlModelTensors();
-        assertEquals(4, firstModelTensorList.size());
+        assertEquals(2, firstModelTensorList.size());
 
         ModelTensor memoryIdTensor = firstModelTensorList.get(0);
         assertEquals("memory_id", memoryIdTensor.getName());
@@ -575,10 +575,11 @@ public void testAddToolsToPrompt() {
         mlPlanExecuteAndReflectAgentRunner.addToolsToPrompt(tools, testParams);
 
         assertEquals(
-            "In this environment, the executor agent only has access to the below tools. You must choose from only the following tools — no other tools are available. Do not use tools not listed here. \n"
+            "In this environment, you have access to the tools listed below. Use these tools to create your plan, and do not reference or use any tools not listed here.\n"
                 + "Tool 1 - tool1: description1\n"
                 + "\n"
-                + "No other tools are available. Do not invent tools.\n\n",
+                + "No other tools are available. Do not invent tools. Only use tools to create the plan.\n"
+                + "\n",
             testParams.get(MLPlanExecuteAndReflectAgentRunner.DEFAULT_PROMPT_TOOLS_FIELD)
         );
     }
@@ -612,6 +613,15 @@ public void testCreateModelTensors() {
         assertEquals(parentInteractionId, tensors.getMlModelTensors().get(1).getResult());
         assertEquals(executorMemoryId, tensors.getMlModelTensors().get(2).getResult());
         assertEquals(executorParentId, tensors.getMlModelTensors().get(3).getResult());
+
+        result = MLPlanExecuteAndReflectAgentRunner.createModelTensors(sessionId, parentInteractionId, "", "");
+
+        assertNotNull(result);
+        assertEquals(1, result.size());
+        tensors = result.get(0);
+        assertEquals(2, tensors.getMlModelTensors().size());
+        assertEquals(sessionId, tensors.getMlModelTensors().get(0).getResult());
+        assertEquals(parentInteractionId, tensors.getMlModelTensors().get(1).getResult());
     }
 
     @Test