[BUG] Allow user to control react agent max_interations value to prevent empty response (#3756) (#3784)

opensearch-trigger-bot[bot] · pyek-bot · web-flow · commit e0fe59683ab0 · 2025-04-26T20:34:59.000-07:00
* fix: expose max_iteration for react Signed-off-by: Pavan Yekbote <pybot@amazon.com> * fix: defaults for agent execution and differentiate between step and step result Signed-off-by: Pavan Yekbote <pybot@amazon.com> * fix: return react agent id in agent response to expose more details Signed-off-by: Pavan Yekbote <pybot@amazon.com> * spotless Signed-off-by: Pavan Yekbote <pybot@amazon.com> * fix: remove test prompt from react system prompt Signed-off-by: Pavan Yekbote <pybot@amazon.com> * refactor: rename parameters exposed to user to executor Signed-off-by: Pavan Yekbote <pybot@amazon.com> * fix: give user complete control over planner system prompt Signed-off-by: Pavan Yekbote <pybot@amazon.com> --------- Signed-off-by: Pavan Yekbote <pybot@amazon.com> (cherry picked from commit 8339bcf) Co-authored-by: Pavan Yekbote <pybot@amazon.com>
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/agent/MLPlanExecuteAndReflectAgentRunner.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/agent/MLPlanExecuteAndReflectAgentRunner.java
@@ -17,6 +17,7 @@
 import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.getMcpToolSpecs;
 import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.getMlToolSpecs;
 import static org.opensearch.ml.engine.algorithms.agent.MLChatAgentRunner.LLM_INTERFACE;
+import static org.opensearch.ml.engine.algorithms.agent.MLChatAgentRunner.MAX_ITERATION;
 import static org.opensearch.ml.engine.algorithms.agent.MLChatAgentRunner.saveTraceData;
 import static org.opensearch.ml.engine.algorithms.agent.PromptTemplate.DEFAULT_PLANNER_PROMPT;
 import static org.opensearch.ml.engine.algorithms.agent.PromptTemplate.DEFAULT_PLANNER_PROMPT_TEMPLATE;
@@ -90,16 +91,19 @@ public class MLPlanExecuteAndReflectAgentRunner implements MLAgentRunner {
     private String plannerWithHistoryPromptTemplate;
 
     // defaults
-    private static final String DEFAULT_SYSTEM_PROMPT = "Always respond in JSON format.";
-    private static final String DEFAULT_REACT_SYSTEM_PROMPT = "You are a helpful assistant.";
+    private static final String DEFAULT_PLANNER_SYSTEM_PROMPT =
+        "You are part of an OpenSearch cluster. When you deliver your final result, include a comprehensive report. This report MUST:\\n1. List every analysis or step you performed.\\n2. Summarize the inputs, methods, tools, and data used at each step.\\n3. Include key findings from all intermediate steps — do NOT omit them.\\n4. Clearly explain how the steps led to your final conclusion.\\n5. Return the full analysis and conclusion in the 'result' field, even if some of this was mentioned earlier.\\n\\nThe final response should be fully self-contained and detailed, allowing a user to understand the full investigation without needing to reference prior messages. Always respond in JSON format.";
+    private static final String DEFAULT_EXECUTOR_SYSTEM_PROMPT =
+        "You are a dedicated helper agent working as part of a plan‑execute‑reflect framework. Your role is to receive a discrete task, execute all necessary internal reasoning or tool calls, and return a single, final response that fully addresses the task. You must never return an empty response. If you are unable to complete the task or retrieve meaningful information, you must respond with a clear explanation of the issue or what was missing. Under no circumstances should you end your reply with a question or ask for more information. If you search any index, always include the raw documents in the final result instead of summarizing the content. This is critical to give visibility into what the query retrieved.";
     private static final String DEFAULT_NO_ESCAPE_PARAMS = "tool_configs,_tools";
     private static final String DEFAULT_MAX_STEPS_EXECUTED = "20";
     private static final int DEFAULT_MESSAGE_HISTORY_LIMIT = 10;
+    private static final String DEFAULT_REACT_MAX_ITERATIONS = "20";
 
     // fields
     public static final String PROMPT_FIELD = "prompt";
     public static final String USER_PROMPT_FIELD = "user_prompt";
-    public static final String REACT_SYSTEM_PROMPT_FIELD = "react_system_prompt";
+    public static final String EXECUTOR_SYSTEM_PROMPT_FIELD = "executor_system_prompt";
     public static final String STEPS_FIELD = "steps";
     public static final String COMPLETED_STEPS_FIELD = "completed_steps";
     public static final String PLANNER_PROMPT_FIELD = "planner_prompt";
@@ -109,18 +113,21 @@ public class MLPlanExecuteAndReflectAgentRunner implements MLAgentRunner {
     public static final String SYSTEM_PROMPT_FIELD = "system_prompt";
     public static final String QUESTION_FIELD = "question";
     public static final String MEMORY_ID_FIELD = "memory_id";
+    public static final String PARENT_INTERACTION_ID_FIELD = "parent_interaction_id";
     public static final String TENANT_ID_FIELD = "tenant_id";
     public static final String RESULT_FIELD = "result";
     public static final String RESPONSE_FIELD = "response";
     public static final String STEP_RESULT_FIELD = "step_result";
-    public static final String REACT_AGENT_ID_FIELD = "reAct_agent_id";
-    public static final String REACT_AGENT_MEMORY_ID_FIELD = "reAct_agent_memory_id";
+    public static final String EXECUTOR_AGENT_ID_FIELD = "executor_agent_id";
+    public static final String EXECUTOR_AGENT_MEMORY_ID_FIELD = "executor_agent_memory_id";
+    public static final String EXECUTOR_AGENT_PARENT_INTERACTION_ID_FIELD = "executor_agent_parent_interaction_id";
     public static final String NO_ESCAPE_PARAMS_FIELD = "no_escape_params";
     public static final String DEFAULT_PROMPT_TOOLS_FIELD = "tools_prompt";
     public static final String MAX_STEPS_EXECUTED_FIELD = "max_steps";
     public static final String PLANNER_PROMPT_TEMPLATE_FIELD = "planner_prompt_template";
     public static final String REFLECT_PROMPT_TEMPLATE_FIELD = "reflect_prompt_template";
     public static final String PLANNER_WITH_HISTORY_TEMPLATE_FIELD = "planner_with_history_template";
+    public static final String EXECUTOR_MAX_ITERATIONS_FIELD = "executor_max_iterations";
 
     public MLPlanExecuteAndReflectAgentRunner(
         Client client,
@@ -154,9 +161,7 @@ private void setupPromptParameters(Map<String, String> params) {
 
         String userPrompt = params.get(QUESTION_FIELD);
         params.put(USER_PROMPT_FIELD, userPrompt);
-
-        String userSystemPrompt = params.getOrDefault(SYSTEM_PROMPT_FIELD, "");
-        params.put(SYSTEM_PROMPT_FIELD, userSystemPrompt + DEFAULT_SYSTEM_PROMPT);
+        params.put(SYSTEM_PROMPT_FIELD, params.getOrDefault(SYSTEM_PROMPT_FIELD, DEFAULT_PLANNER_SYSTEM_PROMPT));
 
         if (params.get(PLANNER_PROMPT_FIELD) != null) {
             this.plannerPrompt = params.get(PLANNER_PROMPT_FIELD);
@@ -329,6 +334,8 @@ private void executePlanningLoop(
                 parentInteractionId,
                 finalResult,
                 completedSteps.get(completedSteps.size() - 2),
+                allParams.get(EXECUTOR_AGENT_MEMORY_ID_FIELD),
+                allParams.get(EXECUTOR_AGENT_PARENT_INTERACTION_ID_FIELD),
                 finalListener
             );
             return;
@@ -353,22 +360,31 @@ private void executePlanningLoop(
 
             if (parseLLMOutput.get(RESULT_FIELD) != null) {
                 String finalResult = parseLLMOutput.get(RESULT_FIELD);
-                saveAndReturnFinalResult((ConversationIndexMemory) memory, parentInteractionId, finalResult, null, finalListener);
+                saveAndReturnFinalResult(
+                    (ConversationIndexMemory) memory,
+                    parentInteractionId,
+                    allParams.get(EXECUTOR_AGENT_MEMORY_ID_FIELD),
+                    allParams.get(EXECUTOR_AGENT_PARENT_INTERACTION_ID_FIELD),
+                    finalResult,
+                    null,
+                    finalListener
+                );
             } else {
                 // todo: optimize double conversion of steps (string to list to string)
                 List<String> steps = Arrays.stream(parseLLMOutput.get(STEPS_FIELD).split(", ")).toList();
                 addSteps(steps, allParams, STEPS_FIELD);
 
                 String stepToExecute = steps.getFirst();
-                String reActAgentId = allParams.get(REACT_AGENT_ID_FIELD);
+                String reActAgentId = allParams.get(EXECUTOR_AGENT_ID_FIELD);
                 Map<String, String> reactParams = new HashMap<>();
                 reactParams.put(QUESTION_FIELD, stepToExecute);
-                if (allParams.containsKey(REACT_AGENT_MEMORY_ID_FIELD)) {
-                    reactParams.put(MEMORY_ID_FIELD, allParams.get(REACT_AGENT_MEMORY_ID_FIELD));
+                if (allParams.containsKey(EXECUTOR_AGENT_MEMORY_ID_FIELD)) {
+                    reactParams.put(MEMORY_ID_FIELD, allParams.get(EXECUTOR_AGENT_MEMORY_ID_FIELD));
                 }
 
-                reactParams.put(SYSTEM_PROMPT_FIELD, allParams.getOrDefault(REACT_SYSTEM_PROMPT_FIELD, DEFAULT_REACT_SYSTEM_PROMPT));
+                reactParams.put(SYSTEM_PROMPT_FIELD, allParams.getOrDefault(EXECUTOR_SYSTEM_PROMPT_FIELD, DEFAULT_EXECUTOR_SYSTEM_PROMPT));
                 reactParams.put(LLM_RESPONSE_FILTER, allParams.get(LLM_RESPONSE_FILTER));
+                reactParams.put(MAX_ITERATION, allParams.getOrDefault(EXECUTOR_MAX_ITERATIONS_FIELD, DEFAULT_REACT_MAX_ITERATIONS));
 
                 AgentMLInput agentInput = AgentMLInput
                     .AgentMLInputBuilder()
@@ -387,13 +403,18 @@ private void executePlanningLoop(
 
                     // Process tensors in a single stream
                     reactResult.getMlModelOutputs().stream().flatMap(output -> output.getMlModelTensors().stream()).forEach(tensor -> {
-                        if (MEMORY_ID_FIELD.equals(tensor.getName())) {
-                            results.put(MEMORY_ID_FIELD, tensor.getResult());
-                        } else {
-                            Map<String, ?> dataMap = tensor.getDataAsMap();
-                            if (dataMap != null && dataMap.containsKey(RESPONSE_FIELD)) {
-                                results.put(STEP_RESULT_FIELD, (String) dataMap.get(RESPONSE_FIELD));
-                            }
+                        switch (tensor.getName()) {
+                            case MEMORY_ID_FIELD:
+                                results.put(MEMORY_ID_FIELD, tensor.getResult());
+                                break;
+                            case PARENT_INTERACTION_ID_FIELD:
+                                results.put(PARENT_INTERACTION_ID_FIELD, tensor.getResult());
+                                break;
+                            default:
+                                Map<String, ?> dataMap = tensor.getDataAsMap();
+                                if (dataMap != null && dataMap.containsKey(RESPONSE_FIELD)) {
+                                    results.put(STEP_RESULT_FIELD, (String) dataMap.get(RESPONSE_FIELD));
+                                }
                         }
                     });
 
@@ -404,11 +425,16 @@ private void executePlanningLoop(
                     // Only add memory_id to params if it exists and is not empty
                     String reActMemoryId = results.get(MEMORY_ID_FIELD);
                     if (reActMemoryId != null && !reActMemoryId.isEmpty()) {
-                        allParams.put(REACT_AGENT_MEMORY_ID_FIELD, reActMemoryId);
+                        allParams.put(EXECUTOR_AGENT_MEMORY_ID_FIELD, reActMemoryId);
+                    }
+
+                    String reActParentInteractionId = results.get(PARENT_INTERACTION_ID_FIELD);
+                    if (reActParentInteractionId != null && !reActParentInteractionId.isEmpty()) {
+                        allParams.put(EXECUTOR_AGENT_PARENT_INTERACTION_ID_FIELD, reActParentInteractionId);
                     }
 
-                    completedSteps.add(stepToExecute);
-                    completedSteps.add(results.get(STEP_RESULT_FIELD));
+                    completedSteps.add(String.format("\nStep: %s\n", stepToExecute));
+                    completedSteps.add(String.format("\nStep Result: %s\n", results.get(STEP_RESULT_FIELD)));
 
                     saveTraceData(
                         (ConversationIndexMemory) memory,
@@ -524,6 +550,8 @@ private void addSteps(List<String> steps, Map<String, String> allParams, String
     private void saveAndReturnFinalResult(
         ConversationIndexMemory memory,
         String parentInteractionId,
+        String reactAgentMemoryId,
+        String reactParentInteractionId,
         String finalResult,
         String input,
         ActionListener<Object> finalListener
@@ -536,7 +564,12 @@ private void saveAndReturnFinalResult(
         }
 
         memory.getMemoryManager().updateInteraction(parentInteractionId, updateContent, ActionListener.wrap(res -> {
-            List<ModelTensors> finalModelTensors = createModelTensors(memory.getConversationId(), parentInteractionId);
+            List<ModelTensors> finalModelTensors = createModelTensors(
+                memory.getConversationId(),
+                parentInteractionId,
+                reactAgentMemoryId,
+                reactParentInteractionId
+            );
             finalModelTensors
                 .add(
                     ModelTensors
@@ -553,7 +586,12 @@ private void saveAndReturnFinalResult(
         }));
     }
 
-    private static List<ModelTensors> createModelTensors(String sessionId, String parentInteractionId) {
+    private static List<ModelTensors> createModelTensors(
+        String sessionId,
+        String parentInteractionId,
+        String reactAgentMemoryId,
+        String reactParentInteractionId
+    ) {
         List<ModelTensors> modelTensors = new ArrayList<>();
         modelTensors
             .add(
@@ -563,7 +601,13 @@ private static List<ModelTensors> createModelTensors(String sessionId, String pa
                         List
                             .of(
                                 ModelTensor.builder().name(MLAgentExecutor.MEMORY_ID).result(sessionId).build(),
-                                ModelTensor.builder().name(MLAgentExecutor.PARENT_INTERACTION_ID).result(parentInteractionId).build()
+                                ModelTensor.builder().name(MLAgentExecutor.PARENT_INTERACTION_ID).result(parentInteractionId).build(),
+                                ModelTensor.builder().name(EXECUTOR_AGENT_MEMORY_ID_FIELD).result(reactAgentMemoryId).build(),
+                                ModelTensor
+                                    .builder()
+                                    .name(EXECUTOR_AGENT_PARENT_INTERACTION_ID_FIELD)
+                                    .result(reactParentInteractionId)
+                                    .build()
                             )
                     )
                     .build()
diff --git a/plugin/src/main/java/org/opensearch/ml/action/agents/TransportRegisterAgentAction.java b/plugin/src/main/java/org/opensearch/ml/action/agents/TransportRegisterAgentAction.java
@@ -98,12 +98,12 @@ private void registerAgent(MLAgent agent, ActionListener<MLRegisterAgentResponse
             return;
         }
 
-        // If the agent is a PLAN_EXECUTE_AND_REFLECT agent and does not have a reAct agent id, create a reAct agent
+        // If the agent is a PLAN_EXECUTE_AND_REFLECT agent and does not have an executor agent id, create an executor (reAct) agent
         if (MLAgentType.from(mlAgent.getType()) == MLAgentType.PLAN_EXECUTE_AND_REFLECT
-            && !mlAgent.getParameters().containsKey(MLPlanExecuteAndReflectAgentRunner.REACT_AGENT_ID_FIELD)) {
+            && !mlAgent.getParameters().containsKey(MLPlanExecuteAndReflectAgentRunner.EXECUTOR_AGENT_ID_FIELD)) {
             createConversationAgent(mlAgent, tenantId, ActionListener.wrap(conversationAgentId -> {
                 Map<String, String> parameters = new HashMap<>(mlAgent.getParameters());
-                parameters.put(MLPlanExecuteAndReflectAgentRunner.REACT_AGENT_ID_FIELD, conversationAgentId);
+                parameters.put(MLPlanExecuteAndReflectAgentRunner.EXECUTOR_AGENT_ID_FIELD, conversationAgentId);
                 MLAgent updatedAgent = mlAgent.toBuilder().parameters(parameters).build();
                 registerAgentToIndex(updatedAgent, tenantId, listener);
             }, listener::onFailure));