wip

pyek-bot · pyek-bot · commit f5b7674b54be · 2025-04-24T17:38:48.000-07:00
diff --git a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/agent/AgentUtilsTest.java b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/agent/AgentUtilsTest.java
@@ -8,9 +8,17 @@
 import static org.junit.Assert.assertEquals;
 import static org.junit.Assert.assertThrows;
 import static org.mockito.Mockito.when;
+import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.LLM_FINISH_REASON_PATH;
+import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.LLM_FINISH_REASON_TOOL_USE;
 import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.LLM_GEN_INPUT;
+import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.LLM_RESPONSE_FILTER;
 import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.PROMPT_PREFIX;
 import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.PROMPT_SUFFIX;
+import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.TOOL_CALLS_PATH;
+import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.TOOL_CALLS_TOOL_INPUT;
+import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.TOOL_CALLS_TOOL_NAME;
+import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.TOOL_CALL_ID;
+import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.TOOL_CALL_ID_PATH;
 import static org.opensearch.ml.engine.algorithms.agent.MLChatAgentRunner.ACTION;
 import static org.opensearch.ml.engine.algorithms.agent.MLChatAgentRunner.ACTION_INPUT;
 import static org.opensearch.ml.engine.algorithms.agent.MLChatAgentRunner.CHAT_HISTORY;
@@ -21,6 +29,7 @@
 import static org.opensearch.ml.engine.algorithms.agent.MLChatAgentRunner.THOUGHT;
 import static org.opensearch.ml.engine.algorithms.agent.MLChatAgentRunner.THOUGHT_RESPONSE;
 
+import java.util.ArrayList;
 import java.util.Arrays;
 import java.util.Collections;
 import java.util.HashMap;
@@ -695,6 +704,112 @@ public void testConstructToolParams_PlaceholderConfigInputJson() {
         Assert.assertEquals(actionInput, toolParams.get(LLM_GEN_INPUT));
     }
 
+    @Test
+    public void testParseLLMOutputWithToolCallsAndResponse() {
+        // Exercises AgentUtils.parseLLMOutput on three sample responses. Case 1: content holds both a text entry and a toolUse entry; stopReason is "tool_use"
+        String response1 = "{\"metrics\":{\"latencyMs\":4589},\"output\":{\"message\":{\"content\":[{\"text\":\"Let me try another approach to find recommendation-related spans:\"},{\"toolUse\":{\"input\":{\"index\":\"otel-v1-apm-span-000001\",\"query\":{\"size\":10,\"query\":{\"bool\":{\"should\":[{\"wildcard\":{\"name\":\"*recommend*\"}},{\"exists\":{\"field\":\"span.attributes.app@products_recommended@count\"}}],\"minimum_should_match\":1}}}},\"name\":\"SearchIndexTool\",\"toolUseId\":\"tooluse_df9l5U5pTmeS_NFK4VI_zw\"}}],\"role\":\"assistant\"}},\"stopReason\":\"tool_use\",\"usage\":{\"cacheReadInputTokenCount\":0,\"cacheReadInputTokens\":0,\"cacheWriteInputTokenCount\":0,\"cacheWriteInputTokens\":0,\"inputTokens\":12902,\"outputTokens\":155,\"totalTokens\":13057}}";
+        
+        // Case 2: content holds only a toolUse entry (IndexMappingTool, no text entry); stopReason is "tool_use"
+        String response2 = "{\"metrics\":{\"latencyMs\":2131},\"output\":{\"message\":{\"content\":[{\"toolUse\":{\"input\":{\"index\":[\"ss4o_logs-2025.04.16\"]},\"name\":\"IndexMappingTool\",\"toolUseId\":\"tooluse_Q9Hkj3YrT3qfcwAIY3Y2WA\"}}],\"role\":\"assistant\"}},\"stopReason\":\"tool_use\",\"usage\":{\"cacheReadInputTokenCount\":0,\"cacheReadInputTokens\":0,\"cacheWriteInputTokenCount\":0,\"cacheWriteInputTokens\":0,\"inputTokens\":3411,\"outputTokens\":70,\"totalTokens\":3481}}";
+        
+        // Case 3: content holds only a text entry; there is no toolUse entry and no stopReason field in this payload
+        String response3 = "{\"metrics\":{\"latencyMs\":4589},\"output\":{\"message\":{\"content\":[{\"text\":\"Let me try another approach to find recommendation-related spans:\"}],\"role\":\"assistant\"}},\"usage\":{\"cacheReadInputTokenCount\":0,\"cacheReadInputTokens\":0,\"cacheWriteInputTokenCount\":0,\"cacheWriteInputTokens\":0,\"inputTokens\":12902,\"outputTokens\":155,\"totalTokens\":13057}}";
+
+        // Parameters shared by all three cases. NOTE(review): LLM_RESPONSE_FILTER and TOOL_CALLS_PATH point at $.choices[0].message..., but the sample responses above have no "choices" key (they use output.message.content) - confirm these paths are intended
+        Map<String, String> parameters = new HashMap<>();
+        parameters.put(LLM_RESPONSE_FILTER, "$.choices[0].message.content");
+        parameters.put(TOOL_CALLS_PATH, "$.choices[0].message.tool_calls");
+        parameters.put(LLM_FINISH_REASON_PATH, "$.stopReason");
+        parameters.put(LLM_FINISH_REASON_TOOL_USE, "tool_use");
+        parameters.put(TOOL_CALLS_TOOL_NAME, "name");
+        parameters.put(TOOL_CALLS_TOOL_INPUT, "input");
+        parameters.put(TOOL_CALL_ID_PATH, "toolUseId");
+
+        // Case 1: wrap response1 as the single "response" entry of one tensor; expects empty THOUGHT, ACTION = SearchIndexTool, ACTION_INPUT containing the index name, and TOOL_CALL_ID = the toolUseId
+        ModelTensorOutput modelTensorOutput1 = ModelTensorOutput
+            .builder()
+            .mlModelOutputs(
+                List.of(
+                    ModelTensors
+                        .builder()
+                        .mlModelTensors(
+                            List.of(ModelTensor.builder().name("response").dataAsMap(Map.of("response", response1)).build())
+                        )
+                        .build()
+                )
+            )
+            .build();
+
+        Map<String, String> output1 = AgentUtils.parseLLMOutput(
+            parameters,
+            modelTensorOutput1,
+            null,
+            Set.of("SearchIndexTool"),
+            new ArrayList<>()
+        );
+
+        Assert.assertEquals("", output1.get(THOUGHT));
+        Assert.assertEquals("SearchIndexTool", output1.get(ACTION));
+        Assert.assertTrue(output1.get(ACTION_INPUT).contains("otel-v1-apm-span-000001"));
+        Assert.assertEquals("tooluse_df9l5U5pTmeS_NFK4VI_zw", output1.get(TOOL_CALL_ID));
+
+        // Case 2: same wrapping for response2; expects empty THOUGHT, ACTION = IndexMappingTool, ACTION_INPUT containing the index name, and TOOL_CALL_ID = the toolUseId
+        ModelTensorOutput modelTensorOutput2 = ModelTensorOutput
+            .builder()
+            .mlModelOutputs(
+                List.of(
+                    ModelTensors
+                        .builder()
+                        .mlModelTensors(
+                            List.of(ModelTensor.builder().name("response").dataAsMap(Map.of("response", response2)).build())
+                        )
+                        .build()
+                )
+            )
+            .build();
+
+        Map<String, String> output2 = AgentUtils.parseLLMOutput(
+            parameters,
+            modelTensorOutput2,
+            null,
+            Set.of("IndexMappingTool"),
+            new ArrayList<>()
+        );
+
+        Assert.assertEquals("", output2.get(THOUGHT));
+        Assert.assertEquals("IndexMappingTool", output2.get(ACTION));
+        Assert.assertTrue(output2.get(ACTION_INPUT).contains("ss4o_logs-2025.04.16"));
+        Assert.assertEquals("tooluse_Q9Hkj3YrT3qfcwAIY3Y2WA", output2.get(TOOL_CALL_ID));
+
+        // Case 3: same wrapping for response3 with an empty tool set; expects no ACTION / ACTION_INPUT / TOOL_CALL_ID and the text surfaced under FINAL_ANSWER
+        ModelTensorOutput modelTensorOutput3 = ModelTensorOutput
+            .builder()
+            .mlModelOutputs(
+                List.of(
+                    ModelTensors
+                        .builder()
+                        .mlModelTensors(
+                            List.of(ModelTensor.builder().name("response").dataAsMap(Map.of("response", response3)).build())
+                        )
+                        .build()
+                )
+            )
+            .build();
+
+        Map<String, String> output3 = AgentUtils.parseLLMOutput(
+            parameters,
+            modelTensorOutput3,
+            null,
+            Set.of(),
+            new ArrayList<>()
+        );
+
+        Assert.assertNull(output3.get(ACTION));
+        Assert.assertNull(output3.get(ACTION_INPUT));
+        Assert.assertNull(output3.get(TOOL_CALL_ID));
+        Assert.assertTrue(output3.get(FINAL_ANSWER).contains("Let me try another approach to find recommendation-related spans:"));
+    }
+
     private void verifyConstructToolParams(String question, String actionInput, Consumer<Map<String, String>> verify) {
         Map<String, Tool> tools = Map.of("tool1", tool1);
         Map<String, MLToolSpec> toolSpecMap = Map