opensearch-project
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/agent/AgentUtils.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/agent/AgentUtils.java
Lines changed: 26 additions & 11 deletions
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/agent/MLChatAgentRunner.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/agent/MLChatAgentRunner.java
Lines changed: 41 additions & 134 deletions
@@ -75,6 +75,7 @@
 import org.opensearch.ml.engine.MLEngineClassLoader;
 import org.opensearch.ml.engine.algorithms.remote.McpConnectorExecutor;
 import org.opensearch.ml.engine.encryptor.Encryptor;
+import org.opensearch.ml.engine.function_calling.FunctionCalling;
 import org.opensearch.ml.engine.tools.McpSseTool;
 import org.opensearch.remote.metadata.client.GetDataObjectRequest;
 import org.opensearch.remote.metadata.client.SdkClient;
@@ -129,6 +130,9 @@ public class AgentUtils {
     public static final String LLM_FINISH_REASON_TOOL_USE = "llm_finish_reason_tool_use";
     public static final String TOOL_FILTERS_FIELD = "tool_filters";
 
+    // Default comma-separated list of parameter names that the connector should leave unescaped when function calling is used
+    public static final String DEFAULT_NO_ESCAPE_PARAMS = "_chat_history,_tools,_interactions,tool_configs";
+
     public static String addExamplesToPrompt(Map<String, String> parameters, String prompt) {
         Map<String, String> examplesMap = new HashMap<>();
         if (parameters.containsKey(EXAMPLES)) {
@@ -299,7 +303,8 @@ public static Map<String, String> parseLLMOutput(
         ModelTensorOutput tmpModelTensorOutput,
         List<String> llmResponsePatterns,
         Set<String> inputTools,
-        List<String> interactions
+        List<String> interactions,
+        FunctionCalling functionCalling
     ) {
         Map<String, String> modelOutput = new HashMap<>();
         Map<String, ?> dataAsMap = tmpModelTensorOutput.getMlModelOutputs().get(0).getMlModelTensors().get(0).getDataAsMap();
@@ -339,20 +344,33 @@ public static Map<String, String> parseLLMOutput(
                 llmFinishReason = JsonPath.read(dataAsMap, llmFinishReasonPath);
             }
             if (parameters.get(LLM_FINISH_REASON_TOOL_USE).equalsIgnoreCase(llmFinishReason) || isToolUseResponse) {
-                List toolCalls = null;
+                List<Map<String, String>> toolCalls = null;
                 try {
-                    String toolCallsPath = parameters.get(TOOL_CALLS_PATH);
-                    if (toolCallsPath.startsWith("_llm_response.")) {
-                        Map<String, Object> llmResponse = StringUtils.fromJson(response.toString(), RESPONSE_FIELD);
-                        toolCalls = JsonPath.read(llmResponse, toolCallsPath.substring("_llm_response.".length()));
+                    String toolName = "";
+                    String toolInput = "";
+                    String toolCallId = "";
+                    if (functionCalling != null) {
+                        toolCalls = functionCalling.handle(tmpModelTensorOutput, parameters);
+                        // TODO: support multiple tool calls here
+                        toolName = toolCalls.getFirst().get("tool_name");
+                        toolInput = toolCalls.getFirst().get("tool_input");
+                        toolCallId = toolCalls.getFirst().get("tool_call_id");
                     } else {
-                        toolCalls = JsonPath.read(dataAsMap, toolCallsPath);
+                        String toolCallsPath = parameters.get(TOOL_CALLS_PATH);
+                        if (toolCallsPath.startsWith("_llm_response.")) {
+                            Map<String, Object> llmResponse = StringUtils.fromJson(response.toString(), RESPONSE_FIELD);
+                            toolCalls = JsonPath.read(llmResponse, toolCallsPath.substring("_llm_response.".length()));
+                        } else {
+                            toolCalls = JsonPath.read(dataAsMap, toolCallsPath);
+                        }
+                        toolName = JsonPath.read(toolCalls.get(0), parameters.get(TOOL_CALLS_TOOL_NAME));
+                        toolInput = StringUtils.toJson(JsonPath.read(toolCalls.get(0), parameters.get(TOOL_CALLS_TOOL_INPUT)));
+                        toolCallId = JsonPath.read(toolCalls.get(0), parameters.get(TOOL_CALL_ID_PATH));
                     }
                     String toolCallsMsgPath = parameters.get(INTERACTION_TEMPLATE_ASSISTANT_TOOL_CALLS_PATH);
                     String toolCallsMsgExcludePath = parameters.get(INTERACTION_TEMPLATE_ASSISTANT_TOOL_CALLS_EXCLUDE_PATH);
                     if (toolCallsMsgPath != null) {
                         if (toolCallsMsgExcludePath != null) {
-
                             Map<String, ?> newDataAsMap = removeJsonPath(dataAsMap, toolCallsMsgExcludePath, false);
                             Object toolCallsMsg = JsonPath.read(newDataAsMap, toolCallsMsgPath);
                             interactions.add(StringUtils.toJson(toolCallsMsg));
@@ -371,9 +389,6 @@ public static Map<String, String> parseLLMOutput(
                                 )
                             );
                     }
-                    String toolName = JsonPath.read(toolCalls.get(0), parameters.get(TOOL_CALLS_TOOL_NAME));
-                    String toolInput = StringUtils.toJson(JsonPath.read(toolCalls.get(0), parameters.get(TOOL_CALLS_TOOL_INPUT)));
-                    String toolCallId = JsonPath.read(toolCalls.get(0), parameters.get(TOOL_CALL_ID_PATH));
                     modelOutput.put(THOUGHT, "");
                     modelOutput.put(ACTION, toolName);
                     modelOutput.put(ACTION_INPUT, toolInput);
 
@@ -11,21 +11,13 @@
 import static org.opensearch.ml.common.utils.StringUtils.processTextDoc;
 import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.DISABLE_TRACE;
 import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.INTERACTIONS_PREFIX;
-import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.LLM_FINISH_REASON_PATH;
-import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.LLM_FINISH_REASON_TOOL_USE;
-import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.LLM_RESPONSE_FILTER;
-import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.NO_ESCAPE_PARAMS;
 import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.PROMPT_CHAT_HISTORY_PREFIX;
 import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.PROMPT_PREFIX;
 import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.PROMPT_SUFFIX;
 import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.RESPONSE_FORMAT_INSTRUCTION;
-import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.TOOL_CALLS_PATH;
-import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.TOOL_CALLS_TOOL_INPUT;
-import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.TOOL_CALLS_TOOL_NAME;
 import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.TOOL_CALL_ID;
-import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.TOOL_CALL_ID_PATH;
 import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.TOOL_RESPONSE;
-import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.TOOL_TEMPLATE;
+import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.TOOL_RESULT;
 import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.VERBOSE;
 import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.cleanUpResource;
 import static org.opensearch.ml.engine.algorithms.agent.AgentUtils.constructToolParams;
@@ -79,6 +71,9 @@
 import org.opensearch.ml.common.transport.prediction.MLPredictionTaskRequest;
 import org.opensearch.ml.common.utils.StringUtils;
 import org.opensearch.ml.engine.encryptor.Encryptor;
+import org.opensearch.ml.engine.function_calling.FunctionCalling;
+import org.opensearch.ml.engine.function_calling.FunctionCallingFactory;
+import org.opensearch.ml.engine.function_calling.LLMMessage;
 import org.opensearch.ml.engine.memory.ConversationIndexMemory;
 import org.opensearch.ml.engine.memory.ConversationIndexMessage;
 import org.opensearch.ml.engine.tools.MLModelTool;
@@ -117,7 +112,6 @@ public class MLChatAgentRunner implements MLAgentRunner {
     public static final String FINAL_ANSWER = "final_answer";
     public static final String THOUGHT_RESPONSE = "thought_response";
     public static final String INTERACTIONS = "_interactions";
-    public static final String DEFAULT_NO_ESCAPE_PARAMS = "_chat_history,_tools,_interactions,tool_configs";
     public static final String INTERACTION_TEMPLATE_TOOL_RESPONSE = "interaction_template.tool_response";
     public static final String CHAT_HISTORY_QUESTION_TEMPLATE = "chat_history_template.user_question";
     public static final String CHAT_HISTORY_RESPONSE_TEMPLATE = "chat_history_template.ai_response";
@@ -170,116 +164,11 @@ public void run(MLAgent mlAgent, Map<String, String> inputParams, ActionListener
         params.putAll(inputParams);
 
         String llmInterface = params.get(LLM_INTERFACE);
-        // todo: introduce function calling
-        // handle parameters based on llmInterface
-        if ("openai/v1/chat/completions".equalsIgnoreCase(llmInterface)) {
-            if (!params.containsKey(NO_ESCAPE_PARAMS)) {
-                params.put(NO_ESCAPE_PARAMS, DEFAULT_NO_ESCAPE_PARAMS);
-            }
-            params.put(LLM_RESPONSE_FILTER, "$.choices[0].message.content");
-
-            params
-                .put(
-                    TOOL_TEMPLATE,
-                    "{\"type\": \"function\", \"function\": { \"name\": \"${tool.name}\", \"description\": \"${tool.description}\", \"parameters\": ${tool.attributes.input_schema}, \"strict\": ${tool.attributes.strict:-false} } }"
-                );
-            params.put(TOOL_CALLS_PATH, "$.choices[0].message.tool_calls");
-            params.put(TOOL_CALLS_TOOL_NAME, "function.name");
-            params.put(TOOL_CALLS_TOOL_INPUT, "function.arguments");
-            params.put(TOOL_CALL_ID_PATH, "id");
-            params.put("tool_configs", ", \"tools\": [${parameters._tools:-}], \"parallel_tool_calls\": false");
-
-            params.put("tool_choice", "auto");
-            params.put("parallel_tool_calls", "false");
-
-            params.put("interaction_template.assistant_tool_calls_path", "$.choices[0].message");
-            params
-                .put(
-                    "interaction_template.tool_response",
-                    "{ \"role\": \"tool\", \"tool_call_id\": \"${_interactions.tool_call_id}\", \"content\": \"${_interactions.tool_response}\" }"
-                );
-
-            params.put("chat_history_template.user_question", "{\"role\": \"user\",\"content\": \"${_chat_history.message.question}\"}");
-            params.put("chat_history_template.ai_response", "{\"role\": \"assistant\",\"content\": \"${_chat_history.message.response}\"}");
-
-            params.put(LLM_FINISH_REASON_PATH, "$.choices[0].finish_reason");
-            params.put(LLM_FINISH_REASON_TOOL_USE, "tool_calls");
-        } else if ("bedrock/converse/claude".equalsIgnoreCase(llmInterface)) {
-            if (!params.containsKey(NO_ESCAPE_PARAMS)) {
-                params.put(NO_ESCAPE_PARAMS, DEFAULT_NO_ESCAPE_PARAMS);
-            }
-            params.put(LLM_RESPONSE_FILTER, "$.output.message.content[0].text");
-
-            params
-                .put(
-                    TOOL_TEMPLATE,
-                    "{\"toolSpec\":{\"name\":\"${tool.name}\",\"description\":\"${tool.description}\",\"inputSchema\": {\"json\": ${tool.attributes.input_schema} } }}"
-                );
-            params.put(TOOL_CALLS_PATH, "$.output.message.content[*].toolUse");
-            params.put(TOOL_CALLS_TOOL_NAME, "name");
-            params.put(TOOL_CALLS_TOOL_INPUT, "input");
-            params.put(TOOL_CALL_ID_PATH, "toolUseId");
-            params.put("tool_configs", ", \"toolConfig\": {\"tools\": [${parameters._tools:-}]}");
-
-            params.put("interaction_template.assistant_tool_calls_path", "$.output.message");
-            params
-                .put(
-                    "interaction_template.tool_response",
-                    "{\"role\":\"user\",\"content\":[{\"toolResult\":{\"toolUseId\":\"${_interactions.tool_call_id}\",\"content\":[{\"text\":\"${_interactions.tool_response}\"}]}}]}"
-                );
-
-            params
-                .put(
-                    "chat_history_template.user_question",
-                    "{\"role\":\"user\",\"content\":[{\"text\":\"${_chat_history.message.question}\"}]}"
-                );
-            params
-                .put(
-                    "chat_history_template.ai_response",
-                    "{\"role\":\"assistant\",\"content\":[{\"text\":\"${_chat_history.message.response}\"}]}"
-                );
-
-            params.put(LLM_FINISH_REASON_PATH, "$.stopReason");
-            params.put(LLM_FINISH_REASON_TOOL_USE, "tool_use");
-        } else if ("bedrock/converse/deepseek_r1".equalsIgnoreCase(llmInterface)) {
-            if (!params.containsKey(NO_ESCAPE_PARAMS)) {
-                params.put(NO_ESCAPE_PARAMS, "_chat_history,_interactions");
-            }
-            params.put(LLM_RESPONSE_FILTER, "$.output.message.content[0].text");
-            params.put("llm_final_response_post_filter", "$.message.content[0].text");
-
-            params
-                .put(
-                    TOOL_TEMPLATE,
-                    "{\"toolSpec\":{\"name\":\"${tool.name}\",\"description\":\"${tool.description}\",\"inputSchema\": {\"json\": ${tool.attributes.input_schema} } }}"
-                );
-            params.put(TOOL_CALLS_PATH, "_llm_response.tool_calls");
-            params.put(TOOL_CALLS_TOOL_NAME, "tool_name");
-            params.put(TOOL_CALLS_TOOL_INPUT, "input");
-            params.put(TOOL_CALL_ID_PATH, "id");
-
-            params.put("interaction_template.assistant_tool_calls_path", "$.output.message");
-            params.put("interaction_template.assistant_tool_calls_exclude_path", "[ \"$.output.message.content[?(@.reasoningContent)]\" ]");
-            params
-                .put(
-                    "interaction_template.tool_response",
-                    "{\"role\":\"user\",\"content\":[ {\"text\":\"{\\\"tool_call_id\\\":\\\"${_interactions.tool_call_id}\\\",\\\"tool_result\\\": \\\"${_interactions.tool_response}\\\"\"} ]}"
-                );
-
-            params
-                .put(
-                    "chat_history_template.user_question",
-                    "{\"role\":\"user\",\"content\":[{\"text\":\"${_chat_history.message.question}\"}]}"
-                );
-            params
-                .put(
-                    "chat_history_template.ai_response",
-                    "{\"role\":\"assistant\",\"content\":[{\"text\":\"${_chat_history.message.response}\"}]}"
-                );
-
-            params.put(LLM_FINISH_REASON_PATH, "_llm_response.stop_reason");
-            params.put(LLM_FINISH_REASON_TOOL_USE, "tool_use");
+        FunctionCalling functionCalling = FunctionCallingFactory.create(llmInterface);
+        if (functionCalling != null) {
+            functionCalling.configure(params);
         }
+
         String memoryType = mlAgent.getMemory().getType();
         String memoryId = params.get(MLAgentExecutor.MEMORY_ID);
         String appType = mlAgent.getAppType();
@@ -347,23 +236,30 @@ public void run(MLAgent mlAgent, Map<String, String> inputParams, ActionListener
                     }
                 }
 
-                runAgent(mlAgent, params, listener, memory, memory.getConversationId());
+                runAgent(mlAgent, params, listener, memory, memory.getConversationId(), functionCalling);
             }, e -> {
                 log.error("Failed to get chat history", e);
                 listener.onFailure(e);
             }), messageHistoryLimit);
         }, listener::onFailure));
     }
 
-    private void runAgent(MLAgent mlAgent, Map<String, String> params, ActionListener<Object> listener, Memory memory, String sessionId) {
+    private void runAgent(
+        MLAgent mlAgent,
+        Map<String, String> params,
+        ActionListener<Object> listener,
+        Memory memory,
+        String sessionId,
+        FunctionCalling functionCalling
+    ) {
         List<MLToolSpec> toolSpecs = getMlToolSpecs(mlAgent, params);
 
         // Create a common method to handle both success and failure cases
         Consumer<List<MLToolSpec>> processTools = (allToolSpecs) -> {
             Map<String, Tool> tools = new HashMap<>();
             Map<String, MLToolSpec> toolSpecMap = new HashMap<>();
             createTools(toolFactories, params, allToolSpecs, tools, toolSpecMap, mlAgent);
-            runReAct(mlAgent.getLlm(), tools, toolSpecMap, params, memory, sessionId, mlAgent.getTenantId(), listener);
+            runReAct(mlAgent.getLlm(), tools, toolSpecMap, params, memory, sessionId, mlAgent.getTenantId(), listener, functionCalling);
         };
 
         // Fetch MCP tools and handle both success and failure cases
@@ -384,7 +280,8 @@ private void runReAct(
         Memory memory,
         String sessionId,
         String tenantId,
-        ActionListener<Object> listener
+        ActionListener<Object> listener,
+        FunctionCalling functionCalling
     ) {
         Map<String, String> tmpParameters = constructLLMParams(llm, parameters);
         String prompt = constructLLMPrompt(tools, tmpParameters);
@@ -437,7 +334,8 @@ private void runReAct(
                         tmpModelTensorOutput,
                         llmResponsePatterns,
                         tools.keySet(),
-                        interactions
+                        interactions,
+                        functionCalling
                     );
 
                     String thought = String.valueOf(modelOutput.get(THOUGHT));
@@ -510,7 +408,8 @@ private void runReAct(
                             actionInput,
                             toolParams,
                             interactions,
-                            toolCallId
+                            toolCallId,
+                            functionCalling
                         );
                     } else {
                         String res = String.format(Locale.ROOT, "Failed to run the tool %s which is unsupported.", action);
@@ -675,20 +574,28 @@ private static void runTool(
         String actionInput,
         Map<String, String> toolParams,
         List<String> interactions,
-        String toolCallId
+        String toolCallId,
+        FunctionCalling functionCalling
     ) {
         if (tools.get(action).validate(toolParams)) {
             try {
                 String finalAction = action;
                 ActionListener<Object> toolListener = ActionListener.wrap(r -> {
-                    interactions
-                        .add(
-                            substitute(
-                                tmpParameters.get(INTERACTION_TEMPLATE_TOOL_RESPONSE),
-                                Map.of(TOOL_CALL_ID, toolCallId, "tool_response", processTextDoc(StringUtils.toJson(r))),
-                                INTERACTIONS_PREFIX
-                            )
-                        );
+                    if (functionCalling != null) {
+                        List<Map<String, Object>> toolResults = List.of(Map.of(TOOL_CALL_ID, toolCallId, TOOL_RESULT, Map.of("text", r)));
+                        List<LLMMessage> llmMessages = functionCalling.supply(toolResults);
+                        // TODO: support multiple tool calls at the same time so that multiple LLMMessages can be generated here
+                        interactions.add(llmMessages.getFirst().getResponse());
+                    } else {
+                        interactions
+                            .add(
+                                substitute(
+                                    tmpParameters.get(INTERACTION_TEMPLATE_TOOL_RESPONSE),
+                                    Map.of(TOOL_CALL_ID, toolCallId, "tool_response", processTextDoc(StringUtils.toJson(r))),
+                                    INTERACTIONS_PREFIX
+                                )
+                            );
+                    }
                     nextStepListener.onResponse(r);
                 }, e -> {
                     interactions