ml-explore
diff --git a/Applications/LLMEval/ContentView.swift b/Applications/LLMEval/ContentView.swift
Lines changed: 102 additions & 26 deletions
diff --git a/Applications/MLXChatExample/ViewModels/ChatViewModel.swift b/Applications/MLXChatExample/ViewModels/ChatViewModel.swift
Lines changed: 2 additions & 0 deletions
diff --git a/Libraries/MLXLMCommon/Chat.swift b/Libraries/MLXLMCommon/Chat.swift
Lines changed: 5 additions & 0 deletions
diff --git a/Libraries/MLXLMCommon/Evaluate.swift b/Libraries/MLXLMCommon/Evaluate.swift
Lines changed: 26 additions & 1 deletion
diff --git a/Libraries/MLXLMCommon/Extensions/Encodable+toolResult.swift b/Libraries/MLXLMCommon/Extensions/Encodable+toolResult.swift
Lines changed: 14 additions & 0 deletions
diff --git a/Libraries/MLXLMCommon/Streamlined.swift b/Libraries/MLXLMCommon/Streamlined.swift
Lines changed: 2 additions & 3 deletions
diff --git a/Libraries/MLXLMCommon/Tool/Tool.swift b/Libraries/MLXLMCommon/Tool/Tool.swift
Lines changed: 62 additions & 0 deletions
diff --git a/Libraries/MLXLMCommon/Tool/ToolCall.swift b/Libraries/MLXLMCommon/Tool/ToolCall.swift
Lines changed: 53 additions & 0 deletions
@@ -34,7 +34,7 @@ struct ContentView: View {
                 }
                 HStack {
                     Toggle(isOn: $llm.includeWeatherTool) {
-                        Text("Include \"get current weather\" tool")
+                        Text("Include tools")
                     }
                     .frame(maxWidth: 350, alignment: .leading)
                     Toggle(isOn: $llm.enableThinking) {
@@ -188,28 +188,50 @@ class LLMEvaluator {
 
     var loadState = LoadState.idle
 
-    let currentWeatherToolSpec: [String: any Sendable] =
-        [
-            "type": "function",
-            "function": [
-                "name": "get_current_weather",
-                "description": "Get the current weather in a given location",
-                "parameters": [
-                    "type": "object",
-                    "properties": [
-                        "location": [
-                            "type": "string",
-                            "description": "The city and state, e.g. San Francisco, CA",
-                        ] as [String: String],
-                        "unit": [
-                            "type": "string",
-                            "enum": ["celsius", "fahrenheit"],
-                        ] as [String: any Sendable],
-                    ] as [String: [String: any Sendable]],
-                    "required": ["location"],
-                ] as [String: any Sendable],
-            ] as [String: any Sendable],
-        ] as [String: any Sendable]
+    /// Demo tool that reports made-up weather for a location.
+    ///
+    /// The handler does not look at `location`; it returns a random temperature and a
+    /// random condition, so the result is only useful for exercising tool calls.
+    let currentWeatherTool = Tool<WeatherInput, WeatherOutput>(
+        name: "get_current_weather",
+        description: "Get the current weather in a given location",
+        parameters: [
+            .required(
+                "location", type: .string, description: "The city and state, e.g. San Francisco, CA"
+            ),
+            .optional(
+                "unit",
+                type: .string,
+                description: "The unit of temperature",
+                extraProperties: [
+                    "enum": ["celsius", "fahrenheit"],
+                    "default": "celsius",
+                ]
+            ),
+        ]
+    ) { input in
+        // `unit` is optional. Fall back to the default advertised in the schema above so an
+        // omitted unit is treated as celsius instead of silently using the fahrenheit range.
+        let unit = input.unit ?? "celsius"
+        let range = unit == "celsius" ? (min: -20.0, max: 40.0) : (min: 0, max: 100)
+        let temperature = Double.random(in: range.min ... range.max)
+
+        // The literal array is non-empty, so `randomElement()` cannot return nil here.
+        let conditions = ["Sunny", "Cloudy", "Rainy", "Snowy", "Windy", "Stormy"].randomElement()!
+
+        return WeatherOutput(temperature: temperature, conditions: conditions)
+    }
+
+    /// Demo tool that returns the sum of its two integer arguments.
+    let addTool = Tool<AddInput, AddOutput>(
+        name: "add_two_numbers",
+        description: "Add two numbers together",
+        parameters: [
+            .required("first", type: .int, description: "The first number to add"),
+            .required("second", type: .int, description: "The second number to add"),
+        ]
+    ) { operands in
+        let sum = operands.first + operands.second
+        return AddOutput(result: sum)
+    }
+
+    /// Demo tool that takes no arguments and returns the current date and time as text.
+    let timeTool = Tool<EmptyInput, TimeOutput>(
+        name: "get_time",
+        description: "Get the current time",
+        // No trailing comma after the last argument: that syntax is only accepted by
+        // Swift 6.1 and later.
+        parameters: []
+    ) { _ in
+        TimeOutput(time: Date.now.formatted())
+    }
 
     /// load and return the model -- can be called multiple times, subsequent calls will
     /// just return the loaded model
@@ -243,15 +265,24 @@ class LLMEvaluator {
         }
     }
 
-    private func generate(prompt: String) async {
+    private func generate(prompt: String, toolResult: String? = nil) async {
 
         self.output = ""
-        let chat: [Chat.Message] = [
+        var chat: [Chat.Message] = [
             .system("You are a helpful assistant"),
             .user(prompt),
         ]
+
+        if let toolResult {
+            chat.append(.tool(toolResult))
+        }
+
         let userInput = UserInput(
-            chat: chat, additionalContext: ["enable_thinking": enableThinking])
+            chat: chat,
+            tools: includeWeatherTool
+                ? [currentWeatherTool.schema, addTool.schema, timeTool.schema] : nil,
+            additionalContext: ["enable_thinking": enableThinking]
+        )
 
         do {
             let modelContainer = try await load()
@@ -280,6 +311,10 @@ class LLMEvaluator {
                             self.stat = "\(completion.tokensPerSecond) tokens/s"
                         }
                     }
+
+                    if let toolCall = batch.compactMap({ $0.toolCall }).first {
+                        try await handleToolCall(toolCall, prompt: prompt)
+                    }
                 }
             }
 
@@ -303,4 +338,45 @@ class LLMEvaluator {
         generationTask?.cancel()
         running = false
     }
+
+    /// Runs the tool requested by the model, then starts a new generation that includes
+    /// the tool's output.
+    ///
+    /// A name that matches none of the known tools produces the literal result
+    /// `"No tool match"`, which is forwarded like any other tool output.
+    ///
+    /// - Parameters:
+    ///   - toolCall: The tool call to execute.
+    ///   - prompt: The prompt passed back to `generate` together with the tool result.
+    /// - Throws: Any error thrown while executing the matched tool.
+    private func handleToolCall(_ toolCall: ToolCall, prompt: String) async throws {
+        let requestedName = toolCall.function.name
+        let toolOutput: String
+
+        if requestedName == currentWeatherTool.name {
+            toolOutput = try await toolCall.execute(with: currentWeatherTool).toolResult
+        } else if requestedName == addTool.name {
+            toolOutput = try await toolCall.execute(with: addTool).toolResult
+        } else if requestedName == timeTool.name {
+            toolOutput = try await toolCall.execute(with: timeTool).toolResult
+        } else {
+            toolOutput = "No tool match"
+        }
+
+        await generate(prompt: prompt, toolResult: toolOutput)
+    }
+}
+
+/// Input type of the `get_current_weather` tool.
+struct WeatherInput: Codable {
+    let location: String
+    // Optional: the tool's schema declares `unit` as an optional parameter.
+    let unit: String?
+}
+
+/// Output type of the `get_current_weather` tool.
+struct WeatherOutput: Codable {
+    let temperature: Double
+    let conditions: String
+}
+
+/// Input type of the `add_two_numbers` tool: the two integers to add.
+struct AddInput: Codable {
+    let first: Int
+    let second: Int
+}
+
+/// Output type of the `add_two_numbers` tool.
+struct AddOutput: Codable {
+    let result: Int
+}
+
+/// Input type for tools that declare no parameters, such as `get_time`.
+struct EmptyInput: Codable {}
+
+/// Output type of the `get_time` tool.
+struct TimeOutput: Codable {
+    let time: String
 }
@@ -89,6 +89,8 @@ class ChatViewModel {
                 case .info(let info):
                     // Update performance metrics
                     generateCompletionInfo = info
+                case .toolCall(let call):
+                    break
                 }
             }
         }
 
@@ -42,10 +42,15 @@ public enum Chat {
             Self(role: .user, content: content, images: images, videos: videos)
         }
 
+        /// Creates a message with the `tool` role and the given content.
+        ///
+        /// - Parameter content: The text of the message.
+        public static func tool(_ content: String) -> Self {
+            Self(role: .tool, content: content)
+        }
+
+        /// The role attached to a chat message.
         public enum Role: String {
             case user
             case assistant
             case system
+            /// Role used by messages created with `tool(_:)`.
+            case tool
         }
     }
 }
 
@@ -804,6 +804,7 @@ public func generate(
 
             var tokenCount = 0
             var detokenizer = NaiveStreamingDetokenizer(tokenizer: context.tokenizer)
+            let toolCallProcessor = ToolCallProcessor()
 
             for token in iterator {
 
@@ -826,7 +827,16 @@ public func generate(
                 detokenizer.append(token: token)
                 if let chunk = detokenizer.next() {
                     tokenCount += 1
-                    continuation.yield(.chunk(chunk))
+
+                    // Process chunk through the tool call processor
+                    if let textToYield = toolCallProcessor.processChunk(chunk) {
+                        continuation.yield(.chunk(textToYield))
+                    }
+
+                    // Check if we have a complete tool call
+                    if let toolCall = toolCallProcessor.toolCalls.popLast() {
+                        continuation.yield(.toolCall(toolCall))
+                    }
                 }
             }
 
@@ -909,14 +919,19 @@ public struct GenerateCompletionInfo: Sendable {
 public enum Generation: Sendable {
     /// A generated token represented as a String
     case chunk(String)
+
     /// Completion information summarizing token counts and performance metrics.
     case info(GenerateCompletionInfo)
 
+    /// A tool call from the language model.
+    case toolCall(ToolCall)
+
     /// Generated text or nil
     public var chunk: String? {
         switch self {
         case .chunk(let string): string
         case .info: nil
+        case .toolCall: nil
         }
     }
 
@@ -925,6 +940,16 @@ public enum Generation: Sendable {
         switch self {
         case .chunk: nil
         case .info(let info): info
+        case .toolCall: nil
+        }
+    }
+
+    /// Tool call or nil
+    public var toolCall: ToolCall? {
+        switch self {
+        case .chunk: nil
+        case .info: nil
+        case .toolCall(let toolCall): toolCall
         }
     }
 
 
@@ -0,0 +1,14 @@
+// Copyright © 2025 Apple Inc.
+
+import Foundation
+
+/// Adds a JSON string rendering with snake_case keys to every `Encodable` value.
+extension Encodable {
+    /// The value encoded as a JSON string whose keys are converted to snake_case.
+    ///
+    /// Returns `"{}"` when the value cannot be encoded or the encoded data cannot be
+    /// read as UTF-8.
+    public var toolResult: String {
+        let snakeCaseEncoder = JSONEncoder()
+        snakeCaseEncoder.keyEncodingStrategy = .convertToSnakeCase
+
+        if let encoded = try? snakeCaseEncoder.encode(self),
+            let json = String(data: encoded, encoding: .utf8)
+        {
+            return json
+        }
+        return "{}"
+    }
+}
@@ -101,9 +101,8 @@ private class Generator {
                 for await item in try MLXLMCommon.generate(
                     input: input, cache: cache, parameters: generateParameters, context: context)
                 {
-                    switch item {
-                    case .chunk(let chunk): continuation.yield(chunk)
-                    case .info: break
+                    if let chunk = item.chunk {
+                        continuation.yield(chunk)
                     }
                 }
 
 
@@ -0,0 +1,62 @@
+// Copyright © 2025 Apple Inc.
+
+import Foundation
+import Tokenizers
+
+/// Protocol defining the requirements for a tool.
+///
+/// Conforming types must be `Sendable` and expose the schema that describes them.
+public protocol ToolProtocol: Sendable {
+    /// The JSON Schema describing the tool's interface.
+    var schema: ToolSpec { get }
+}
+
+/// A tool that pairs a schema with the handler implementing it.
+///
+/// `Input` is the type handed to the handler and `Output` is the type it returns.
+public struct Tool<Input: Codable, Output: Codable>: ToolProtocol {
+    /// The JSON Schema describing the tool's interface.
+    public let schema: ToolSpec
+
+    /// The closure invoked to run the tool.
+    public let handler: (Input) async throws -> Output
+
+    /// The tool's name, read from the `"name"` entry of the schema's `"function"` dictionary.
+    ///
+    /// An empty string is returned when the schema has no such entry.
+    public var name: String {
+        guard
+            let function = schema["function"] as? [String: Any],
+            let name = function["name"] as? String
+        else {
+            return ""
+        }
+        return name
+    }
+
+    /// Creates a tool, building its schema from a name, a description and a parameter list.
+    ///
+    /// - Parameters:
+    ///   - name: Stored under `"function"` / `"name"` in the schema.
+    ///   - description: Stored under `"function"` / `"description"` in the schema.
+    ///   - parameters: Each parameter's schema is stored under its name in `"properties"`;
+    ///     the names of required parameters are listed under `"required"`.
+    ///   - handler: The closure invoked to run the tool.
+    public init(
+        name: String,
+        description: String,
+        parameters: [ToolParameter],
+        handler: @escaping (Input) async throws -> Output
+    ) {
+        var properties = [String: Any]()
+        for parameter in parameters {
+            properties[parameter.name] = parameter.schema
+        }
+        let requiredNames = parameters.filter { $0.isRequired }.map { $0.name }
+
+        self.schema = [
+            "type": "function",
+            "function": [
+                "name": name,
+                "description": description,
+                "parameters": [
+                    "type": "object",
+                    "properties": properties,
+                    "required": requiredNames,
+                ],
+            ],
+        ]
+
+        self.handler = handler
+    }
+
+    /// Creates a tool from an existing schema.
+    ///
+    /// - Parameters:
+    ///   - schema: The schema stored as-is.
+    ///   - handler: The closure invoked to run the tool.
+    public init(schema: ToolSpec, handler: @escaping (Input) async throws -> Output) {
+        self.handler = handler
+        self.schema = schema
+    }
+}
@@ -0,0 +1,53 @@
+// Copyright © 2025 Apple Inc.
+
+import Foundation
+
+/// A request to call a named function with a set of arguments.
+public struct ToolCall: Hashable, Codable, Sendable {
+    /// Represents the function details for a tool call
+    public struct Function: Hashable, Codable, Sendable {
+        /// The name of the function
+        public let name: String
+
+        /// The arguments passed to the function
+        public let arguments: [String: JSONValue]
+
+        /// Creates the function details, converting every argument value with
+        /// `JSONValue.from(_:)`.
+        ///
+        /// - Parameters:
+        ///   - name: The name of the function.
+        ///   - arguments: The arguments, keyed by parameter name.
+        public init(name: String, arguments: [String: Any]) {
+            self.name = name
+            self.arguments = arguments.mapValues { JSONValue.from($0) }
+        }
+    }
+
+    /// The function to be called
+    public let function: Function
+
+    /// Creates a tool call for the given function.
+    ///
+    /// Declared explicitly because the synthesized memberwise initializer of a public
+    /// struct is internal, which would leave code outside this module unable to
+    /// construct a `ToolCall`.
+    ///
+    /// - Parameter function: The function to be called.
+    public init(function: Function) {
+        self.function = function
+    }
+}
+
+extension ToolCall {
+    /// Decodes this call's arguments into `Input` and runs the tool's handler with them.
+    ///
+    /// - Parameter tool: The tool to run; its name must equal `function.name`.
+    /// - Returns: The value produced by the tool's handler.
+    /// - Throws: `ToolError.nameMismatch` when the names differ, and any error thrown
+    ///   while serializing or decoding the arguments or by the handler itself.
+    public func execute<Input, Output>(with tool: Tool<Input, Output>) async throws -> Output {
+        let expectedName = tool.name
+        if expectedName != function.name {
+            throw ToolError.nameMismatch(toolName: expectedName, functionName: function.name)
+        }
+
+        // Round-trip the arguments through JSON data so they can be decoded as `Input`.
+        let rawArguments = function.arguments.mapValues { $0.anyValue }
+        let payload = try JSONSerialization.data(withJSONObject: rawArguments)
+        let decodedInput = try JSONDecoder().decode(Input.self, from: payload)
+
+        return try await tool.handler(decodedInput)
+    }
+}
+
+/// Errors raised while executing a tool call.
+public enum ToolError: Error, LocalizedError {
+    /// The tool's name differs from the function name carried by the tool call.
+    case nameMismatch(toolName: String, functionName: String)
+
+    /// A human-readable description of the error.
+    public var errorDescription: String? {
+        switch self {
+        case let .nameMismatch(toolName: expected, functionName: actual):
+            "Tool name mismatch: expected '\(expected)' but got '\(actual)'"
+        }
+    }
+}
Original file line number	Diff line number	Diff line change
`@@ -89,6 +89,8 @@ class ChatViewModel {`
`89`	`89`	`case .info(let info):`
`90`	`90`	`// Update performance metrics`
`91`	`91`	`generateCompletionInfo = info`
	`92`	`+ case .toolCall(let call):`
	`93`	`+ break`
`92`	`94`	`}`
`93`	`95`	`}`
`94`	`96`	`}`
Original file line number	Diff line number	Diff line change
`@@ -42,10 +42,15 @@ public enum Chat {`
`42`	`42`	`Self(role: .user, content: content, images: images, videos: videos)`
`43`	`43`	`}`
`44`	`44`
	`45`	`+ public static func tool(_ content: String) -> Self {`
	`46`	`+ Self(role: .tool, content: content)`
	`47`	`+ }`
	`48`	`+`
`45`	`49`	`public enum Role: String {`
`46`	`50`	`case user`
`47`	`51`	`case assistant`
`48`	`52`	`case system`
	`53`	`+ case tool`
`49`	`54`	`}`
`50`	`55`	`}`
`51`	`56`	`}`
Original file line number	Diff line number	Diff line change
`@@ -101,9 +101,8 @@ private class Generator {`
`101`	`101`	`for await item in try MLXLMCommon.generate(`
`102`	`102`	`input: input, cache: cache, parameters: generateParameters, context: context)`
`103`	`103`	`{`
`104`		`- switch item {`
`105`		`- case .chunk(let chunk): continuation.yield(chunk)`
`106`		`- case .info: break`
	`104`	`+ if let chunk = item.chunk {`
	`105`	`+ continuation.yield(chunk)`
`107`	`106`	`}`
`108`	`107`	`}`
`109`	`108`