Fix calculator tool call

VyasGuru · sanchitmonga22 · commit 04d22b3fa3c2 · 2026-04-14T13:07:02.000-07:00
diff --git a/examples/ios/RunAnywhereAI/RunAnywhereAI/Features/Chat/ViewModels/LLMViewModel+ToolCalling.swift b/examples/ios/RunAnywhereAI/RunAnywhereAI/Features/Chat/ViewModels/LLMViewModel+ToolCalling.swift
@@ -69,10 +69,13 @@ extension LLMViewModel {
             toolCallInfo = nil
         }
 
+        // Strip any residual <think> tags before displaying
+        let displayText = Self.stripThinkTags(from: result.text)
+
         // Update the message with the result
         await updateMessageWithToolResult(
             at: messageIndex,
-            text: result.text,
+            text: displayText,
             toolCallInfo: toolCallInfo
         )
     }
diff --git a/examples/ios/RunAnywhereAI/RunAnywhereAI/Features/Chat/Views/ChatInterfaceView.swift b/examples/ios/RunAnywhereAI/RunAnywhereAI/Features/Chat/Views/ChatInterfaceView.swift
@@ -31,6 +31,7 @@ struct ChatInterfaceView: View {
     @State private var showingLoRAManagement = false
     @State private var pendingLoRAURL: URL?
     @State private var loraScale: Float = 1.0
+    @ObservedObject private var toolSettingsViewModel = ToolSettingsViewModel.shared
     @AppStorage("thinkingModeEnabled") private var thinkingModeEnabled = false
     @FocusState private var isTextFieldFocused: Bool
 
@@ -452,7 +453,7 @@ extension ChatInterfaceView {
                     thinkingModeBadge
                 }
 
-                if viewModel.useToolCalling {
+                if viewModel.useToolCalling && !toolSettingsViewModel.registeredTools.isEmpty {
                     toolCallingBadge
                 }
 
diff --git a/examples/ios/RunAnywhereAI/RunAnywhereAI/Features/Settings/ToolSettingsView.swift b/examples/ios/RunAnywhereAI/RunAnywhereAI/Features/Settings/ToolSettingsView.swift
@@ -84,11 +84,22 @@ class ToolSettingsViewModel: ObservableObject {
                     category: "Utility"
                 ),
                 executor: { args in
-                    let expression = args["expression"]?.stringValue
-                        ?? args["input"]?.stringValue
-                        ?? args["expr"]?.stringValue
-                        ?? args.values.compactMap(\.stringValue).first
-                        ?? "0"
+                    // Extract expression from args, handling both string and number ToolValue types
+                    let expression: String = {
+                        let keys = ["expression", "input", "expr"]
+                        for key in keys {
+                            if let val = args[key] {
+                                if let s = val.stringValue { return s }
+                                if let n = val.numberValue { return "\(n)" }
+                            }
+                        }
+                        // Fallback: try any value in the dict
+                        for val in args.values {
+                            if let s = val.stringValue { return s }
+                            if let n = val.numberValue { return "\(n)" }
+                        }
+                        return "0"
+                    }()
                     print("Calculator received args: \(args), using expression: '\(expression)'")
                     // Clean the expression - remove any non-math characters
                     let cleanedExpression = expression
@@ -98,16 +109,22 @@ class ToolSettingsViewModel: ObservableObject {
                         .replacingOccurrences(of: "÷", with: "/")
                         .trimmingCharacters(in: .whitespacesAndNewlines)
 
-                    do {
-                        let exp = NSExpression(format: cleanedExpression)
-                        if let result = exp.expressionValue(with: nil, context: nil) as? NSNumber {
-                            return [
-                                "result": .number(result.doubleValue),
-                                "expression": .string(expression)
-                            ]
-                        }
-                    } catch {
-                        // Fall through to error
+                    // Validate expression contains only safe math characters
+                    let allowedChars = CharacterSet(charactersIn: "0123456789.+-*/() ")
+                    guard cleanedExpression.unicodeScalars.allSatisfy({ allowedChars.contains($0) }),
+                          !cleanedExpression.isEmpty else {
+                        return [
+                            "error": .string("Could not evaluate expression: \(expression)"),
+                            "expression": .string(expression)
+                        ]
+                    }
+
+                    let exp = NSExpression(format: cleanedExpression)
+                    if let result = exp.expressionValue(with: nil, context: nil) as? NSNumber {
+                        return [
+                            "result": .number(result.doubleValue),
+                            "expression": .string(expression)
+                        ]
                     }
                     return [
                         "error": .string("Could not evaluate expression: \(expression)"),
diff --git a/examples/ios/RunAnywhereAI/RunAnywhereAI/Features/Voice/VoiceAgentViewModel.swift b/examples/ios/RunAnywhereAI/RunAnywhereAI/Features/Voice/VoiceAgentViewModel.swift
@@ -389,7 +389,8 @@ final class VoiceAgentViewModel: ObservableObject {
         do {
             let settings = SettingsViewModel.shared
             let voiceConfig = VoiceSessionConfig(
-                thinkingModeEnabled: settings.loadedModelSupportsThinking && settings.thinkingModeEnabled
+                thinkingModeEnabled: settings.loadedModelSupportsThinking && settings.thinkingModeEnabled,
+                maxTokens: settings.maxTokens
             )
             session = try await RunAnywhere.startVoiceSession(config: voiceConfig)
             sessionState = .listening
diff --git a/sdk/runanywhere-commons/src/features/llm/tool_calling.cpp b/sdk/runanywhere-commons/src/features/llm/tool_calling.cpp
@@ -399,13 +399,41 @@ static bool extract_json_value(const char* json_obj, const char* key, char** out
                                         *out_is_object = true;
                                         return true;
                                     }
+                                } else {
+                                    // Scalar value (number, boolean, null)
+                                    // Read until comma, closing brace or bracket, or newline
+                                    size_t val_start = pos;
+                                    size_t val_end = pos;
+                                    while (val_end < len && json_obj[val_end] != ',' &&
+                                           json_obj[val_end] != '}' && json_obj[val_end] != ']' &&
+                                           json_obj[val_end] != '\n') {
+                                        val_end++;
+                                    }
+                                    // Trim trailing whitespace
+                                    while (val_end > val_start &&
+                                           (json_obj[val_end - 1] == ' ' || json_obj[val_end - 1] == '\t')) {
+                                        val_end--;
+                                    }
+                                    if (val_end > val_start) {
+                                        size_t val_len = val_end - val_start;
+                                        *out_value = static_cast<char*>(malloc(val_len + 1));
+                                        if (*out_value) {
+                                            memcpy(*out_value, json_obj + val_start, val_len);
+                                            (*out_value)[val_len] = '\0';
+                                        }
+                                        *out_is_object = false;
+                                        return true;
+                                    }
                                 }
                             }
                         }
                     }
 
                     // Move to end of key for continued scanning
+                    // Skip the in_string toggle - extract_json_string already
+                    // consumed the closing quote so in_string must stay false.
                     i = key_end - 1;
+                    continue;
                 }
             }
             in_string = !in_string;
@@ -664,10 +692,46 @@ static bool extract_tool_name_and_args(const char* json_obj, char** out_tool_nam
                     }
                 }
 
-                // No arguments found - use empty object
-                *out_args_json = static_cast<char*>(malloc(3));
-                if (*out_args_json) {
-                    std::memcpy(*out_args_json, "{}", 3);
+                // No standard argument wrapper key found.
+                // Fallback: collect all remaining keys (excluding the tool name key)
+                // as flat arguments. This handles LLM output like:
+                // {"tool": "calculate", "expression": "5 * 100"}
+                {
+                    std::vector<std::string> all_keys = get_json_keys(json_obj);
+                    std::string flat_args = "{";
+                    bool first = true;
+                    for (const auto& k : all_keys) {
+                        // Skip the key that matched the tool name
+                        bool is_tool_key = false;
+                        for (int t = 0; TOOL_NAME_KEYS[t] != nullptr; t++) {
+                            if (str_equals_ignore_case(k.c_str(), TOOL_NAME_KEYS[t])) {
+                                is_tool_key = true;
+                                break;
+                            }
+                        }
+                        if (is_tool_key) continue;
+
+                        char* kval = nullptr;
+                        bool kval_is_obj = false;
+                        if (extract_json_value(json_obj, k.c_str(), &kval, &kval_is_obj)) {
+                            if (!first) flat_args += ",";
+                            std::string escaped_key = escape_json_string(k.c_str());
+                            if (kval_is_obj) {
+                                flat_args += "\"" + escaped_key + "\":" + std::string(kval);
+                            } else if (kval) {
+                                std::string escaped_val = escape_json_string(kval);
+                                flat_args += "\"" + escaped_key + "\":\"" + escaped_val + "\"";
+                            }
+                            free(kval);
+                            first = false;
+                        }
+                    }
+                    flat_args += "}";
+
+                    *out_args_json = static_cast<char*>(malloc(flat_args.size() + 1));
+                    if (*out_args_json) {
+                        std::memcpy(*out_args_json, flat_args.c_str(), flat_args.size() + 1);
+                    }
                 }
                 return true;
             }
diff --git a/sdk/runanywhere-swift/Sources/RunAnywhere/Public/Extensions/LLM/RunAnywhere+ToolCalling.swift b/sdk/runanywhere-swift/Sources/RunAnywhere/Public/Extensions/LLM/RunAnywhere+ToolCalling.swift
@@ -168,8 +168,17 @@ public extension RunAnywhere {
         let registeredTools = await ToolRegistry.shared.getAll()
         let tools = opts.tools ?? registeredTools
 
+        // Extract /no_think prefix before building the full prompt so it stays
+        // at the beginning where the C++ inference layer expects it.
+        let noThinkPrefix = "/no_think\n"
+        let hasNoThink = prompt.hasPrefix(noThinkPrefix)
+        let cleanPrompt = hasNoThink ? String(prompt.dropFirst(noThinkPrefix.count)) : prompt
+
         let systemPrompt = buildToolSystemPrompt(tools: tools, options: opts)
-        var fullPrompt = systemPrompt.isEmpty ? prompt : "\(systemPrompt)\n\nUser: \(prompt)"
+        var fullPrompt = systemPrompt.isEmpty ? cleanPrompt : "\(systemPrompt)\n\nUser: \(cleanPrompt)"
+        if hasNoThink {
+            fullPrompt = "\(noThinkPrefix)\(fullPrompt)"
+        }
 
         var allToolCalls: [ToolCall] = []
         var allToolResults: [ToolResult] = []
diff --git a/sdk/runanywhere-swift/Sources/RunAnywhere/Public/Extensions/VoiceAgent/RunAnywhere+VoiceSession.swift b/sdk/runanywhere-swift/Sources/RunAnywhere/Public/Extensions/VoiceAgent/RunAnywhere+VoiceSession.swift
@@ -228,12 +228,11 @@ public actor VoiceSessionHandle {
                 effectivePrompt = transcription
             }
 
-            let rawResponse = try await RunAnywhere.voiceAgentGenerateResponse(effectivePrompt)
-
-            // Step 3: Parse out <think> tags from response before TTS
-            let parsed = ThinkingContentParser.extract(from: rawResponse)
-            cleanedResponse = parsed.text
-            thinkingContent = parsed.thinking
+            let options = LLMGenerationOptions(maxTokens: config.maxTokens ?? 100)
+            let result = try await RunAnywhere.generate(effectivePrompt, options: options)
+            // generate() already runs ThinkingContentParser internally
+            cleanedResponse = result.text
+            thinkingContent = result.thinkingContent
 
             emit(.responded(text: cleanedResponse, thinkingContent: thinkingContent))
 
diff --git a/sdk/runanywhere-swift/Sources/RunAnywhere/Public/Extensions/VoiceAgent/VoiceAgentTypes.swift b/sdk/runanywhere-swift/Sources/RunAnywhere/Public/Extensions/VoiceAgent/VoiceAgentTypes.swift
@@ -225,18 +225,23 @@ public struct VoiceSessionConfig: Sendable {
     /// Whether thinking mode is enabled for the LLM.
     public var thinkingModeEnabled: Bool
 
+    /// Maximum tokens for LLM generation (nil uses SDK default of 100)
+    public var maxTokens: Int?
+
     public init(
         silenceDuration: TimeInterval = 1.5,
         speechThreshold: Float = 0.1,
         autoPlayTTS: Bool = true,
         continuousMode: Bool = true,
-        thinkingModeEnabled: Bool = false
+        thinkingModeEnabled: Bool = false,
+        maxTokens: Int? = nil
     ) {
         self.silenceDuration = silenceDuration
         self.speechThreshold = speechThreshold
         self.autoPlayTTS = autoPlayTTS
         self.continuousMode = continuousMode
         self.thinkingModeEnabled = thinkingModeEnabled
+        self.maxTokens = maxTokens
     }
 
     /// Default configuration

Original file line number	Diff line number	Diff line change
`@@ -69,10 +69,13 @@ extension LLMViewModel {`
`69`	`69`	`toolCallInfo = nil`
`70`	`70`	`}`
`71`	`71`
	`72`	`+ // Strip any residual <think> tags before displaying`
	`73`	`+ let displayText = Self.stripThinkTags(from: result.text)`
	`74`	`+`
`72`	`75`	`// Update the message with the result`
`73`	`76`	`await updateMessageWithToolResult(`
`74`	`77`	`at: messageIndex,`
`75`		`- text: result.text,`
	`78`	`+ text: displayText,`
`76`	`79`	`toolCallInfo: toolCallInfo`
`77`	`80`	`)`
`78`	`81`	`}`
Original file line number	Diff line number	Diff line change
`@@ -31,6 +31,7 @@ struct ChatInterfaceView: View {`
`31`	`31`	`@State private var showingLoRAManagement = false`
`32`	`32`	`@State private var pendingLoRAURL: URL?`
`33`	`33`	`@State private var loraScale: Float = 1.0`
	`34`	`+ @ObservedObject private var toolSettingsViewModel = ToolSettingsViewModel.shared`
`34`	`35`	`@AppStorage("thinkingModeEnabled") private var thinkingModeEnabled = false`
`35`	`36`	`@FocusState private var isTextFieldFocused: Bool`
`36`	`37`
`@@ -452,7 +453,7 @@ extension ChatInterfaceView {`
`452`	`453`	`thinkingModeBadge`
`453`	`454`	`}`
`454`	`455`
`455`		`- if viewModel.useToolCalling {`
	`456`	`+ if viewModel.useToolCalling && !toolSettingsViewModel.registeredTools.isEmpty {`
`456`	`457`	`toolCallingBadge`
`457`	`458`	`}`
`458`	`459`