Update test_agent_evaluators.py to match the new ToolCallAccuracyEvaluator output format

Salma Elshafey · Salma Elshafey · commit a40c91bf59bd · 2025-06-24T00:20:40.000+03:00
diff --git a/sdk/evaluation/azure-ai-evaluation/tests/unittests/test_agent_evaluators.py b/sdk/evaluation/azure-ai-evaluation/tests/unittests/test_agent_evaluators.py
@@ -9,109 +9,87 @@ class TestEvaluate:
     def test_tool_call_accuracy_evaluator_missing_inputs(self, mock_model_config):
         tool_call_accuracy = ToolCallAccuracyEvaluator(model_config=mock_model_config)
 
-        # Test tool_calls provided but missing response
-        with pytest.raises(EvaluationException) as exc_info:
-            tool_call_accuracy(
-                query="Where is the Eiffel Tower?",
-                response="The Eiffel Tower is in Paris.",
-                tool_calls="Test",
-                tool_definitions={
-                    "name": "fetch_weather",
-                    "description": "Fetches the weather information for the specified location.",
-                    "parameters": {
-                        "type": "object",
-                        "properties": {
-                            "location": {
-                                "type": "string",
-                                "description": "The location to fetch weather for."
-                            }
+        # Test with missing tool_calls and response
+        result = tool_call_accuracy(
+            query="Where is the Eiffel Tower?",
+            tool_definitions=[{
+                "name": "fetch_weather",
+                "description": "Fetches the weather information for the specified location.",
+                "parameters": {
+                    "type": "object",
+                    "properties": {
+                        "location": {
+                            "type": "string",
+                            "description": "The location to fetch weather for."
                         }
                     }
                 }
-            )
+            }]
+        )
+        assert not result["applicable"]
+        assert result["tool_call_accurate"] == "not applicable"
+        assert "No tool calls found in response or provided tool_calls." in result["tool_call_accurate_reason"]
 
         # Test with missing tool_definitions
-        with pytest.raises(EvaluationException) as exc_info:
-            tool_call_accuracy(
-                query="Where is the Eiffel Tower?",
-                tool_calls={
-                    "type": "tool_call",
-                    "tool_call": {
-                        "id": "call_K21dwOxgCN2syn4qjutMVV7Z",
-                        "type": "function",
-                    "function": {
-                        "name": "fetch_weather",
-                        "arguments": {
-                            "location": "Tokyo"
-                        }
-                    }
-                    }
+        result = tool_call_accuracy(
+            query="Where is the Eiffel Tower?",
+            tool_definitions=[],
+            tool_calls=[{
+                "type": "tool_call",
+                "name": "fetch_weather",
+                "arguments": {
+                    "location": "Tokyo"
                 }
-            )
-        assert "Tool definitions must be provided." in str(exc_info.value)
-
-        # Test with missing tool_cools
-        with pytest.raises(EvaluationException) as exc_info:
-            tool_call_accuracy(
-                query="Where is the Eiffel Tower?",
-                tool_definitions={
-		            "name": "fetch_weather",
-		            "description": "Fetches the weather information for the specified location.",
-		            "parameters": {
-			            "type": "object",
-			            "properties": {
-                            "location": {
-                                "type": "string",
-                                "description": "The location to fetch weather for."
-                            }
-			            }
-		            }
-	            }
-            )
+            }]
+        )
+        assert not result["applicable"]
+        assert result["tool_call_accurate"] == "not applicable"
+        assert "Tool definitions must be provided." in result["tool_call_accurate_reason"]
 
-        assert "Either response or tool_calls must be provided." in str(exc_info.value)
-
-        # Test response provided but missing tool_calls
-        with pytest.raises(EvaluationException) as exc_info:
-            tool_call_accuracy(
-                query="Where is the Eiffel Tower?",
-                response="The Eiffel Tower is in Paris.",
-                tool_definitions={
-                    "name": "fetch_weather",
-                    "description": "Fetches the weather information for the specified location.",
-                    "parameters": {
-                        "type": "object",
-                        "properties": {
-                            "location": {
-                                "type": "string",
-                                "description": "The location to fetch weather for."
-                            }
+        # Test with response that has no tool calls
+        result = tool_call_accuracy(
+            query="Where is the Eiffel Tower?",
+            response="The Eiffel Tower is in Paris.",
+            tool_definitions=[{
+                "name": "fetch_weather",
+                "description": "Fetches the weather information for the specified location.",
+                "parameters": {
+                    "type": "object",
+                    "properties": {
+                        "location": {
+                            "type": "string",
+                            "description": "The location to fetch weather for."
                         }
                     }
                 }
-            )
-
-        assert "response does not have tool calls. Either provide tool_calls or response with tool calls." in str(exc_info.value)
+            }]
+        )
+        assert not result["applicable"]
+        assert result["tool_call_accurate"] == "not applicable"
+        assert "No tool calls found in response or provided tool_calls." in result["tool_call_accurate_reason"]
 
-        # Test tool_calls provided but missing response
-        with pytest.raises(EvaluationException) as exc_info:
-            tool_call_accuracy(
-                query="Where is the Eiffel Tower?",
-                response="The Eiffel Tower is in Paris.",
-                tool_calls="Test",
-                tool_definitions={
-                    "name": "fetch_weather",
-                    "description": "Fetches the weather information for the specified location.",
-                    "parameters": {
-                        "type": "object",
-                        "properties": {
-                            "location": {
-                                "type": "string",
-                                "description": "The location to fetch weather for."
-                            }
+        # Test with tool call for which definition is not provided
+        result = tool_call_accuracy(
+            query="Where is the Eiffel Tower?",
+            tool_calls=[{
+                "type": "tool_call",
+                "name": "some_other_tool",
+                "arguments": {}
+            }],
+            tool_definitions=[{
+                "name": "fetch_weather",
+                "description": "Fetches the weather information for the specified location.",
+                "parameters": {
+                    "type": "object",
+                    "properties": {
+                        "location": {
+                            "type": "string",
+                            "description": "The location to fetch weather for."
                         }
                     }
                 }
-            )
-
-            assert "Tool definition not found" in str(exc_info.value)
+            }]
+        )
+        assert not result["applicable"]
+        assert result["tool_call_accurate"] == "not applicable"
+        assert "Tool definitions for all tool calls must be provided." in result["tool_call_accurate_reason"]