@@ -104,7 +104,6 @@ def test_evaluate_tools_valid1(self, mock_model_config):
104
104
assert "per_tool_call_details" in result
105
105
assert ToolCallAccuracyEvaluator ._EXCESS_TOOL_CALLS_KEY in result
106
106
assert ToolCallAccuracyEvaluator ._MISSING_TOOL_CALLS_KEY in result
107
- assert result ["applicable" ] is True
108
107
109
108
def test_evaluate_tools_valid2 (self , mock_model_config ):
110
109
evaluator = ToolCallAccuracyEvaluator (model_config = mock_model_config )
@@ -163,7 +162,6 @@ def test_evaluate_tools_valid2(self, mock_model_config):
163
162
assert "per_tool_call_details" in result
164
163
assert ToolCallAccuracyEvaluator ._EXCESS_TOOL_CALLS_KEY in result
165
164
assert ToolCallAccuracyEvaluator ._MISSING_TOOL_CALLS_KEY in result
166
- assert result ["applicable" ] is True
167
165
168
166
def test_evaluate_tools_valid3 (self , mock_model_config ):
169
167
evaluator = ToolCallAccuracyEvaluator (model_config = mock_model_config )
@@ -222,7 +220,6 @@ def test_evaluate_tools_valid3(self, mock_model_config):
222
220
assert "per_tool_call_details" in result
223
221
assert ToolCallAccuracyEvaluator ._EXCESS_TOOL_CALLS_KEY in result
224
222
assert ToolCallAccuracyEvaluator ._MISSING_TOOL_CALLS_KEY in result
225
- assert result ["applicable" ] is True
226
223
227
224
def test_evaluate_tools_one_eval_fails (self , mock_model_config ):
228
225
with pytest .raises (EvaluationException ) as exc_info :
@@ -311,7 +308,6 @@ def test_evaluate_tools_some_not_applicable(self, mock_model_config):
311
308
assert result ["per_tool_call_details" ] == {}
312
309
assert result [ToolCallAccuracyEvaluator ._EXCESS_TOOL_CALLS_KEY ] == {}
313
310
assert result [ToolCallAccuracyEvaluator ._MISSING_TOOL_CALLS_KEY ] == {}
314
- assert result ["applicable" ] is False
315
311
316
312
def test_evaluate_tools_all_not_applicable (self , mock_model_config ):
317
313
evaluator = ToolCallAccuracyEvaluator (model_config = mock_model_config )
@@ -351,7 +347,6 @@ def test_evaluate_tools_all_not_applicable(self, mock_model_config):
351
347
assert result ["per_tool_call_details" ] == {}
352
348
assert result [ToolCallAccuracyEvaluator ._EXCESS_TOOL_CALLS_KEY ] == {}
353
349
assert result [ToolCallAccuracyEvaluator ._MISSING_TOOL_CALLS_KEY ] == {}
354
- assert result ["applicable" ] is False
355
350
356
351
def test_evaluate_tools_no_tools (self , mock_model_config ):
357
352
evaluator = ToolCallAccuracyEvaluator (model_config = mock_model_config )
@@ -383,5 +378,4 @@ def test_evaluate_tools_no_tools(self, mock_model_config):
383
378
assert result [f"{ key } _reason" ] == ToolCallAccuracyEvaluator ._NO_TOOL_CALLS_MESSAGE
384
379
assert result ["per_tool_call_details" ] == {}
385
380
assert result [ToolCallAccuracyEvaluator ._EXCESS_TOOL_CALLS_KEY ] == {}
386
- assert result [ToolCallAccuracyEvaluator ._MISSING_TOOL_CALLS_KEY ] == {}
387
- assert result ["applicable" ] is False
381
+ assert result [ToolCallAccuracyEvaluator ._MISSING_TOOL_CALLS_KEY ] == {}
0 commit comments