Skip to content

Commit b719c6f

Browse files
authored
update sdk version (#94)
* update sdk version for updated types
* bump version + update changelog
1 parent 32513d5 commit b719c6f

File tree

4 files changed

+50
-9
lines changed

4 files changed

+50
-9
lines changed

CHANGELOG.md

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7,6 +7,10 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
77

88
## [Unreleased]
99

10+
## [1.0.23] 2025-06-24
11+
12+
- Update `codex-sdk` dependency to `0.1.0a22`
13+
1014
## [1.0.22] 2025-06-23
1115

1216
- Remove quality_preset arg
@@ -108,7 +112,8 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
108112

109113
- Initial release of the `cleanlab-codex` client library.
110114

111-
[Unreleased]: https://github.com/cleanlab/cleanlab-codex/compare/v1.0.22...HEAD
115+
[Unreleased]: https://github.com/cleanlab/cleanlab-codex/compare/v1.0.23...HEAD
116+
[1.0.23]: https://github.com/cleanlab/cleanlab-codex/compare/v1.0.22...v1.0.23
112117
[1.0.22]: https://github.com/cleanlab/cleanlab-codex/compare/v1.0.21...v1.0.22
113118
[1.0.21]: https://github.com/cleanlab/cleanlab-codex/compare/v1.0.20...v1.0.21
114119
[1.0.20]: https://github.com/cleanlab/cleanlab-codex/compare/v1.0.19...v1.0.20

pyproject.toml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -26,7 +26,7 @@ classifiers = [
2626
]
2727
dependencies = [
2828
"cleanlab-tlm~=1.1",
29-
"codex-sdk==0.1.0a21",
29+
"codex-sdk==0.1.0a22",
3030
"pydantic>=2.0.0, <3",
3131
]
3232

src/cleanlab_codex/__about__.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,2 +1,2 @@
11
# SPDX-License-Identifier: MIT
2-
__version__ = "1.0.22"
2+
__version__ = "1.0.23"

tests/test_validator.py

Lines changed: 42 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -15,9 +15,21 @@ def mock_project() -> Generator[Mock, None, None]:
1515
is_bad_response=True,
1616
expert_answer=None,
1717
eval_scores={
18-
"response_helpfulness": EvalScores(score=0.95, failed=False),
19-
"trustworthiness": EvalScores(score=0.5, failed=True),
18+
"response_helpfulness": EvalScores(
19+
score=0.95,
20+
triggered=False,
21+
triggered_escalation=False,
22+
triggered_guardrail=False,
23+
),
24+
"trustworthiness": EvalScores(
25+
score=0.5,
26+
triggered=True,
27+
triggered_escalation=True,
28+
triggered_guardrail=True,
29+
),
2030
},
31+
escalated_to_sme=True,
32+
should_guardrail=True,
2133
)
2234
mock.from_access_key.return_value = mock_obj
2335
yield mock
@@ -31,9 +43,21 @@ def mock_project_with_custom_thresholds() -> Generator[Mock, None, None]:
3143
is_bad_response=False,
3244
expert_answer=None,
3345
eval_scores={
34-
"response_helpfulness": EvalScores(score=0.95, failed=False),
35-
"trustworthiness": EvalScores(score=0.5, failed=False),
46+
"response_helpfulness": EvalScores(
47+
score=0.95,
48+
triggered=False,
49+
triggered_escalation=False,
50+
triggered_guardrail=False,
51+
),
52+
"trustworthiness": EvalScores(
53+
score=0.5,
54+
triggered=False,
55+
triggered_escalation=False,
56+
triggered_guardrail=False,
57+
),
3658
},
59+
escalated_to_sme=False,
60+
should_guardrail=False,
3761
)
3862
mock.from_access_key.return_value = mock_obj
3963
yield mock
@@ -66,9 +90,21 @@ def test_validate_expert_answer(self, mock_project: Mock) -> None:
6690
is_bad_response=True,
6791
expert_answer="expert answer",
6892
eval_scores={
69-
"response_helpfulness": EvalScores(score=0.95, failed=False),
70-
"trustworthiness": EvalScores(score=0.5, failed=True),
93+
"response_helpfulness": EvalScores(
94+
score=0.95,
95+
triggered=False,
96+
triggered_escalation=False,
97+
triggered_guardrail=False,
98+
),
99+
"trustworthiness": EvalScores(
100+
score=0.5,
101+
triggered=True,
102+
triggered_escalation=True,
103+
triggered_guardrail=True,
104+
),
71105
},
106+
escalated_to_sme=True,
107+
should_guardrail=True,
72108
)
73109
# Basically any response will be flagged as untrustworthy
74110
result = validator.validate(query="test query", context="test context", response="test response")

0 commit comments

Comments
 (0)