Skip to content

Commit a8b7419

Browse files
authored
Add header to Codex API requests for capturing product analytics data (#53)
* pass metadata in header for codex API requests to indicate integration type * hatch fmt * small fixes * ignore type check in test * include cleanlab-codex version in headers for codex backend requests * update client lib version * respond to PR feedback * add instructions to DEVELOPMENT for how to build and install the package locally * small changes re: angela's feedback * amend changelog
1 parent 1f02e3c commit a8b7419

10 files changed

+204
-150
lines changed

CHANGELOG.md

+5-1
Original file line numberDiff line numberDiff line change
@@ -7,8 +7,11 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
77

88
## [Unreleased]
99

10+
## [1.0.2] - 2025-03-07
11+
1012
- Extract scores and metadata from detection functions in `response_validation.py`.
1113
- Normalize scores used by `is_fallback_response` function to be between 0 and 1.
14+
- Pass metadata in headers for query requests.
1215

1316
## [1.0.1] - 2025-02-26
1417

@@ -18,6 +21,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
1821

1922
- Initial release of the `cleanlab-codex` client library.
2023

21-
[Unreleased]: https://github.com/cleanlab/cleanlab-codex/compare/v1.0.1...HEAD
24+
[Unreleased]: https://github.com/cleanlab/cleanlab-codex/compare/v1.0.2...HEAD
25+
[1.0.2]: https://github.com/cleanlab/cleanlab-codex/compare/v1.0.1...v1.0.2
2226
[1.0.1]: https://github.com/cleanlab/cleanlab-codex/compare/v1.0.0...v1.0.1
2327
[1.0.0]: https://github.com/cleanlab/cleanlab-codex/compare/267a93300f77c94e215d7697223931e7926cad9e...v1.0.0

DEVELOPMENT.md

+9
Original file line numberDiff line numberDiff line change
@@ -90,6 +90,15 @@ Automated releases are handled by the [release workflow][release-workflow] which
9090
[hatch-version]: https://hatch.pypa.io/latest/version/#updating
9191
[changelog]: CHANGELOG.md
9292

93+
94+
### How to build and install the package locally
95+
96+
You may want to build and install the package locally - for example, to see how your changes affect other Python code in a script or Jupyter notebook.
97+
98+
To do this, you can build the package with `hatch build` and then install it in your local environment with `pip install dist/cleanlab_codex-<version>-py3-none-any.whl`.
99+
100+
Alternatively, you can use `pip install -e /path/to/cleanlab-codex` to install the package from your local code. Note that if you make further local changes after that, you may need to reload the module, i.e. `reload(cleanlab_codex)`, or restart the kernel.
101+
93102
## Continuous integration
94103

95104
Testing, type checking, and formatting/linting is [checked in CI][ci].

src/cleanlab_codex/__about__.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,2 +1,2 @@
11
# SPDX-License-Identifier: MIT
2-
__version__ = "1.0.1"
2+
__version__ = "1.0.2"

src/cleanlab_codex/codex_tool.py

+6-1
Original file line numberDiff line numberDiff line change
@@ -6,6 +6,7 @@
66

77
from typing_extensions import Annotated
88

9+
from cleanlab_codex.internal.analytics import IntegrationType, _AnalyticsMetadata
910
from cleanlab_codex.project import Project
1011
from cleanlab_codex.utils.errors import MissingDependencyError
1112
from cleanlab_codex.utils.function import (
@@ -110,7 +111,11 @@ def query(
110111
Returns:
111112
The answer to the question if available. If no answer is available, this returns a fallback answer or None.
112113
"""
113-
return self._project.query(question, fallback_answer=self._fallback_answer)[0]
114+
return self._project.query(
115+
question=question,
116+
fallback_answer=self._fallback_answer,
117+
analytics_metadata=_AnalyticsMetadata(integration_type=IntegrationType.TOOL),
118+
)[0]
114119

115120
def to_openai_tool(self) -> dict[str, Any]:
116121
"""Converts the tool to the expected format for an [OpenAI function tool](https://platform.openai.com/docs/guides/function-calling).
+26
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,26 @@
1+
from __future__ import annotations
2+
3+
from enum import Enum
4+
5+
from cleanlab_codex.__about__ import __version__ as package_version
6+
7+
8+
class IntegrationType(str, Enum):
9+
"""Supported methods for integrating Codex into a RAG system using this library."""
10+
11+
BACKUP = "backup"
12+
TOOL = "tool"
13+
14+
15+
class _AnalyticsMetadata:
16+
def __init__(self, *, integration_type: IntegrationType):
17+
self._integration_type = integration_type
18+
self._package_version = package_version
19+
self._source = "cleanlab-codex-python"
20+
21+
def to_headers(self) -> dict[str, str]:
22+
return {
23+
"X-Integration-Type": self._integration_type,
24+
"X-Client-Library-Version": self._package_version,
25+
"X-Source": self._source,
26+
}

src/cleanlab_codex/internal/project.py

-40
This file was deleted.

src/cleanlab_codex/project.py

+35-5
Original file line numberDiff line numberDiff line change
@@ -8,16 +8,17 @@
88

99
from codex import AuthenticationError
1010

11-
from cleanlab_codex.internal.project import query_project
11+
from cleanlab_codex.internal.analytics import IntegrationType, _AnalyticsMetadata
1212
from cleanlab_codex.internal.sdk_client import client_from_access_key
13+
from cleanlab_codex.types.entry import Entry
1314
from cleanlab_codex.types.project import ProjectConfig
1415

1516
if _TYPE_CHECKING:
1617
from datetime import datetime
1718

1819
from codex import Codex as _Codex
1920

20-
from cleanlab_codex.types.entry import Entry, EntryCreate
21+
from cleanlab_codex.types.entry import EntryCreate
2122

2223
_ERROR_CREATE_ACCESS_KEY = (
2324
"Failed to create access key. Please ensure you have the necessary permissions "
@@ -159,6 +160,7 @@ def query(
159160
*,
160161
fallback_answer: Optional[str] = None,
161162
read_only: bool = False,
163+
analytics_metadata: Optional[_AnalyticsMetadata] = None,
162164
) -> tuple[Optional[str], Optional[Entry]]:
163165
"""Query Codex to check if this project contains an answer to the question. Add the question to the project for SME review if it does not.
164166
@@ -173,10 +175,38 @@ def query(
173175
If Codex is able to answer the question, the first element will be the answer returned by Codex and the second element will be the existing [`Entry`](/codex/api/python/types.entry#class-entry) in the Codex project.
174176
If Codex is unable to answer the question, the first element will be `fallback_answer` if provided, otherwise None. The second element will be a new [`Entry`](/codex/api/python/types.entry#class-entry) in the Codex project.
175177
"""
176-
return query_project(
177-
client=self._sdk_client,
178+
if not analytics_metadata:
179+
analytics_metadata = _AnalyticsMetadata(integration_type=IntegrationType.BACKUP)
180+
181+
return self._query_project(
178182
question=question,
179-
project_id=self.id,
180183
fallback_answer=fallback_answer,
181184
read_only=read_only,
185+
analytics_metadata=analytics_metadata,
182186
)
187+
188+
def _query_project(
189+
self,
190+
question: str,
191+
*,
192+
fallback_answer: Optional[str] = None,
193+
read_only: bool = False,
194+
analytics_metadata: Optional[_AnalyticsMetadata] = None,
195+
) -> tuple[Optional[str], Optional[Entry]]:
196+
extra_headers = analytics_metadata.to_headers() if analytics_metadata else None
197+
maybe_entry = self._sdk_client.projects.entries.query(self._id, question=question, extra_headers=extra_headers)
198+
199+
if maybe_entry is not None:
200+
entry = Entry.model_validate(maybe_entry.model_dump())
201+
if entry.answer is not None:
202+
return entry.answer, entry
203+
204+
return fallback_answer, entry
205+
206+
if not read_only:
207+
created_entry = Entry.model_validate(
208+
self._sdk_client.projects.entries.add_question(self._id, question=question).model_dump()
209+
)
210+
return fallback_answer, created_entry
211+
212+
return fallback_answer, None

tests/internal/test_analytics.py

+21
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,21 @@
1+
from __future__ import annotations
2+
3+
import pytest
4+
5+
from cleanlab_codex.__about__ import __version__ as package_version
6+
from cleanlab_codex.internal.analytics import IntegrationType, _AnalyticsMetadata
7+
8+
9+
def test_analytics_metadata_to_headers_uses_defaults() -> None:
10+
metadata = _AnalyticsMetadata(integration_type=IntegrationType.BACKUP)
11+
12+
assert metadata.to_headers() == {
13+
"X-Integration-Type": IntegrationType.BACKUP,
14+
"X-Source": "cleanlab-codex-python",
15+
"X-Client-Library-Version": package_version,
16+
}
17+
18+
19+
def test_analytics_metadata_requires_integration_type() -> None:
20+
with pytest.raises(TypeError):
21+
_AnalyticsMetadata() # type: ignore[call-arg]

0 commit comments

Comments
 (0)