-
Notifications
You must be signed in to change notification settings - Fork 25
/
Copy pathopenrouter.py
79 lines (62 loc) · 2.2 KB
/
openrouter.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
import json
from asyncio import sleep
import httpx
from ..logger import logger
from .client import Client
from .types import ChatFormatRequest
# Preferred provider routing arguments.
# Change depending on what model you'd like to use.
PROVIDER = {"order": ["Together", "DeepInfra"]}
class Response:
def __init__(self, response):
self.text = response
class OpenRouter(Client):
def __init__(
self,
model: str,
api_key: str | None = None,
base_url="https://openrouter.ai/api/v1/chat/completions",
):
super().__init__(model)
self.headers = {"Authorization": f"Bearer {api_key}"}
self.url = base_url
self.client = httpx.AsyncClient()
def postprocess(self, response):
response_json = response.json()
msg = response_json["choices"][0]["message"]["content"]
return Response(msg)
async def generate( # type: ignore
self,
prompt: ChatFormatRequest,
raw: bool = False,
max_retries: int = 1,
**kwargs, # type: ignore
) -> Response: # type: ignore
kwargs.pop("schema", None)
max_tokens = kwargs.pop("max_tokens", 500)
temperature = kwargs.pop("temperature", 1.0)
data = {
"model": self.model,
"messages": prompt,
# "provider": PROVIDER,
"max_tokens": max_tokens,
"temperature": temperature,
}
for attempt in range(max_retries):
try:
response = await self.client.post(
url=self.url, json=data, headers=self.headers
)
if raw:
return response.json()
result = self.postprocess(response)
return result
except json.JSONDecodeError:
logger.warning(
f"Attempt {attempt + 1}: Invalid JSON response, retrying..."
)
except Exception as e:
logger.warning(f"Attempt {attempt + 1}: {str(e)}, retrying...")
await sleep(1)
logger.error("All retry attempts failed.")
raise RuntimeError("Failed to generate text after multiple attempts.")