Skip to content

Commit 3da5ea8

Browse files
authored
Add GPT-5 evals and "minimal" to reasoning dropdown (#2671)
* GPT-5 evals
* Add evals for GPT-5
* Upgrade OpenAI SDK
* Change snapshots to reasoning_effort of minimal
1 parent 570e530 commit 3da5ea8

File tree

31 files changed

+1417
-13
lines changed

31 files changed

+1417
-13
lines changed

app/backend/approaches/chatreadretrieveread.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -162,7 +162,7 @@ async def run_search_approach(
162162
), # Setting too low risks malformed JSON, setting too high may affect performance
163163
temperature=0.0, # Minimize creativity for search query generation
164164
tools=tools,
165-
reasoning_effort="low", # Minimize reasoning for search query generation
165+
reasoning_effort="minimal", # Minimize reasoning for search query generation
166166
),
167167
)
168168

@@ -202,7 +202,7 @@ async def run_search_approach(
202202
model=self.chatgpt_model,
203203
deployment=self.chatgpt_deployment,
204204
usage=chat_completion.usage,
205-
reasoning_effort="low",
205+
reasoning_effort="minimal",
206206
),
207207
ThoughtStep(
208208
"Search using generated search query",

app/backend/requirements.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -212,7 +212,7 @@ multidict==6.0.5
212212
# yarl
213213
oauthlib==3.2.2
214214
# via requests-oauthlib
215-
openai==1.63.0
215+
openai==1.99.8
216216
# via -r requirements.in
217217
opentelemetry-api==1.31.1
218218
# via

app/frontend/src/components/Settings/Settings.tsx

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -335,6 +335,7 @@ export const Settings = ({
335335
}
336336
aria-labelledby={reasoningEffortFieldId}
337337
options={[
338+
{ key: "minimal", text: t("labels.reasoningEffortOptions.minimal") },
338339
{ key: "low", text: t("labels.reasoningEffortOptions.low") },
339340
{ key: "medium", text: t("labels.reasoningEffortOptions.medium") },
340341
{ key: "high", text: t("labels.reasoningEffortOptions.high") }

app/frontend/src/locales/da/translation.json

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -89,6 +89,7 @@
8989
"useQueryRewriting": "Brug forespørgselsomskrivning til informationsgenfinding",
9090
"reasoningEffort": "Ræsonnementsindsats",
9191
"reasoningEffortOptions": {
92+
"minimal": "Minimal (kun GPT-5)",
9293
"low": "Lav",
9394
"medium": "Medium",
9495
"high": "Høj"

app/frontend/src/locales/en/translation.json

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -99,6 +99,7 @@
9999
"useQueryRewriting": "Use query rewriting for retrieval",
100100
"reasoningEffort": "Reasoning effort",
101101
"reasoningEffortOptions": {
102+
"minimal": "Minimal (GPT-5 only)",
102103
"low": "Low",
103104
"medium": "Medium",
104105
"high": "High"

app/frontend/src/locales/es/translation.json

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -93,6 +93,7 @@
9393
"useQueryRewriting": "Utiliza la reescritura de consultas para la recuperación",
9494
"reasoningEffort": "Esfuerzo de razonamiento",
9595
"reasoningEffortOptions": {
96+
"minimal": "Mínimo (solo GPT-5)",
9697
"low": "Bajo",
9798
"medium": "Medio",
9899
"high": "Alto"

app/frontend/src/locales/fr/translation.json

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -95,6 +95,7 @@
9595
"useQueryRewriting": "Utilisez la réécriture des requêtes pour la récupération",
9696
"reasoningEffort": "Effort de raisonnement",
9797
"reasoningEffortOptions": {
98+
"minimal": "Minimal (GPT-5 uniquement)",
9899
"low": "Faible",
99100
"medium": "Moyen",
100101
"high": "Élevé"

app/frontend/src/locales/it/translation.json

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -93,6 +93,7 @@
9393
"useQueryRewriting": "Usa la riscrittura delle query per il recupero",
9494
"reasoningEffort": "Sforzo di ragionamento",
9595
"reasoningEffortOptions": {
96+
"minimal": "Minimo (solo GPT-5)",
9697
"low": "Basso",
9798
"medium": "Medio",
9899
"high": "Alto"

app/frontend/src/locales/ja/translation.json

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -93,6 +93,7 @@
9393
"useQueryRewriting": "検索のためにクエリの書き換えを使用する",
9494
"reasoningEffort": "推論の労力",
9595
"reasoningEffortOptions": {
96+
"minimal": "最小(GPT-5 のみ)",
9697
"low": "低",
9798
"medium": "中",
9899
"high": "高"

app/frontend/src/locales/nl/translation.json

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -93,6 +93,7 @@
9393
"useQueryRewriting": "Gebruik de herformulering van zoekopdrachten om informatie op te halen",
9494
"reasoningEffort": "Redeneerinspanning",
9595
"reasoningEffortOptions": {
96+
"minimal": "Minimaal (alleen GPT-5)",
9697
"low": "Laag",
9798
"medium": "Gemiddeld",
9899
"high": "Hoog"

0 commit comments

Comments
 (0)