Skip to content

Commit 1e57a1b

Browse files
committed
[owl] Increase max tokens for query rewrite (#926)
* Increase max tokens for query rewrite * gpt-4o-mini-audio-preview is deprecated; update to gpt-audio-mini
1 parent fa92fd3 commit 1e57a1b

2 files changed

Lines changed: 4 additions & 4 deletions

File tree

services/api/src/owl/utils/lm.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2114,7 +2114,7 @@ async def _generate_search_query(
21142114
hyperparams.update(
21152115
temperature=0.01,
21162116
top_p=0.01,
2117-
max_tokens=1000,
2117+
max_tokens=10000,
21182118
stream=False,
21192119
reasoning_effort="minimal",
21202120
)

services/api/tests/gen_table/test_row_ops.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -152,10 +152,10 @@ def setup():
152152
create_model_config(
153153
{
154154
# "id": "openai/Qwen/Qwen-2-Audio-7B",
155-
"id": "openai/gpt-4o-mini-audio-preview",
155+
"id": "openai/gpt-audio-mini",
156156
"type": "llm",
157157
# "name": "ELLM Qwen2 Audio (7B)",
158-
"name": "OpenAI GPT-4o Mini Audio Preview",
158+
"name": "OpenAI GPT Audio Mini",
159159
"capabilities": ["chat", "audio"],
160160
"context_length": 128000,
161161
"languages": ["en"],
@@ -174,7 +174,7 @@ def setup():
174174
DeploymentCreate(
175175
model_id=llm_config_audio.id,
176176
# name="ELLM Qwen2 Audio (7B) Deployment",
177-
name="OpenAI GPT-4o Mini Audio Preview Deployment",
177+
name="OpenAI GPT Audio Mini Deployment",
178178
# provider=CloudProvider.ELLM,
179179
provider=CloudProvider.OPENAI,
180180
routing_id=llm_config_audio.id,

0 commit comments

Comments
 (0)