Skip to content

Commit d4389f6

Browse files
committed
updated klavis
1 parent 78dbd75 commit d4389f6

2 files changed

Lines changed: 9 additions & 5 deletions

File tree

tests/pytest/mcp_configurations/klavis_strata_mcp.json

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
{
22
"mcpServers": {
33
"klavis-strata": {
4-
"url": "https://strata.klavis.ai/mcp/",
4+
"url": "https://gmail-mcp-server.klavis.ai/mcp/?instance_id=74ddb651-9204-480e-9fe4-4a90d9f10c69",
55
"authorization": "Bearer ${KLAVIS_AUTH_TOKEN}"
66
}
77
}

tests/pytest/test_pytest_klavis_mcp.py

Lines changed: 8 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -12,14 +12,17 @@
1212
class ResponseFormat(BaseModel):
1313
score: float
1414

15-
'''
15+
16+
"""
1617
You should copy https://painted-tennis-ebc.notion.site/MCPMark-Source-Hub-23181626b6d7805fb3a7d59c63033819
1718
into your Notion for the notion test.
18-
'''
19+
"""
20+
21+
1922
@evaluation_test(
2023
input_dataset=["tests/pytest/datasets/klavis_mcp_test.jsonl"],
2124
rollout_processor=AgentRolloutProcessor(),
22-
completion_params=[{"model": "fireworks_ai/accounts/fireworks/models/kimi-k2-instruct"}],
25+
completion_params=[{"model": "fireworks_ai/accounts/fireworks/models/kimi-k2-thinking"}],
2326
mode="pointwise",
2427
mcp_config_path="tests/pytest/mcp_configurations/klavis_strata_mcp.json",
2528
)
@@ -31,7 +34,7 @@ async def test_pytest_klavis_mcp(row: EvaluationRow) -> EvaluationRow:
3134
api_key=os.environ["FIREWORKS_API_KEY"], base_url="https://api.fireworks.ai/inference/v1"
3235
) as client:
3336
response = await client.chat.completions.create(
34-
model="accounts/fireworks/models/kimi-k2-instruct-0905",
37+
model="accounts/fireworks/models/kimi-k2-thinking",
3538
messages=[
3639
{
3740
"role": "system",
@@ -50,6 +53,7 @@ async def test_pytest_klavis_mcp(row: EvaluationRow) -> EvaluationRow:
5053
response_text = response.choices[0].message.content
5154
logger.info("response_text: %s", response_text)
5255
score = json.loads(response_text or "{}")["score"]
56+
5357
row.evaluation_result = EvaluateResult(
5458
score=score,
5559
reason=response_text,

0 commit comments

Comments
 (0)