Skip to content

Commit c68c154

Browse files
committed
Fix pre-commit failures
1 parent c80da64 commit c68c154

14 files changed

Lines changed: 43 additions & 25 deletions

File tree

ajet/backbone/verl/core_algos.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -187,7 +187,6 @@ def update(self, current_kl, n_steps):
187187
current_kl (float): Current KL divergence value (unused).
188188
n_steps (int): Number of steps taken (unused).
189189
"""
190-
pass
191190

192191

193192
def get_kl_controller(kl_ctrl):

ajet/context_tracker/multiagent_tracking.py

Lines changed: 5 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@
22
import copy
33
import json
44
from dataclasses import dataclass, field
5-
from typing import List, Tuple
5+
from typing import List, Tuple, cast
66

77
from beast_logger import NestedJsonItem, SeqItem, print_dict, print_nested
88
from loguru import logger
@@ -173,12 +173,14 @@ def step_spawn_timeline(self, messages: List[dict], tools: List = [], disable_to
173173

174174
any_later_msg_has_user_role = any((m["role"] == "user") for m in messages[i+1:])
175175

176+
msg_content = cast(str, msg["content"])
177+
176178
# extract content block from OpenAI-compatible messages and convert to ExtendedMessage
177179
timeline += [
178180
ExtendedMessage(
179181
author=author,
180182
role=msg["role"],
181-
content=msg["content"],
183+
content=msg_content,
182184
tokenizer=self.tokenizer,
183185
tools=tools,
184186
tool_calls=(msg["tool_calls"] if "tool_calls" in msg else []),
@@ -189,7 +191,7 @@ def step_spawn_timeline(self, messages: List[dict], tools: List = [], disable_to
189191
before_last_query=any_later_msg_has_user_role
190192
)
191193
]
192-
if ("<think>" in msg["content"]) and (not previous_message_encounter_user_role):
194+
if ("<think>" in msg_content) and (not previous_message_encounter_user_role):
193195
logger.warning(f"Warning! Message content contains <think> tag, but no prior message has `user` role! This is not a common scenario. Please check your agent loop carefully.")
194196

195197
return timeline

ajet/copilot/create-keep-think-model-chat-template/SKILL.md

Lines changed: 0 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -12,5 +12,3 @@ You must not do this in-place, instead, please create another model.
1212
E.g., "/mnt/data_cpfs/xielipeng.xlp/models/Qwen3-8B" -> "/mnt/data_cpfs/xielipeng.xlp/models/Qwen3-8B-Keep-History"
1313
For all files within the original model path, please create symbolic links instead of copying files.
1414
The only exception is the tokenizer config file, which should be copied (not linked) and modified to change the chat template.
15-
16-

ajet/tokenizer/service.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -20,7 +20,7 @@
2020
import time
2121
from collections import OrderedDict
2222
from concurrent.futures import Future, ThreadPoolExecutor
23-
from typing import Any, Optional
23+
from typing import Optional
2424

2525
import msgpack
2626
import zmq

ajet/tuner_lib/experimental/swarm_server.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@
1414
from ajet.utils.process_killer import kill_process_tree
1515
from ajet.utils.sync_train_code import extract_ajet_zip
1616
from ajet.tuner_lib.experimental.swarm_overwatch_utils import CurrentBatchRolloutPoolInformation
17-
from ajet.tuner_lib.experimental.interchange_utils import DEBUG, VERBOSE, CLIENT_ACTIVE_TIMEOUT
17+
from ajet.tuner_lib.experimental.interchange_utils import DEBUG, VERBOSE
1818
from ajet.tuner_lib.experimental.interchange_utils import (
1919
SyncTrainConfigRequest,
2020
ClaimEpisodeRequest,

ajet/utils/advantage.py

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,15 @@
1+
from __future__ import annotations
2+
3+
from collections import defaultdict
4+
from typing import TYPE_CHECKING, Optional
5+
6+
import numpy as np
7+
import torch
8+
9+
if TYPE_CHECKING:
10+
from verl.trainer.config import AlgoConfig
11+
12+
113
def compute_grpo_outcome_advantage(
214
token_level_rewards: torch.Tensor,
315
response_mask: torch.Tensor,

tutorial/example_appworld_swarm/agent_roll_timeline_study_text_level_tl.py

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -12,11 +12,8 @@
1212
"""
1313

1414
import os
15-
import statistics
16-
from concurrent.futures import ThreadPoolExecutor, as_completed
1715
from typing import Generator, List
1816

19-
from tqdm import tqdm
2017

2118
from ajet.copilot.job import AgentJetJob
2219
from ajet.schema.task import Task

tutorial/example_appworld_swarm/agent_roll_timeline_study_token_level_tl.py

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -12,11 +12,8 @@
1212
"""
1313

1414
import os
15-
import statistics
16-
from concurrent.futures import ThreadPoolExecutor, as_completed
1715
from typing import Generator, List
1816

19-
from tqdm import tqdm
2017

2118
from ajet.copilot.job import AgentJetJob
2219
from ajet.schema.task import Task

tutorial/example_appworld_swarm/agent_roll_timeline_study_token_level_tl_qwen3_original.py

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -12,11 +12,8 @@
1212
"""
1313

1414
import os
15-
import statistics
16-
from concurrent.futures import ThreadPoolExecutor, as_completed
1715
from typing import Generator, List
1816

19-
from tqdm import tqdm
2017

2118
from ajet.copilot.job import AgentJetJob
2219
from ajet.schema.task import Task

tutorial/example_cocktail_rl_v2/train_aime_as_swarm_client_1.py

Lines changed: 8 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -27,6 +27,12 @@
2727
_THIS_DIR = os.path.dirname(__file__)
2828

2929

30+
def _scalar_reward(reward: float | list[float] | None) -> float:
31+
if not isinstance(reward, (int, float)):
32+
raise TypeError(f"Expected scalar reward, got {type(reward).__name__}: {reward!r}")
33+
return float(reward)
34+
35+
3036
@dataclass
3137
class _AimeAgentConfig:
3238
"""Duck-types the subset of AgentJetJob that execute_agent reads."""
@@ -113,7 +119,7 @@ def rollout(self, task: Task) -> float:
113119
)
114120
out = _execute_aime_agent(task, api_baseurl_key, self.agent_config)
115121
self.swarm_worker.end_episode(task, episode_uuid, out)
116-
return out.reward
122+
return _scalar_reward(out.reward)
117123

118124
def eval_rollout(self, task: Task) -> float:
119125
assert self.swarm_worker is not None
@@ -122,7 +128,7 @@ def eval_rollout(self, task: Task) -> float:
122128
)
123129
try:
124130
out = _execute_aime_agent(task, api_baseurl_key, self.agent_config)
125-
return out.reward
131+
return _scalar_reward(out.reward)
126132
finally:
127133
self.swarm_worker.abort_episode(episode_uuid)
128134

0 commit comments

Comments
 (0)