Skip to content

Commit 98db2b7

Browse files
committed
delete exit message
1 parent 5132c2b commit 98db2b7

File tree

3 files changed

+6
-5
lines changed

3 files changed

+6
-5
lines changed

ajet/backbone/trainer_verl.py

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -596,8 +596,9 @@ def fit(self): # noqa: C901
596596
context_tracker_arr: List[BaseContextTracker] = self.parallel_env.rollout(
597597
tasks, mode="sample", epoch=f"train.{epoch}"
598598
)
599-
from ajet import bp
600-
bp("BATCH")
599+
600+
# from ajet import bp; bp("BATCH")
601+
601602
logger.info("end fit rollout")
602603
gen_batch_output = self.parallel_env.to_dataproto(context_tracker_arr)
603604
logger.info("end dataproto convertion")

ajet/task_rollout/single_worker.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -128,7 +128,7 @@ def rollout_env_worker(
128128
workflow_task=workflow_task,
129129
)
130130
except SwarmReceiveAbortException as exc: # noqa: BLE001
131-
print('SwarmReceiveAbortException caught in rollout_env_worker')
131+
# print('SwarmReceiveAbortException caught in rollout_env_worker')
132132
return None # type: ignore
133133
except TestSuccessException as e:
134134
logger.success(

ajet/task_runner/swarm_runner.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -75,7 +75,7 @@ def register_episode_and_wait_output(
7575
message = zmq_socket.recv_string()
7676
except zmq.Again as e:
7777
if should_exit_hard():
78-
logger.warning(f'{episode_uuid} Exiting workflow due to should_exit_hard signal.')
78+
# logger.warning(f'{episode_uuid} Exiting workflow due to should_exit_hard signal.')
7979
context_tracker.reset()
8080
raise SwarmReceiveAbortException(f"Episode {episode_uuid} aborted due to system exit.")
8181
else:
@@ -127,7 +127,7 @@ def execute(self, workflow_task: WorkflowTask) -> BaseContextTracker:
127127
should_exit_hard = hooks['should_interrupt_hard_fn']
128128

129129
if should_exit_soft() or should_exit_hard():
130-
print(f'Exiting workflow worker due to interrupt signal for episode {workflow_task.episode_uuid}.')
130+
# print(f'Exiting workflow worker due to interrupt signal for episode {workflow_task.episode_uuid}.')
131131
raise SwarmReceiveAbortException(f"Episode {workflow_task.episode_uuid} aborted due to interrupt signal.")
132132

133133
# context tracker will trace and gather everything we need for training

0 commit comments

Comments
 (0)