@@ -270,7 +270,7 @@ def test_evaluate_with_lambda_agent_wait_for_completion(self, lambda_agent_arn,
270270 assert "pipeline" in execution .arn .lower ()
271271 logger .info (f"Started 3P agent base model evaluation: { execution .arn } " )
272272
273- execution .wait ()
273+ execution .wait (EVALUATION_TIMEOUT_SECONDS )
274274 assert execution .status .overall_status in ("Succeeded" , "Failed" , "Stopped" )
275275 logger .info (f"Execution completed: { execution .status .overall_status } " )
276276
@@ -315,12 +315,15 @@ def test_evaluate_base_model_with_agent_lambda_object(self, lambda_agent_arn, te
315315 assert execution .arn is not None
316316 logger .info (f"Started CustomAgentLambda object evaluation: { execution .arn } " )
317317
318+ execution .wait (EVALUATION_TIMEOUT_SECONDS )
319+ assert execution .status .overall_status == "Succeeded"
320+
318321 def test_evaluate_with_attached_trainer (self , lambda_agent_arn , test_config ):
319322 """Test evaluating a fine-tuned model by attaching to an existing training job."""
320323 from sagemaker .train .multi_turn_rl_trainer import MultiTurnRLTrainer
321324
322325 attached_job = MultiTurnRLTrainer .attach (
323- "openai-reasoning-gpt- oss-20b -mtrl-20260602164546 " , session = boto3 .Session (region_name = _REGION )
326+ "mock- oss-test -mtrl-20260615143910 " , session = boto3 .Session (region_name = _REGION )
324327 )
325328
326329 evaluator = MultiTurnRLEvaluator (
@@ -339,3 +342,6 @@ def test_evaluate_with_attached_trainer(self, lambda_agent_arn, test_config):
339342 assert execution is not None
340343 assert execution .arn is not None
341344 logger .info (f"Started attached trainer evaluation: { execution .arn } " )
345+
346+ execution .wait (EVALUATION_TIMEOUT_SECONDS )
347+ assert execution .status .overall_status == "Succeeded"
0 commit comments