Skip to content

Commit adef22f

Browse files
author
Syed Jafri
committed
fix: unskip sft rlaif rlvr integ tests
1 parent 4cd4a58 commit adef22f

4 files changed

Lines changed: 27 additions & 32 deletions

File tree

sagemaker-train/tests/integ/train/conftest.py

Lines changed: 10 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -38,3 +38,13 @@ def sagemaker_session():
3838

3939
if region_manual_set and "AWS_DEFAULT_REGION" in os.environ:
4040
del os.environ["AWS_DEFAULT_REGION"]
41+
42+
43+
NOVA_REGION = "us-east-1"
44+
45+
46+
@pytest.fixture(scope="module")
47+
def sagemaker_session_us_east_1():
48+
"""Create a SageMaker session in us-east-1 for Nova model tests."""
49+
boto_session = boto3.Session(region_name=NOVA_REGION)
50+
return Session(boto_session=boto_session)

sagemaker-train/tests/integ/train/test_rlaif_trainer_integration.py

Lines changed: 3 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -21,7 +21,6 @@
2121
import pytest
2222

2323

24-
@pytest.mark.skip(reason="Skipping GPU resource intensive test")
2524
def test_rlaif_trainer_lora_complete_workflow(sagemaker_session):
2625
"""Test complete RLAIF training workflow with LORA."""
2726

@@ -33,7 +32,7 @@ def test_rlaif_trainer_lora_complete_workflow(sagemaker_session):
3332
reward_prompt='Builtin.Summarize',
3433
mlflow_experiment_name="test-rlaif-finetuned-models-exp",
3534
mlflow_run_name="test-rlaif-finetuned-models-run",
36-
training_dataset="arn:aws:sagemaker:us-west-2:729646638167:hub-content/sdktest/DataSet/rlvr-rlaif-oss-test-data/0.0.1",
35+
training_dataset="s3://mc-flows-sdk-testing/input_data/rlvr-rlaif-test-data/train_285.jsonl",
3736
s3_output_path="s3://mc-flows-sdk-testing/output/",
3837
accept_eula=True
3938
)
@@ -61,7 +60,6 @@ def test_rlaif_trainer_lora_complete_workflow(sagemaker_session):
6160
assert training_job.output_model_package_arn is not None
6261

6362

64-
@pytest.mark.skip(reason="Skipping GPU resource intensive test")
6563
def test_rlaif_trainer_with_custom_reward_settings(sagemaker_session):
6664
"""Test RLAIF trainer with different reward model and prompt."""
6765

@@ -73,7 +71,7 @@ def test_rlaif_trainer_with_custom_reward_settings(sagemaker_session):
7371
reward_prompt="arn:aws:sagemaker:us-west-2:729646638167:hub-content/sdktest/JsonDoc/rlaif-test-prompt/0.0.1",
7472
mlflow_experiment_name="test-rlaif-finetuned-models-exp",
7573
mlflow_run_name="test-rlaif-finetuned-models-run",
76-
training_dataset="arn:aws:sagemaker:us-west-2:729646638167:hub-content/sdktest/DataSet/rlvr-rlaif-oss-test-data/0.0.1",
74+
training_dataset="s3://mc-flows-sdk-testing/input_data/rlvr-rlaif-test-data/train_285.jsonl",
7775
s3_output_path="s3://mc-flows-sdk-testing/output/",
7876
accept_eula=True
7977
)
@@ -100,7 +98,6 @@ def test_rlaif_trainer_with_custom_reward_settings(sagemaker_session):
10098
assert training_job.output_model_package_arn is not None
10199

102100

103-
@pytest.mark.skip(reason="Skipping GPU resource intensive test")
104101
def test_rlaif_trainer_continued_finetuning(sagemaker_session):
105102
"""Test RLAIF trainer continued fine-tuning workflow."""
106103

@@ -112,7 +109,7 @@ def test_rlaif_trainer_continued_finetuning(sagemaker_session):
112109
reward_prompt='Builtin.Summarize',
113110
mlflow_experiment_name="test-rlaif-finetuned-models-exp",
114111
mlflow_run_name="test-rlaif-finetuned-models-run",
115-
training_dataset="arn:aws:sagemaker:us-west-2:729646638167:hub-content/sdktest/DataSet/rlvr-rlaif-oss-test-data/0.0.1",
112+
training_dataset="s3://mc-flows-sdk-testing/input_data/rlvr-rlaif-test-data/train_285.jsonl",
116113
s3_output_path="s3://mc-flows-sdk-testing/output/",
117114
accept_eula=True
118115
)

sagemaker-train/tests/integ/train/test_rlvr_trainer_integration.py

Lines changed: 6 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,6 @@
1313
"""Integration tests for RLVR trainer"""
1414
from __future__ import absolute_import
1515

16-
import os
1716
import time
1817
import pytest
1918
import boto3
@@ -22,7 +21,6 @@
2221
from sagemaker.train.common import TrainingType
2322

2423

25-
@pytest.mark.skip(reason="Skipping GPU resource intensive test")
2624
def test_rlvr_trainer_lora_complete_workflow(sagemaker_session):
2725
"""Test complete RLVR training workflow with LORA."""
2826

@@ -32,7 +30,7 @@ def test_rlvr_trainer_lora_complete_workflow(sagemaker_session):
3230
model_package_group="sdk-test-finetuned-models",
3331
mlflow_experiment_name="test-rlvr-finetuned-models-exp",
3432
mlflow_run_name="test-rlvr-finetuned-models-run",
35-
training_dataset="arn:aws:sagemaker:us-west-2:729646638167:hub-content/sdktest/DataSet/rlvr-rlaif-oss-test-data/0.0.1",
33+
training_dataset="s3://mc-flows-sdk-testing/input_data/rlvr-rlaif-test-data/train_285.jsonl",
3634
s3_output_path="s3://mc-flows-sdk-testing/output/",
3735
accept_eula=True
3836
)
@@ -60,7 +58,6 @@ def test_rlvr_trainer_lora_complete_workflow(sagemaker_session):
6058
assert training_job.output_model_package_arn is not None
6159

6260

63-
@pytest.mark.skip(reason="Skipping GPU resource intensive test")
6461
def test_rlvr_trainer_with_custom_reward_function(sagemaker_session):
6562
"""Test RLVR trainer with custom reward function."""
6663

@@ -70,7 +67,7 @@ def test_rlvr_trainer_with_custom_reward_function(sagemaker_session):
7067
model_package_group="sdk-test-finetuned-models",
7168
mlflow_experiment_name="test-rlvr-finetuned-models-exp",
7269
mlflow_run_name="test-rlvr-finetuned-models-run",
73-
training_dataset="arn:aws:sagemaker:us-west-2:729646638167:hub-content/sdktest/DataSet/rlvr-rlaif-oss-test-data/0.0.1",
70+
training_dataset="s3://mc-flows-sdk-testing/input_data/rlvr-rlaif-test-data/train_285.jsonl",
7471
s3_output_path="s3://mc-flows-sdk-testing/output/",
7572
custom_reward_function="arn:aws:sagemaker:us-west-2:729646638167:hub-content/sdktest/JsonDoc/rlvr-test-rf/0.0.1",
7673
accept_eula=True
@@ -98,14 +95,10 @@ def test_rlvr_trainer_with_custom_reward_function(sagemaker_session):
9895
assert training_job.output_model_package_arn is not None
9996

10097

101-
# @pytest.mark.skipif(os.environ.get('AWS_DEFAULT_REGION') != 'us-east-1', reason="Nova models only available in us-east-1")
102-
@pytest.mark.skip(reason="Skipping GPU resource intensive test")
103-
def test_rlvr_trainer_nova_workflow(sagemaker_session):
98+
def test_rlvr_trainer_nova_workflow(sagemaker_session_us_east_1):
10499
"""Test RLVR training workflow with Nova model."""
105-
import os
106-
os.environ['SAGEMAKER_REGION'] = 'us-east-1'
100+
# sagemaker_session_us_east_1 fixture is defined in conftest.py (us-east-1 region)
107101

108-
# For fine-tuning
109102
rlvr_trainer = RLVRTrainer(
110103
model="nova-textgeneration-lite-v2",
111104
model_package_group="sdk-test-finetuned-models",
@@ -115,7 +108,8 @@ def test_rlvr_trainer_nova_workflow(sagemaker_session):
115108
validation_dataset="s3://mc-flows-sdk-testing-us-east-1/input_data/rlvr-nova/grpo-64-sample.jsonl",
116109
s3_output_path="s3://mc-flows-sdk-testing-us-east-1/output/",
117110
custom_reward_function="arn:aws:sagemaker:us-east-1:729646638167:hub-content/sdktest/JsonDoc/rlvr-nova-test-rf/0.0.1",
118-
accept_eula=True
111+
accept_eula=True,
112+
sagemaker_session=sagemaker_session_us_east_1
119113
)
120114
rlvr_trainer.hyperparameters.data_s3_path = 's3://example-bucket'
121115

sagemaker-train/tests/integ/train/test_sft_trainer_integration.py

Lines changed: 8 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,6 @@
1313
"""Integration tests for SFT trainer"""
1414
from __future__ import absolute_import
1515

16-
import os
1716
import time
1817
import pytest
1918
import boto3
@@ -22,15 +21,14 @@
2221
from sagemaker.train.common import TrainingType
2322

2423

25-
@pytest.mark.skip(reason="Skipping GPU resource intensive test")
2624
def test_sft_trainer_lora_complete_workflow(sagemaker_session):
2725
"""Test complete SFT training workflow with LORA."""
2826

2927
sft_trainer = SFTTrainer(
3028
model="meta-textgeneration-llama-3-2-1b-instruct",
3129
training_type=TrainingType.LORA,
3230
model_package_group="arn:aws:sagemaker:us-west-2:729646638167:model-package-group/sdk-test-finetuned-models",
33-
training_dataset="arn:aws:sagemaker:us-west-2:729646638167:hub-content/sdktest/DataSet/sft-oss-test-data/0.0.1",
31+
training_dataset="s3://mc-flows-sdk-testing/input_data/sft/sample_data_256_final.jsonl",
3432
s3_output_path="s3://mc-flows-sdk-testing/output/",
3533
accept_eula=True
3634
)
@@ -58,16 +56,15 @@ def test_sft_trainer_lora_complete_workflow(sagemaker_session):
5856
assert training_job.output_model_package_arn is not None
5957

6058

61-
@pytest.mark.skip(reason="Skipping GPU resource intensive test")
6259
def test_sft_trainer_with_validation_dataset(sagemaker_session):
6360
"""Test SFT trainer with both training and validation datasets."""
6461

6562
sft_trainer = SFTTrainer(
6663
model="meta-textgeneration-llama-3-2-1b-instruct",
6764
training_type=TrainingType.LORA,
6865
model_package_group="arn:aws:sagemaker:us-west-2:729646638167:model-package-group/sdk-test-finetuned-models",
69-
training_dataset="arn:aws:sagemaker:us-west-2:729646638167:hub-content/sdktest/DataSet/sft-oss-test-data/0.0.1",
70-
validation_dataset="arn:aws:sagemaker:us-west-2:729646638167:hub-content/sdktest/DataSet/sft-oss-test-data/0.0.1",
66+
training_dataset="s3://mc-flows-sdk-testing/input_data/sft/sample_data_256_final.jsonl",
67+
validation_dataset="s3://mc-flows-sdk-testing/input_data/sft/sample_data_256_final.jsonl",
7168
accept_eula=True
7269
)
7370

@@ -92,22 +89,19 @@ def test_sft_trainer_with_validation_dataset(sagemaker_session):
9289
assert hasattr(training_job, 'output_model_package_arn')
9390

9491

95-
# @pytest.mark.skipif(os.environ.get('AWS_DEFAULT_REGION') != 'us-east-1', reason="Nova models only available in us-east-1")
96-
@pytest.mark.skip(reason="Skipping GPU resource intensive test")
97-
def test_sft_trainer_nova_workflow(sagemaker_session):
92+
def test_sft_trainer_nova_workflow(sagemaker_session_us_east_1):
9893
"""Test SFT trainer with Nova model."""
99-
import os
100-
os.environ['SAGEMAKER_REGION'] = 'us-east-1'
94+
# sagemaker_session_us_east_1 fixture is defined in conftest.py (us-east-1 region)
10195

102-
# For fine-tuning
10396
sft_trainer_nova = SFTTrainer(
10497
model="nova-textgeneration-lite-v2",
10598
training_type=TrainingType.LORA,
10699
model_package_group="sdk-test-finetuned-models",
107100
mlflow_experiment_name="test-nova-finetuned-models-exp",
108101
mlflow_run_name="test-nova-finetuned-models-run",
109-
training_dataset="arn:aws:sagemaker:us-east-1:729646638167:hub-content/sdktest/DataSet/sft-nova-test-dataset/0.0.1",
110-
s3_output_path="s3://mc-flows-sdk-testing-us-east-1/output/"
102+
training_dataset="s3://mc-flows-sdk-testing-us-east-1/input_data/sft-nova/sft_8_samples.jsonl",
103+
s3_output_path="s3://mc-flows-sdk-testing-us-east-1/output/",
104+
sagemaker_session=sagemaker_session_us_east_1
111105
)
112106

113107
# Create training job

0 commit comments

Comments
 (0)