|
| 1 | +Resolved template parameters: {'role_arn': base_evaluator.py:757 |
| 2 | + 'arn:aws:iam::634683118556:role/service-role/AmazonSageMaker-Exe |
| 3 | + cutionRole-20251116T174807', 'mlflow_resource_arn': |
| 4 | + 'arn:aws:sagemaker:us-east-1:634683118556:mlflow-app/app-DA25Q2S |
| 5 | + 35KHZ', 'mlflow_experiment_name': None, 'mlflow_run_name': None, |
| 6 | + 'model_package_group_arn': |
| 7 | + 'arn:aws:sagemaker:us-east-1:634683118556:model-package-group/tm |
| 8 | + p-humanlike-llama32-rlaif', 'source_model_package_arn': None, |
| 9 | + 'base_model_arn': |
| 10 | + 'arn:aws:sagemaker:us-east-1:aws:hub-content/SageMakerPublicHub/ |
| 11 | + Model/meta-textgeneration-llama-3-2-1b-instruct/1.25.0', |
| 12 | + 's3_output_path': |
| 13 | + 's3://sagemaker-us-east-1-634683118556/tmp-humanlike-llama32-rla |
| 14 | + if/eval', 'dataset_artifact_arn': |
| 15 | + 'arn:aws:sagemaker:us-east-1:634683118556:artifact/c3c6611071894 |
| 16 | + bad6a7f0925a729b02e', 'action_arn_prefix': |
| 17 | + 'arn:aws:sagemaker:us-east-1:634683118556:action', |
| 18 | + 'dataset_uri': |
| 19 | + 'arn:aws:sagemaker:us-east-1:634683118556:hub-content/CKO4ACGI3U |
| 20 | + RQBOO74C9JPLUMQNG02M2I4CIM9M931SQHE0625A30/DataSet/tmp-humanlike |
| 21 | + -rlaif-eval/0.0.1', 'judge_model_id': |
| 22 | + 'anthropic.claude-3-5-sonnet-20240620-v1:0', 'llmaj_metrics': |
| 23 | + '[]', 'custom_metrics_s3_path': |
| 24 | + 's3://sagemaker-us-east-1-634683118556/tmp-humanlike-llama32-rla |
| 25 | + if/eval/evaluationinputs/eval-meta-1517aa3320251202-011237/custo |
| 26 | + m-metrics.json', 'max_new_tokens': '8192', 'temperature': '0', |
| 27 | + 'top_k': '-1', 'top_p': '1.0', 'pipeline_name': |
| 28 | + 'SagemakerModelEvaluationType2-llmaj', 'evaluate_base_model': |
| 29 | + True} |
| 30 | + INFO Rendered pipeline definition: base_evaluator.py:766 |
| 31 | + { |
| 32 | + "Version": "2020-12-01", |
| 33 | + "Metadata": {}, |
| 34 | + "MlflowConfig": { |
| 35 | + "MlflowResourceArn": |
| 36 | + "arn:aws:sagemaker:us-east-1:634683118556:mlflow-app/app-DA25Q2S |
| 37 | + 35KHZ" |
| 38 | + }, |
| 39 | + "Parameters": [], |
| 40 | + "Steps": [ |
| 41 | + { |
| 42 | + "Name": "EvaluateBaseInferenceModel", |
| 43 | + "Type": "Training", |
| 44 | + "Arguments": { |
| 45 | + "TrainingJobName": "BaseInference", |
| 46 | + "RoleArn": |
| 47 | + "arn:aws:iam::634683118556:role/service-role/AmazonSageMaker-Exe |
| 48 | + cutionRole-20251116T174807", |
| 49 | + "ServerlessJobConfig": { |
| 50 | + "BaseModelArn": |
| 51 | + "arn:aws:sagemaker:us-east-1:aws:hub-content/SageMakerPublicHub/ |
| 52 | + Model/meta-textgeneration-llama-3-2-1b-instruct/1.25.0", |
| 53 | + "AcceptEula": true, |
| 54 | + "JobType": "Evaluation", |
| 55 | + "EvaluationType": "BenchmarkEvaluation" |
| 56 | + }, |
| 57 | + "StoppingCondition": { |
| 58 | + "MaxRuntimeInSeconds": 86400 |
| 59 | + }, |
| 60 | + "HyperParameters": { |
| 61 | + "name": "BaseInference", |
| 62 | + "task": "inference_only" |
| 63 | + }, |
| 64 | + "OutputDataConfig": { |
| 65 | + "S3OutputPath": |
| 66 | + "s3://sagemaker-us-east-1-634683118556/tmp-humanlike-llama32-rla |
| 67 | + if/eval", |
| 68 | + "CompressionType": "NONE" |
| 69 | + }, |
| 70 | + "InputDataConfig": [ |
| 71 | + { |
| 72 | + "ChannelName": "train", |
| 73 | + "DataSource": { |
| 74 | + "DatasetSource": { |
| 75 | + "DatasetArn": |
| 76 | + "arn:aws:sagemaker:us-east-1:634683118556:hub-content/CKO4ACGI3U |
| 77 | + RQBOO74C9JPLUMQNG02M2I4CIM9M931SQHE0625A30/DataSet/tmp-humanlike |
| 78 | + -rlaif-eval/0.0.1" |
| 79 | + } |
| 80 | + } |
| 81 | + } |
| 82 | + ] |
| 83 | + } |
| 84 | + }, |
| 85 | + { |
| 86 | + "Name": "EvaluateBaseModelMetrics", |
| 87 | + "Type": "Training", |
| 88 | + "DependsOn": [ |
| 89 | + "EvaluateBaseInferenceModel" |
| 90 | + ], |
| 91 | + "Arguments": { |
| 92 | + "TrainingJobName": { |
| 93 | + "Std:Join": { |
| 94 | + "On": "-", |
| 95 | + "Values": [ |
| 96 | + "base-llmaj-eval", |
| 97 | + { |
| 98 | + "Get": "Execution.PipelineExecutionId" |
| 99 | + } |
| 100 | + ] |
| 101 | + } |
| 102 | + }, |
| 103 | + "RoleArn": |
| 104 | + "arn:aws:iam::634683118556:role/service-role/AmazonSageMaker-Exe |
| 105 | + cutionRole-20251116T174807", |
| 106 | + "ServerlessJobConfig": { |
| 107 | + "BaseModelArn": |
| 108 | + "arn:aws:sagemaker:us-east-1:aws:hub-content/SageMakerPublicHub/ |
| 109 | + Model/meta-textgeneration-llama-3-2-1b-instruct/1.25.0", |
| 110 | + "AcceptEula": true, |
| 111 | + "JobType": "Evaluation", |
| 112 | + "EvaluationType": "LLMAJEvaluation" |
| 113 | + }, |
| 114 | + "StoppingCondition": { |
| 115 | + "MaxRuntimeInSeconds": 86400 |
| 116 | + }, |
| 117 | + "HyperParameters": { |
| 118 | + "name": { |
| 119 | + "Std:Join": { |
| 120 | + "On": "-", |
| 121 | + "Values": [ |
| 122 | + "base-llmaj-eval", |
| 123 | + { |
| 124 | + "Get": "Execution.PipelineExecutionId" |
| 125 | + } |
| 126 | + ] |
| 127 | + } |
| 128 | + }, |
| 129 | + "judge_model_id": |
| 130 | + "anthropic.claude-3-5-sonnet-20240620-v1:0", |
| 131 | + "inference_data_s3_path": { |
| 132 | + "Std:Join": { |
| 133 | + "On": "", |
| 134 | + "Values": [ |
| 135 | + { |
| 136 | + "Get": |
| 137 | + "Steps.EvaluateBaseInferenceModel.OutputDataConfig.S3OutputPath" |
| 138 | + }, |
| 139 | + "/", |
| 140 | + { |
| 141 | + "Get": |
| 142 | + "Steps.EvaluateBaseInferenceModel.TrainingJobName" |
| 143 | + }, |
| 144 | + "/output/output/", |
| 145 | + "BaseInference", |
| 146 | + "/eval_results/inference_output.jsonl" |
| 147 | + ] |
| 148 | + } |
| 149 | + }, |
| 150 | + "output_path": |
| 151 | + "s3://sagemaker-us-east-1-634683118556/tmp-humanlike-llama32-rla |
| 152 | + if/eval", |
| 153 | + "llmaj_metrics": "[]", |
| 154 | + "custom_metrics_s3_path": |
| 155 | + "s3://sagemaker-us-east-1-634683118556/tmp-humanlike-llama32-rla |
| 156 | + if/eval/evaluationinputs/eval-meta-1517aa3320251202-011237/custo |
| 157 | + m-metrics.json", |
| 158 | + "max_new_tokens": "8192", |
| 159 | + "temperature": "0", |
| 160 | + "top_k": "-1", |
| 161 | + "top_p": "1.0" |
| 162 | + }, |
| 163 | + "OutputDataConfig": { |
| 164 | + "S3OutputPath": |
| 165 | + "s3://sagemaker-us-east-1-634683118556/tmp-humanlike-llama32-rla |
| 166 | + if/eval", |
| 167 | + "CompressionType": "NONE" |
| 168 | + } |
| 169 | + } |
| 170 | + } |
| 171 | + ] |
| 172 | + } |
0 commit comments