aws
diff --git a/sagemaker-serve/VERSION b/sagemaker-serve/VERSION
Lines changed: 1 addition & 1 deletion
diff --git a/sagemaker-serve/src/sagemaker/serve/__init__.py b/sagemaker-serve/src/sagemaker/serve/__init__.py
Lines changed: 24 additions & 1 deletion
diff --git a/sagemaker-serve/src/sagemaker/serve/ai_inference_recommender/__init__.py b/sagemaker-serve/src/sagemaker/serve/ai_inference_recommender/__init__.py
Lines changed: 47 additions & 0 deletions
diff --git a/sagemaker-serve/src/sagemaker/serve/ai_inference_recommender/_constants.py b/sagemaker-serve/src/sagemaker/serve/ai_inference_recommender/_constants.py
Lines changed: 21 additions & 0 deletions
@@ -1 +1 @@
-1.13.0
+1.13.1
@@ -29,4 +29,27 @@
 from sagemaker.serve.utils.types import ModelServer
 from sagemaker.serve.model_builder import ModelBuilder
 
-__all__ = ["InferenceSpec", "ModelServer", "ModelBuilder"]
+from sagemaker.serve.ai_inference_recommender import (
+    BenchmarkJob,
+    BenchmarkResult,
+    RecommendationJob,
+    Secret,
+    Workload,
+    FeatureGatedError,
+    WorkloadValidationError,
+    start_benchmark,
+)
+
+__all__ = [  # names exported by ``from sagemaker.serve import *``
+    "InferenceSpec",  # first three entries were already exported before this change
+    "ModelServer",
+    "ModelBuilder",
+    "BenchmarkJob",  # remaining entries are re-exported from ai_inference_recommender
+    "BenchmarkResult",
+    "RecommendationJob",
+    "Secret",
+    "Workload",
+    "FeatureGatedError",
+    "WorkloadValidationError",
+    "start_benchmark",
+]  # NOTE(review): BenchmarkMetric/BenchmarkMetrics are exported by the subpackage but not here - confirm intentional
@@ -0,0 +1,47 @@
+# Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License"). You
+# may not use this file except in compliance with the License. A copy of
+# the License is located at
+#
+#     http://aws.amazon.com/apache2.0/
+#
+# or in the "license" file accompanying this file. This file is
+# distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF
+# ANY KIND, either express or implied. See the License for the specific
+# language governing permissions and limitations under the License.
+"""SageMaker GenAI inference benchmarking and recommendation."""
+from __future__ import absolute_import
+
+from sagemaker.serve.ai_inference_recommender.exceptions import (
+    FeatureGatedError,
+    WorkloadValidationError,
+)
+from sagemaker.serve.ai_inference_recommender.jobs import (
+    BenchmarkJob,
+    RecommendationJob,
+)
+from sagemaker.serve.ai_inference_recommender.result import (
+    BenchmarkMetric,
+    BenchmarkMetrics,
+    BenchmarkResult,
+)
+from sagemaker.serve.ai_inference_recommender.secrets import Secret
+from sagemaker.serve.ai_inference_recommender.workload import Workload
+from sagemaker.serve.ai_inference_recommender._model_builder_methods import (
+    start_benchmark,
+)
+
+
+__all__ = [  # public API of this subpackage; every name is imported above
+    "BenchmarkJob",  # entries are kept in ASCII-sorted order (uppercase before lowercase)
+    "BenchmarkMetric",
+    "BenchmarkMetrics",
+    "BenchmarkResult",
+    "FeatureGatedError",
+    "RecommendationJob",
+    "Secret",
+    "Workload",
+    "WorkloadValidationError",
+    "start_benchmark",  # the only lowercase (function-style) name, hence last
+]
@@ -0,0 +1,21 @@
+# Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License"). You
+# may not use this file except in compliance with the License. A copy of
+# the License is located at
+#
+#     http://aws.amazon.com/apache2.0/
+#
+# or in the "license" file accompanying this file. This file is
+# distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF
+# ANY KIND, either express or implied. See the License for the specific
+# language governing permissions and limitations under the License.
+"""Constants for the AI inference recommender module."""
+from __future__ import absolute_import
+
+MAX_INSTANCE_TYPES = 3  # NOTE(review): presumably an upper bound on instance types per request; usage not visible here - confirm
+
+FEATURE_GATING_RUNBOOK_URL = (  # adjacent string literals below are concatenated into a single URL
+    "https://docs.aws.amazon.com/sagemaker/latest/dg/"
+    "generative-ai-inference-recommendations.html"
+)