UiPath
diff --git a/‎.gitignore‎
Lines changed: 5 additions & 0 deletions b/‎.gitignore‎
Lines changed: 5 additions & 0 deletions
diff --git a/‎pyproject.toml‎
Lines changed: 15 additions & 1 deletion b/‎pyproject.toml‎
Lines changed: 15 additions & 1 deletion
diff --git a/‎src/uipath_llamaindex/llms/__init__.py‎
Lines changed: 6 additions & 2 deletions b/‎src/uipath_llamaindex/llms/__init__.py‎
Lines changed: 6 additions & 2 deletions
diff --git a/‎src/uipath_llamaindex/llms/_openai.py‎
Lines changed: 2 additions & 13 deletions b/‎src/uipath_llamaindex/llms/_openai.py‎
Lines changed: 2 additions & 13 deletions
diff --git a/‎src/uipath_llamaindex/llms/bedrock.py‎
Lines changed: 272 additions & 0 deletions b/‎src/uipath_llamaindex/llms/bedrock.py‎
Lines changed: 272 additions & 0 deletions
diff --git a/‎src/uipath_llamaindex/llms/supported_models.py‎
Lines changed: 33 additions & 0 deletions b/‎src/uipath_llamaindex/llms/supported_models.py‎
Lines changed: 33 additions & 0 deletions
@@ -177,3 +177,8 @@ cython_debug/
 **/.uipath
 **/**.nupkg
 **/__uipath/
+.claude/settings.local.json
+
+/.vscode/launch.json
+
+playground.py
@@ -1,6 +1,6 @@
 [project]
 name = "uipath-llamaindex"
-version = "0.1.5"
+version = "0.1.6"
 description = "UiPath LlamaIndex SDK"
 readme = { file = "README.md", content-type = "text/markdown" }
 requires-python = ">=3.11"
@@ -24,6 +24,18 @@ maintainers = [
     { name = "Cristian Pufu", email = "cristian.pufu@uipath.com" }
 ]
 
+[project.optional-dependencies]
+bedrock = [
+    "llama-index-llms-bedrock>=0.3.0",
+    "llama-index-llms-bedrock-converse>=0.3.0",
+    "boto3>=1.28.0",
+    "aiobotocore>=2.5.0",
+]
+vertex = [
+    "llama-index-llms-google-genai>=0.8.0",
+    "google-genai>=1.0.0",
+]
+
 [project.entry-points."uipath.middlewares"]
 register = "uipath_llamaindex.middlewares:register_middleware"
 
@@ -58,6 +70,8 @@ select = ["E", "F", "B", "I"]
 
 [tool.ruff.lint.per-file-ignores]
 "*" = ["E501"]
+"src/uipath_llamaindex/llms/bedrock.py" = ["E402"]
+"src/uipath_llamaindex/llms/vertex.py" = ["E402"]
 
 [tool.ruff.format]
 quote-style = "double"
 
@@ -1,9 +1,13 @@
-from ._openai import (
+from ._openai import UiPathOpenAI
+from .supported_models import (
+    BedrockModel,
+    GeminiModel,
     OpenAIModel,
-    UiPathOpenAI,
 )
 
 __all__ = [
     "UiPathOpenAI",
     "OpenAIModel",
+    "GeminiModel",
+    "BedrockModel",
 ]
@@ -1,21 +1,10 @@
 import os
-from enum import Enum
 from typing import Any
 
 from llama_index.llms.azure_openai import AzureOpenAI  # type: ignore
 from uipath.utils import EndpointManager
 
-
-class OpenAIModel(Enum):
-    GPT_4_1_2025_04_14 = "gpt-4.1-2025-04-14"
-    GPT_4_1_MINI_2025_04_14 = "gpt-4.1-mini-2025-04-14"
-    GPT_4_1_NANO_2025_04_14 = "gpt-4.1-nano-2025-04-14"
-    GPT_4O_2024_05_13 = "gpt-4o-2024-05-13"
-    GPT_4O_2024_08_06 = "gpt-4o-2024-08-06"
-    GPT_4O_2024_11_20 = "gpt-4o-2024-11-20"
-    GPT_4O_MINI_2024_07_18 = "gpt-4o-mini-2024-07-18"
-    O3_MINI_2025_01_31 = "o3-mini-2025-01-31"
-    TEXT_DAVINCI_003 = "text-davinci-003"
+from .supported_models import OpenAIModel
 
 
 class UiPathOpenAI(AzureOpenAI):
@@ -42,7 +31,7 @@ def __init__(
         defaults = {
             "model": model_value,
             "deployment_name": model_value,
-            "azure_endpoint": f"{base_url}/{EndpointManager.get_passthrough_endpoint().format(model=model, api_version=api_version)}",
+            "azure_endpoint": f"{base_url}/{EndpointManager.get_passthrough_endpoint().format(model=model_value, api_version=api_version)}",
             "api_key": os.environ.get("UIPATH_ACCESS_TOKEN"),
             "api_version": api_version,
             "is_chat_model": True,
 
@@ -0,0 +1,272 @@
+import logging
+import os
+from typing import Any, Optional, Sequence
+
+from uipath.utils import EndpointManager
+
+from .supported_models import BedrockModel
+
+logger = logging.getLogger(__name__)
+
+
+def _check_bedrock_dependencies() -> None:
+    """Verify that the optional packages backing the UiPath Bedrock LLMs are importable.
+
+    Raises:
+        ImportError: If one or more required packages cannot be located. The
+            message names every missing package and shows the pip / uv
+            commands that install the ``bedrock`` extra.
+    """
+    import importlib.util
+
+    # (importable module name, package name reported to the user)
+    required_modules = (
+        ("llama_index.llms.bedrock", "llama-index-llms-bedrock"),
+        ("llama_index.llms.bedrock_converse", "llama-index-llms-bedrock-converse"),
+        ("boto3", "boto3"),
+        ("aiobotocore", "aiobotocore"),
+    )
+
+    missing_packages = []
+    for module_name, package_name in required_modules:
+        try:
+            available = importlib.util.find_spec(module_name) is not None
+        except ModuleNotFoundError:
+            # For a dotted name find_spec imports the parent package first and
+            # raises when that parent is absent. Treat that as "missing" so the
+            # caller still receives the install instructions below.
+            available = False
+        if not available:
+            missing_packages.append(package_name)
+
+    if missing_packages:
+        packages_str = ", ".join(missing_packages)
+        raise ImportError(
+            f"The following packages are required to use UiPath Bedrock LLMs: {packages_str}\n"
+            "Please install them using one of the following methods:\n\n"
+            "  # Using pip:\n"
+            "  pip install uipath-llamaindex[bedrock]\n\n"
+            "  # Using uv:\n"
+            "  uv add 'uipath-llamaindex[bedrock]'\n\n"
+        )
+
+
+_check_bedrock_dependencies()
+
+import boto3  # type: ignore[import-untyped]
+from llama_index.core.base.llms.types import (  # noqa: E402
+    ChatMessage,
+    ChatResponse,
+    ChatResponseAsyncGen,
+    CompletionResponse,
+    CompletionResponseAsyncGen,
+)
+from llama_index.core.llms.callbacks import (  # noqa: E402
+    llm_chat_callback,
+    llm_completion_callback,
+)
+from llama_index.llms.bedrock import Bedrock  # type: ignore[import-untyped]
+from llama_index.llms.bedrock_converse import (  # type: ignore[import-untyped]
+    BedrockConverse,
+)
+
+
+class AwsBedrockCompletionsPassthroughClient:
+    """Factory for boto3 / aiobotocore objects whose Bedrock requests are re-targeted.
+
+    A ``before-send`` handler is registered for every ``bedrock-runtime``
+    operation. The handler replaces the request URL with one built from the
+    ``UIPATH_URL`` environment variable plus the vendor endpoint, and adds the
+    bearer token and UiPath headers.
+    """
+
+    # Event pattern the request-rewriting hook is registered under.
+    _BEFORE_SEND_EVENT = "before-send.bedrock-runtime.*"
+
+    def __init__(
+        self,
+        model: str,
+        token: str,
+        api_flavor: str,
+    ):
+        """Store the model id, bearer token and API flavor header value."""
+        self._vendor = "awsbedrock"
+        # Filled in by the first successful _build_base_url() call.
+        self._url: Optional[str] = None
+        self.api_flavor = api_flavor
+        self.token = token
+        self.model = model
+
+    @property
+    def endpoint(self) -> str:
+        """Vendor endpoint template with the vendor and model filled in."""
+        template = EndpointManager.get_vendor_endpoint()
+        return template.format(vendor=self._vendor, model=self.model)
+
+    def _build_base_url(self) -> str:
+        """Return the target URL, computing and caching it on first use.
+
+        Raises:
+            ValueError: If ``UIPATH_URL`` is unset or empty and no URL has been
+                cached yet.
+        """
+        if self._url:
+            return self._url
+
+        root = os.getenv("UIPATH_URL")
+        if not root:
+            raise ValueError("UIPATH_URL environment variable is required")
+
+        self._url = f"{root.rstrip('/')}/{self.endpoint}"
+        return self._url
+
+    def get_client(self):
+        """Create a synchronous ``bedrock-runtime`` client with the rewrite hook attached."""
+        # Region and credentials are placeholder values; the hook supplies the
+        # real destination and the Authorization header.
+        hooked_client = boto3.client(
+            "bedrock-runtime",
+            region_name="us-east-1",
+            aws_access_key_id="none",
+            aws_secret_access_key="none",
+            verify=True,
+        )
+        hooked_client.meta.events.register(
+            self._BEFORE_SEND_EVENT, self._modify_request
+        )
+        return hooked_client
+
+    def get_session(self):
+        """Create an aiobotocore session with the same rewrite hook, for async use."""
+        from aiobotocore.session import get_session  # type: ignore[import-untyped]
+
+        hooked_session = get_session()
+        emitter = hooked_session.get_component("event_emitter")
+        emitter.register(self._BEFORE_SEND_EVENT, self._modify_request)
+        return hooked_session
+
+    def _modify_request(self, request, **kwargs):
+        """Rewrite an outgoing request so it is sent to the UiPath endpoint.
+
+        The streaming flag is derived from the original URL before it is
+        overwritten: URLs ending in ``-stream`` (``converse-stream``,
+        ``invoke-with-response-stream``) are streaming, everything else is not.
+        """
+        is_streaming = request.url.endswith("-stream")
+        request.url = self._build_base_url()
+
+        gateway_headers = {
+            "Authorization": f"Bearer {self.token}",
+            "X-UiPath-LlmGateway-ApiFlavor": self.api_flavor,
+            "X-UiPath-Streaming-Enabled": "true" if is_streaming else "false",
+        }
+
+        # Job / process keys are forwarded only when set to a non-empty value.
+        optional_headers = (
+            ("UIPATH_JOB_KEY", "X-UiPath-JobKey"),
+            ("UIPATH_PROCESS_KEY", "X-UiPath-ProcessKey"),
+        )
+        for env_name, header_name in optional_headers:
+            env_value = os.getenv(env_name)
+            if env_value:
+                gateway_headers[header_name] = env_value
+
+        request.headers.update(gateway_headers)
+
+
+class UiPathChatBedrockConverse(BedrockConverse):
+    """``BedrockConverse`` LLM whose sync client and async session go through the UiPath passthrough hook."""
+
+    def __init__(
+        self,
+        org_id: Optional[str] = None,
+        tenant_id: Optional[str] = None,
+        token: Optional[str] = None,
+        model: str = BedrockModel.anthropic_claude_haiku_4_5,
+        **kwargs,
+    ):
+        """Resolve credentials, build the hooked client/session and initialise the base LLM.
+
+        Args:
+            org_id: Organization id; falls back to ``UIPATH_ORGANIZATION_ID``.
+            tenant_id: Tenant id; falls back to ``UIPATH_TENANT_ID``.
+            token: Access token; falls back to ``UIPATH_ACCESS_TOKEN``.
+            model: Bedrock model identifier.
+            **kwargs: Forwarded unchanged to ``BedrockConverse.__init__``.
+
+        Raises:
+            ValueError: If any of the three settings is neither passed nor
+                present in the environment.
+        """
+        org_id = org_id or os.getenv("UIPATH_ORGANIZATION_ID")
+        tenant_id = tenant_id or os.getenv("UIPATH_TENANT_ID")
+        token = token or os.getenv("UIPATH_ACCESS_TOKEN")
+
+        # org_id and tenant_id are only validated here; this constructor does
+        # not use them afterwards.
+        required_settings = (
+            (
+                org_id,
+                "UIPATH_ORGANIZATION_ID environment variable or org_id parameter is required",
+            ),
+            (
+                tenant_id,
+                "UIPATH_TENANT_ID environment variable or tenant_id parameter is required",
+            ),
+            (
+                token,
+                "UIPATH_ACCESS_TOKEN environment variable or token parameter is required",
+            ),
+        )
+        for setting_value, error_message in required_settings:
+            if not setting_value:
+                raise ValueError(error_message)
+
+        passthrough = AwsBedrockCompletionsPassthroughClient(
+            model=model,
+            token=token,
+            api_flavor="converse",
+        )
+
+        # Region and credentials are placeholders; the hooked client and
+        # session rewrite each request before it is sent.
+        super().__init__(
+            model=model,
+            client=passthrough.get_client(),
+            botocore_session=passthrough.get_session(),
+            region_name="us-east-1",
+            aws_access_key_id="none",
+            aws_secret_access_key="none",
+            **kwargs,
+        )
+
+
+class UiPathChatBedrock(Bedrock):
+    """``Bedrock`` (invoke API) LLM whose client goes through the UiPath passthrough hook.
+
+    Also supplies async completion and async streaming methods as simple
+    fallbacks built on the non-streaming calls.
+    """
+
+    def __init__(
+        self,
+        org_id: Optional[str] = None,
+        tenant_id: Optional[str] = None,
+        token: Optional[str] = None,
+        model: str = BedrockModel.anthropic_claude_haiku_4_5,
+        context_size: int = 200000,
+        **kwargs,
+    ):
+        """Resolve credentials, build the hooked client and initialise the base LLM.
+
+        Args:
+            org_id: Organization id; falls back to ``UIPATH_ORGANIZATION_ID``.
+            tenant_id: Tenant id; falls back to ``UIPATH_TENANT_ID``.
+            token: Access token; falls back to ``UIPATH_ACCESS_TOKEN``.
+            model: Bedrock model identifier.
+            context_size: Context window size passed to ``Bedrock.__init__``.
+            **kwargs: Forwarded unchanged to ``Bedrock.__init__``.
+
+        Raises:
+            ValueError: If any of the three settings is neither passed nor
+                present in the environment.
+        """
+        org_id = org_id or os.getenv("UIPATH_ORGANIZATION_ID")
+        tenant_id = tenant_id or os.getenv("UIPATH_TENANT_ID")
+        token = token or os.getenv("UIPATH_ACCESS_TOKEN")
+
+        # org_id and tenant_id are only validated here; this constructor does
+        # not use them afterwards.
+        if not org_id:
+            raise ValueError(
+                "UIPATH_ORGANIZATION_ID environment variable or org_id parameter is required"
+            )
+        if not tenant_id:
+            raise ValueError(
+                "UIPATH_TENANT_ID environment variable or tenant_id parameter is required"
+            )
+        if not token:
+            raise ValueError(
+                "UIPATH_ACCESS_TOKEN environment variable or token parameter is required"
+            )
+
+        passthrough_client = AwsBedrockCompletionsPassthroughClient(
+            model=model,
+            token=token,
+            api_flavor="invoke",
+        )
+
+        client = passthrough_client.get_client()
+
+        # Region and credentials are placeholders; the hooked client rewrites
+        # each request before it is sent.
+        super().__init__(
+            model=model,
+            client=client,
+            context_size=context_size,
+            aws_access_key_id="none",
+            aws_secret_access_key="none",
+            region_name="us-east-1",
+            **kwargs,
+        )
+
+    @llm_completion_callback()
+    async def acomplete(
+        self, prompt: str, formatted: bool = False, **kwargs: Any
+    ) -> CompletionResponse:
+        """Async completion endpoint - runs the sync ``complete`` in a worker thread.
+
+        ``complete`` performs a blocking call, so invoking it directly inside
+        this coroutine would stall the event loop until the response arrives.
+        """
+        import asyncio
+
+        return await asyncio.to_thread(
+            self.complete, prompt, formatted=formatted, **kwargs
+        )
+
+    @llm_chat_callback()
+    async def astream_chat(
+        self, messages: Sequence[ChatMessage], **kwargs: Any
+    ) -> ChatResponseAsyncGen:
+        """Async streaming chat fallback - calls achat and yields single response.
+
+        The whole message content is emitted as one ``delta`` (empty string
+        when the content is falsy).
+        """
+
+        async def gen() -> ChatResponseAsyncGen:
+            # achat is not defined in this class; presumably inherited from
+            # the Bedrock base class.
+            response = await self.achat(messages, **kwargs)
+            yield ChatResponse(
+                message=response.message,
+                raw=response.raw,
+                delta=response.message.content or "",
+                additional_kwargs=response.additional_kwargs,
+            )
+
+        return gen()
+
+    @llm_completion_callback()
+    async def astream_complete(
+        self, prompt: str, formatted: bool = False, **kwargs: Any
+    ) -> CompletionResponseAsyncGen:
+        """Async streaming completion fallback - calls acomplete and yields single response.
+
+        The whole completion text is emitted as one ``delta``.
+        """
+
+        async def gen() -> CompletionResponseAsyncGen:
+            response = await self.acomplete(prompt, formatted=formatted, **kwargs)
+            yield CompletionResponse(
+                text=response.text,
+                raw=response.raw,
+                delta=response.text,
+                additional_kwargs=response.additional_kwargs,
+            )
+
+        return gen()
@@ -0,0 +1,33 @@
+from enum import Enum
+
+
+class OpenAIModel(Enum):
+    """OpenAI model identifiers.
+
+    Each member's ``value`` is the model identifier string.
+    """
+
+    GPT_4_1_2025_04_14 = "gpt-4.1-2025-04-14"
+    GPT_4_1_MINI_2025_04_14 = "gpt-4.1-mini-2025-04-14"
+    GPT_4_1_NANO_2025_04_14 = "gpt-4.1-nano-2025-04-14"
+    GPT_4O_2024_05_13 = "gpt-4o-2024-05-13"
+    GPT_4O_2024_08_06 = "gpt-4o-2024-08-06"
+    GPT_4O_2024_11_20 = "gpt-4o-2024-11-20"
+    GPT_4O_MINI_2024_07_18 = "gpt-4o-mini-2024-07-18"
+    O3_MINI_2025_01_31 = "o3-mini-2025-01-31"
+    TEXT_DAVINCI_003 = "text-davinci-003"
+
+
+class GeminiModel:
+    """Supported Google Gemini model identifiers.
+
+    A plain class rather than an ``Enum``: each attribute is the identifier
+    string itself, so no ``.value`` access is needed.
+    """
+
+    gemini_2_5_pro = "gemini-2.5-pro"
+    gemini_2_5_flash = "gemini-2.5-flash"
+    gemini_2_0_flash_001 = "gemini-2.0-flash-001"
+
+
+class BedrockModel:
+    """Supported AWS Bedrock model identifiers.
+
+    A plain class rather than an ``Enum``: each attribute is the identifier
+    string itself, so it can be used directly wherever a ``str`` model id is
+    expected.
+    """
+
+    # Claude 3.7 models
+    anthropic_claude_3_7_sonnet = "anthropic.claude-3-7-sonnet-20250219-v1:0"
+
+    # Claude 4 and 4.5 models
+    anthropic_claude_sonnet_4 = "anthropic.claude-sonnet-4-20250514-v1:0"
+    anthropic_claude_sonnet_4_5 = "anthropic.claude-sonnet-4-5-20250929-v1:0"
+    anthropic_claude_haiku_4_5 = "anthropic.claude-haiku-4-5-20251001-v1:0"