GetStream
diff --git a/‎…_speech/llm_audio_conversation/README.md‎ ‎…enai_realtime_speech_to_speech/README.md‎examples/openai_realtime_speech_to_speech/llm_audio_conversation/README.md renamed to examples/openai_realtime_speech_to_speech/README.md b/‎…_speech/llm_audio_conversation/README.md‎ ‎…enai_realtime_speech_to_speech/README.md‎examples/openai_realtime_speech_to_speech/llm_audio_conversation/README.md renamed to examples/openai_realtime_speech_to_speech/README.md
diff --git a/‎…peech/llm_audio_conversation/__init__.py‎ ‎…ai_realtime_speech_to_speech/__init__.py‎examples/openai_realtime_speech_to_speech/llm_audio_conversation/__init__.py renamed to examples/openai_realtime_speech_to_speech/__init__.py b/‎…peech/llm_audio_conversation/__init__.py‎ ‎…ai_realtime_speech_to_speech/__init__.py‎examples/openai_realtime_speech_to_speech/llm_audio_conversation/__init__.py renamed to examples/openai_realtime_speech_to_speech/__init__.py
diff --git a/‎examples/openai_realtime_speech_to_speech/llm_audio_conversation/main.py‎
Lines changed: 0 additions & 110 deletions b/‎examples/openai_realtime_speech_to_speech/llm_audio_conversation/main.py‎
Lines changed: 0 additions & 110 deletions
diff --git a/‎examples/openai_realtime_speech_to_speech/main.py‎
Lines changed: 111 additions & 0 deletions b/‎examples/openai_realtime_speech_to_speech/main.py‎
Lines changed: 111 additions & 0 deletions
diff --git a/‎…ch/llm_audio_conversation/pyproject.toml‎ ‎…realtime_speech_to_speech/pyproject.toml‎examples/openai_realtime_speech_to_speech/llm_audio_conversation/pyproject.toml renamed to examples/openai_realtime_speech_to_speech/pyproject.toml
Lines changed: 0 additions & 4 deletions b/‎…ch/llm_audio_conversation/pyproject.toml‎ ‎…realtime_speech_to_speech/pyproject.toml‎examples/openai_realtime_speech_to_speech/llm_audio_conversation/pyproject.toml renamed to examples/openai_realtime_speech_to_speech/pyproject.toml
Lines changed: 0 additions & 4 deletions
diff --git a/‎getstream/plugins/sts/__init__.py‎
Lines changed: 52 additions & 0 deletions b/‎getstream/plugins/sts/__init__.py‎
Lines changed: 52 additions & 0 deletions
diff --git a/‎getstream/plugins/sts/openai_realtime/__init__.py‎
Lines changed: 3 additions & 0 deletions b/‎getstream/plugins/sts/openai_realtime/__init__.py‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎getstream/plugins/sts/openai_realtime/pyproject.toml‎
Lines changed: 25 additions & 0 deletions b/‎getstream/plugins/sts/openai_realtime/pyproject.toml‎
Lines changed: 25 additions & 0 deletions
@@ -0,0 +1,111 @@
+import asyncio
+import logging
+import os
+from uuid import uuid4
+from dotenv import load_dotenv
+from examples.utils import create_user, open_browser
+from getstream import Stream
+from getstream.plugins.sts.openai_realtime import OpenAIRealtime
+
+
+# Configure the root logger for the demo: INFO level with timestamped,
+# logger-name-prefixed records.
+logging.basicConfig(
+    level=logging.INFO,
+    format="%(asctime)s - %(name)s - %(levelname)s - %(message)s",
+    force=True,  # Override any previous basicConfig calls
+)
+
+# Explicitly pin the OpenAI Realtime plugin logger to INFO (the same level as
+# the root logger above); change this to logging.DEBUG for more detailed output.
+logging.getLogger("getstream.plugins.sts.openai_realtime.sts").setLevel(logging.INFO)
+
+
+async def main():
+    """Run a demo call with an OpenAI Speech-to-Speech agent attached.
+
+    The demo loads a ``.env`` file from the parent directory of this script,
+    creates a throwaway human user and bot user, creates a call, opens the
+    browser UI for the human user, and connects the OpenAI Realtime bot to
+    the call. It then idles until the bot reports that it is no longer
+    connected or the run is interrupted.
+
+    On exit the bot is closed and both throwaway users are deleted. If
+    ``OPENAI_API_KEY`` is not set, the function logs an error and returns
+    before creating any resources.
+    """
+
+    load_dotenv(os.path.join(os.path.dirname(__file__), "..", ".env"))
+
+    # Fail fast: without an API key there is no point creating users, a call,
+    # or opening the browser, only to tear everything down again.
+    openai_api_key = os.getenv("OPENAI_API_KEY")
+    if not openai_api_key:
+        logging.error("❌ OPENAI_API_KEY not found in environment")
+        return
+
+    # Initialize Stream client from env vars (STREAM_API_KEY / SECRET / BASE_URL)
+    client = Stream.from_env()
+
+    user_id = f"user-{uuid4()}"
+    create_user(client, user_id, "My User")
+    logging.info("👤 Created user: %s", user_id)
+
+    user_token = client.create_token(user_id, expiration=3600)
+    logging.info("🔑 Created token for user: %s", user_id)
+
+    bot_user_id = f"openai-realtime-speech-to-speech-bot-{uuid4()}"
+    create_user(client, bot_user_id, "OpenAI Realtime Speech to Speech Bot")
+    logging.info("🤖 Created bot user: %s", bot_user_id)
+
+    call_id = str(uuid4())
+    logging.info("📞 Call ID: %s", call_id)
+
+    call = client.video.call("default", call_id)
+    call.get_or_create(data={"created_by_id": bot_user_id})
+    logging.info("📞 Call created: %s", call_id)
+
+    # Open demo browser so you can join from the UI
+    open_browser(client.api_key, user_token, call_id)
+
+    sts_bot = OpenAIRealtime(
+        api_key=openai_api_key,
+        model="gpt-4o-realtime-preview",
+        instructions="You are a friendly assistant; reply verbally in a short sentence.",
+        voice="alloy",
+    )
+
+    # Lifecycle events emitted by the bot itself.
+    @sts_bot.on("connected")
+    async def _on_connected():
+        print("✅ CONNECTED EVENT RECEIVED")
+        logging.info("✅ Bot connected successfully")
+
+    @sts_bot.on("disconnected")
+    async def _on_disconnected():
+        print("❌ DISCONNECTED EVENT RECEIVED")
+        logging.info("❌ Bot disconnected")
+
+    @sts_bot.on("error")
+    async def _on_error(error):
+        print(f"💥 ERROR EVENT RECEIVED: {error}")
+        logging.error("💥 Bot error: %s", error)
+
+    # One shared handler registered for several provider/call event names.
+    @sts_bot.on("session.created")
+    @sts_bot.on("session.updated")
+    @sts_bot.on("conversation.item.created")
+    @sts_bot.on("response.created")
+    @sts_bot.on("response.done")
+    @sts_bot.on("call.session_participant_joined")
+    @sts_bot.on("call.session_participant_left")
+    async def _on_openai_event(event):
+        print(f"🔔 Event received: {event.type}")
+        print(f"   Event data: {event}")
+        logging.info("🔔 Event: %s", event.type)
+
+    try:
+        logging.info("Connecting to OpenAI Realtime...")
+
+        await sts_bot.connect(call, agent_user_id=bot_user_id)
+        logging.info("🎧 Listening for responses... (Press Ctrl+C to stop)")
+        logging.info("💡 Try speaking in the browser to generate audio events!")
+
+        # Poll once per second until the bot reports it is disconnected.
+        while sts_bot.is_connected:
+            await asyncio.sleep(1)
+
+    except KeyboardInterrupt:  # noqa: WPS420
+        logging.info("\n⏹️  Stopping OpenAI Realtime Speech to Speech bot…")
+    except asyncio.CancelledError:
+        # Under asyncio.run() on Python 3.11+, Ctrl+C cancels the main task
+        # instead of raising KeyboardInterrupt inside the coroutine. Log the
+        # stop message and re-raise so the event loop can finish cancellation.
+        logging.info("\n⏹️  Stopping OpenAI Realtime Speech to Speech bot…")
+        raise
+    except Exception as e:  # noqa: BLE001
+        logging.exception("❌ Error: %s", e)
+    finally:
+        logging.info("Cleaning up...")
+        try:
+            await sts_bot.close()
+        finally:
+            # Always delete the throwaway users, even if closing the bot fails.
+            client.delete_users([user_id, bot_user_id])
+        logging.info("Cleanup complete")
+
+
+# Script entry point: run the async demo on a fresh event loop.
+if __name__ == "__main__":
+    asyncio.run(main())
@@ -7,10 +7,6 @@ requires-python = ">=3.9"
 license = {text = "MIT"}
 
 dependencies = [
-    "getstream[webrtc]",
-    "getstream-plugins-stt-deepgram",
-    "getstream-plugins-tts-elevenlabs",
-    "getstream-plugins-vad-silero",
     "python-dotenv>=1.0.0",
     "aiortc>=1.10.1",
     "numpy>=2.0.0",
 
@@ -0,0 +1,52 @@
+import abc
+import logging
+
+from pyee.asyncio import AsyncIOEventEmitter
+
+
+logger = logging.getLogger(__name__)
+
+
+class STS(AsyncIOEventEmitter, abc.ABC):
+    """Abstract base for Speech-to-Speech (full duplex) integrations.
+
+    A concrete implementation is expected to:
+
+    * set up an audio session (usually via Stream Video
+      `Call.connect_openai`);
+    * emit the high-level events produced by the AI agent, for example
+      ``conversation.updated`` or ``error``;
+    * optionally offer convenience methods such as ``update_session`` or
+      ``send_user_message``.
+
+    Events every STS implementation emits:
+        - *connected*: the underlying websocket is ready
+        - *disconnected*: the websocket was closed (gracefully or on error)
+        - *error*: an exception bubbled up
+        - *<any other event type coming from the provider>*: forwarded verbatim
+    """
+
+    def __init__(self):
+        super().__init__()
+        # Connection flag surfaced through ``is_connected``. Subclasses are
+        # responsible for updating it so that embedders can introspect the
+        # session state.
+        self._is_connected = False
+
+    # ---------------------------------------------------------------------
+    # State introspection
+    # ---------------------------------------------------------------------
+    @property
+    def is_connected(self) -> bool:
+        """Whether the realtime session is currently active."""
+        return self._is_connected
+
+    # ---------------------------------------------------------------------
+    # Lifecycle hooks (implemented by each provider)
+    # ---------------------------------------------------------------------
+    @abc.abstractmethod
+    async def connect(self, *args, **kwargs):  # pragma: no cover
+        """Open the provider-specific realtime connection."""
+
+    @abc.abstractmethod
+    async def close(self):  # pragma: no cover
+        """Shut the connection down and free every resource it holds."""
+
+# Public API of this module
+__all__ = ["STS"]
@@ -0,0 +1,3 @@
+from .sts import OpenAIRealtime
+
+__all__ = ["OpenAIRealtime"] 
@@ -0,0 +1,25 @@
+[build-system]
+requires = ["setuptools>=42", "wheel"]
+build-backend = "setuptools.build_meta"
+
+[project]
+name = "getstream-plugins-sts-openai-realtime"
+version = "0.1.0"
+description = "OpenAI Realtime STS plugin for GetStream"
+readme = "README.md"
+requires-python = ">=3.9"
+license = {text = "MIT"}
+dependencies = [
+    "getstream[webrtc]",
+
+]
+
+[project.optional-dependencies]
+test = [
+    "pytest>=7.0.0",
+    "pytest-asyncio>=0.18.0",
+]
+
+[tool.uv.sources]
+getstream = { workspace = true }
+getstream-plugins-sts-openai-realtime = { workspace = true }
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+from .sts import OpenAIRealtime`
	`2`	`+`
	`3`	`+__all__ = ["OpenAIRealtime"]`