"""Deepgram Voice Agent client that routes its LLM calls through the local proxy.

Connects to the Deepgram Voice Agent API via the Python SDK and configures
a custom "think" endpoint pointing at the proxy server. This lets you swap
LLM backends (OpenAI, Bedrock, etc.) without touching the agent code — just
change LLM_PROVIDER in your .env file.

Usage:
    # First start the proxy:
    uvicorn src.proxy:app --port 8080

    # Then run the agent:
    python -m src.agent
"""

import os
import signal
import sys
import threading

from dotenv import load_dotenv

load_dotenv()

from deepgram import DeepgramClient
from deepgram.agent.v1.types.agent_v1settings import AgentV1Settings
from deepgram.agent.v1.types.agent_v1conversation_text import AgentV1ConversationText
from deepgram.agent.v1.types.agent_v1settings_applied import AgentV1SettingsApplied
from deepgram.agent.v1.types.agent_v1welcome import AgentV1Welcome
from deepgram.agent.v1.types.agent_v1agent_thinking import AgentV1AgentThinking
from deepgram.agent.v1.types.agent_v1agent_audio_done import AgentV1AgentAudioDone
from deepgram.agent.v1.types.agent_v1error import AgentV1Error
from deepgram.agent.v1.types.agent_v1function_call_request import AgentV1FunctionCallRequest
from deepgram.agent.v1.types.agent_v1send_function_call_response import AgentV1SendFunctionCallResponse

PROXY_URL = os.environ.get("PROXY_URL", "http://localhost:8080")


def build_agent_settings(proxy_url: str = PROXY_URL) -> AgentV1Settings:
    """Build the Voice Agent settings that point the think endpoint at the proxy.

    The key insight: setting think.endpoint.url to our proxy means every LLM
    call the agent makes goes through the proxy, which routes to whichever
    backend LLM_PROVIDER selects. Changing providers requires zero code changes
    in this file — just update .env.
    """
    return AgentV1Settings(
        type="Settings",
        # ← tags label this request for identification in Deepgram usage reporting
        tags=["deepgram-examples"],
        audio={
            "input": {"encoding": "linear16", "sample_rate": 16000},
            "output": {"encoding": "linear16", "sample_rate": 16000},
        },
        agent={
            "listen": {
                "provider": {"type": "deepgram", "model": "nova-3"},
            },
            "think": {
                "provider": {"type": "open_ai", "model": "proxy"},
                # ← THIS enables custom LLM routing: the Voice Agent sends
                # chat-completions requests to our proxy instead of OpenAI
                "endpoint": {
                    "url": f"{proxy_url}/v1/chat/completions",
                    "headers": {},
                },
                "prompt": (
                    "You are a helpful voice assistant. Keep responses brief "
                    "and conversational — the user is speaking to you, not reading."
                ),
            },
            "speak": {
                "provider": {"type": "deepgram", "model": "aura-2-thalia-en"},
            },
            "greeting": "Hello! I'm your voice assistant powered by Deepgram. How can I help?",
        },
    )

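# For orientation: with the endpoint configured above, the Voice Agent POSTs
# OpenAI-style chat-completions requests to {proxy_url}/v1/chat/completions.
# Roughly (the exact fields Deepgram sends can vary by API version, so treat
# this as an illustration, not a contract):
#
#   {
#     "model": "proxy",
#     "messages": [
#       {"role": "system", "content": "<the prompt configured above>"},
#       {"role": "user", "content": "<latest transcribed user turn>"}
#     ],
#     "stream": true
#   }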

def run_agent(proxy_url: str = PROXY_URL) -> None:
    """Connect to the Deepgram Voice Agent API and handle agent events.

    This is a demonstration entry point: it opens the connection and logs
    events but sends no audio. In production you'd pipe audio from a phone
    call, browser WebSocket, microphone, or other source (see the
    stream_audio sketch near the end of this module).
    """
    if not os.environ.get("DEEPGRAM_API_KEY"):
        print("Error: DEEPGRAM_API_KEY not set", file=sys.stderr)
        sys.exit(1)

    client = DeepgramClient()
    settings = build_agent_settings(proxy_url)

    print(f"[agent] Connecting to Deepgram Voice Agent (proxy at {proxy_url})...")

    with client.agent.v1.connect() as connection:
        connection.send_settings(settings)

        stop_event = threading.Event()

        def on_recv():
            while not stop_event.is_set():
                try:
                    msg = connection.recv()
                except Exception:
                    break

                if isinstance(msg, AgentV1Welcome):
                    print(f"[agent] Connected — request_id: {msg.request_id}")
                elif isinstance(msg, AgentV1SettingsApplied):
                    print("[agent] Settings applied — proxy endpoint active")
                elif isinstance(msg, AgentV1ConversationText):
                    print(f"[{msg.role}] {msg.content}")
                elif isinstance(msg, AgentV1AgentThinking):
                    print("[agent] Thinking...")
                elif isinstance(msg, AgentV1AgentAudioDone):
                    print("[agent] Audio done")
                elif isinstance(msg, AgentV1Error):
                    print(f"[agent] Error: {msg.description}")
                elif isinstance(msg, bytes):
                    pass  # raw TTS audio from the agent; a real app would play or forward it
                elif isinstance(msg, AgentV1FunctionCallRequest):
                    for fn in msg.functions or []:
                        connection.send_function_call_response(
                            AgentV1SendFunctionCallResponse(
                                type="FunctionCallResponse",
                                id=fn.id,
                                output='{"error": "no functions registered"}',
                            )
                        )

            # Receive loop ended (connection closed or errored): unblock the main thread.
            stop_event.set()

        recv_thread = threading.Thread(target=on_recv, daemon=True)
        recv_thread.start()

        print("[agent] Agent is running. Press Ctrl+C to stop.")
        print("[agent] (No microphone input in this demo — connect a real audio source)")

        def handle_signal(sig, frame):
            stop_event.set()

        signal.signal(signal.SIGINT, handle_signal)

        stop_event.wait()
        print("\n[agent] Shutting down...")


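# A minimal sketch of wiring in a real audio source, for illustration only.
# ASSUMPTION: the method name for sending raw audio varies across Deepgram SDK
# versions (e.g. send_media or a plain send), so check the SDK you have
# installed. `audio_chunks` is any iterable of 16 kHz, 16-bit linear PCM bytes,
# matching the audio.input settings above. Nothing in this demo calls this.
def stream_audio(connection, audio_chunks) -> None:
    """Forward raw PCM chunks from any source (phone bridge, browser, mic)."""
    for chunk in audio_chunks:
        connection.send_media(chunk)  # assumed send method; see note above

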
if __name__ == "__main__":
    run_agent()