diff --git a/.openclaw-sync/source.json b/.openclaw-sync/source.json index 412e9bb40..a10934cad 100644 --- a/.openclaw-sync/source.json +++ b/.openclaw-sync/source.json @@ -1,5 +1,5 @@ { "repository": "openclaw/openclaw", - "sha": "3f217964d1f9063d7ad5ea8851eaac02b8c31b5c", - "syncedAt": "2026-05-07T23:42:07.494Z" + "sha": "63ec912786b27f4613a746420eed34f9714bcd11", + "syncedAt": "2026-05-07T23:48:52.502Z" } diff --git a/docs/gateway/config-agents.md b/docs/gateway/config-agents.md index c2936a965..0e13d148d 100644 --- a/docs/gateway/config-agents.md +++ b/docs/gateway/config-agents.md @@ -1388,7 +1388,7 @@ Defaults for Talk mode (macOS/iOS/Android). provider: "openai", providers: { openai: { - model: "gpt-realtime", + model: "gpt-realtime-2", voice: "alloy", }, }, diff --git a/docs/nodes/talk.md b/docs/nodes/talk.md index 4bc69ef82..15f9f4d86 100644 --- a/docs/nodes/talk.md +++ b/docs/nodes/talk.md @@ -81,7 +81,7 @@ Supported keys: providers: { openai: { apiKey: "openai_api_key", - model: "gpt-realtime", + model: "gpt-realtime-2", voice: "alloy", }, }, diff --git a/docs/providers/google.md b/docs/providers/google.md index d4b826ff1..47ef51430 100644 --- a/docs/providers/google.md +++ b/docs/providers/google.md @@ -398,9 +398,10 @@ Gateway relay transport, which keeps provider credentials on the Gateway. For maintainer live verification, run `OPENAI_API_KEY=... GEMINI_API_KEY=... node --import tsx scripts/dev/realtime-talk-live-smoke.ts`. -The Google leg mints the same constrained Live API token shape used by Control -UI Talk, opens the browser WebSocket endpoint, sends the initial setup payload, -and waits for `setupComplete`. +The smoke also covers OpenAI backend/WebRTC paths; the Google leg mints the same +constrained Live API token shape used by Control UI Talk, opens the browser +WebSocket endpoint, sends the initial setup payload, and waits for +`setupComplete`. ## Advanced configuration diff --git a/docs/providers/openai.md b/docs/providers/openai.md index 85b9750aa..425670cae 100644 --- a/docs/providers/openai.md +++ b/docs/providers/openai.md @@ -641,15 +641,15 @@ Legacy `plugins.entries.openai.config.personality` is still read as a compatibil | Setting | Config path | Default | |---------|------------|---------| - | Model | `plugins.entries.voice-call.config.realtime.providers.openai.model` | `gpt-realtime-1.5` | + | Model | `plugins.entries.voice-call.config.realtime.providers.openai.model` | `gpt-realtime-2` | | Voice | `...openai.voice` | `alloy` | - | Temperature | `...openai.temperature` | `0.8` | + | Temperature (Azure deployment bridge) | `...openai.temperature` | `0.8` | | VAD threshold | `...openai.vadThreshold` | `0.5` | | Silence duration | `...openai.silenceDurationMs` | `500` | | API key | `...openai.apiKey` | Falls back to `OPENAI_API_KEY` | - Supports Azure OpenAI via `azureEndpoint` and `azureDeployment` config keys for backend realtime bridges. Supports bidirectional tool calling. Uses G.711 u-law audio format. + Backend OpenAI realtime bridges use the GA Realtime WebSocket session shape, which does not accept `session.temperature`. Azure OpenAI deployments remain available via `azureEndpoint` and `azureDeployment` and keep the deployment-compatible session shape. Supports bidirectional tool calling and G.711 u-law audio. @@ -657,9 +657,8 @@ Legacy `plugins.entries.openai.config.personality` is still read as a compatibil ephemeral client secret and a direct browser WebRTC SDP exchange against the OpenAI Realtime API. Maintainer live verification is available with `OPENAI_API_KEY=... GEMINI_API_KEY=... node --import tsx scripts/dev/realtime-talk-live-smoke.ts`; - the OpenAI leg mints a client secret in Node, generates a browser SDP offer - with fake microphone media, posts it to OpenAI, and applies the SDP answer - without logging secrets. + the OpenAI legs verify both the backend WebSocket bridge and the browser + WebRTC SDP exchange without logging secrets. diff --git a/docs/web/control-ui.md b/docs/web/control-ui.md index 88dec0720..8a9edd506 100644 --- a/docs/web/control-ui.md +++ b/docs/web/control-ui.md @@ -175,7 +175,7 @@ Imported themes are stored only in the current browser profile. They are not wri In the Chat composer, the Talk control is the waves button next to the microphone dictation button. When Talk starts, the composer status row shows `Connecting Talk...`, then `Talk live` while audio is connected, or `Asking OpenClaw...` while a realtime tool call is consulting the configured larger model through `talk.client.toolCall`. - Maintainer live smoke: `OPENAI_API_KEY=... GEMINI_API_KEY=... node --import tsx scripts/dev/realtime-talk-live-smoke.ts` verifies the OpenAI browser WebRTC SDP exchange, Google Live constrained-token browser WebSocket setup, and the Gateway relay browser adapter with fake microphone media. The command prints provider status only and does not log secrets. + Maintainer live smoke: `OPENAI_API_KEY=... GEMINI_API_KEY=... node --import tsx scripts/dev/realtime-talk-live-smoke.ts` verifies the OpenAI backend WebSocket bridge, OpenAI browser WebRTC SDP exchange, Google Live constrained-token browser WebSocket setup, and the Gateway relay browser adapter with fake microphone media. The command prints provider status only and does not log secrets.