@openclaw/voice-call 2026.3.13 → 2026.5.1-beta.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (103)
  1. package/README.md +25 -5
  2. package/api.ts +16 -0
  3. package/cli-metadata.ts +10 -0
  4. package/config-api.ts +12 -0
  5. package/index.test.ts +866 -0
  6. package/index.ts +353 -148
  7. package/openclaw.plugin.json +336 -157
  8. package/package.json +33 -5
  9. package/runtime-api.ts +20 -0
  10. package/runtime-entry.ts +1 -0
  11. package/setup-api.ts +47 -0
  12. package/src/allowlist.test.ts +18 -0
  13. package/src/cli.ts +533 -68
  14. package/src/config-compat.test.ts +120 -0
  15. package/src/config-compat.ts +227 -0
  16. package/src/config.test.ts +160 -12
  17. package/src/config.ts +243 -74
  18. package/src/core-bridge.ts +2 -147
  19. package/src/deep-merge.test.ts +40 -0
  20. package/src/gateway-continue-operation.ts +200 -0
  21. package/src/http-headers.ts +6 -3
  22. package/src/manager/context.ts +6 -5
  23. package/src/manager/events.test.ts +179 -19
  24. package/src/manager/events.ts +48 -30
  25. package/src/manager/lifecycle.ts +53 -0
  26. package/src/manager/lookup.test.ts +52 -0
  27. package/src/manager/outbound.test.ts +464 -0
  28. package/src/manager/outbound.ts +148 -55
  29. package/src/manager/store.ts +18 -6
  30. package/src/manager/timers.test.ts +129 -0
  31. package/src/manager/timers.ts +4 -3
  32. package/src/manager/twiml.test.ts +13 -0
  33. package/src/manager/twiml.ts +8 -0
  34. package/src/manager.closed-loop.test.ts +30 -12
  35. package/src/manager.inbound-allowlist.test.ts +77 -10
  36. package/src/manager.notify.test.ts +344 -20
  37. package/src/manager.restore.test.ts +95 -8
  38. package/src/manager.test-harness.ts +8 -6
  39. package/src/manager.ts +79 -5
  40. package/src/media-stream.test.ts +578 -81
  41. package/src/media-stream.ts +235 -54
  42. package/src/providers/base.ts +19 -0
  43. package/src/providers/mock.ts +7 -1
  44. package/src/providers/plivo.test.ts +50 -6
  45. package/src/providers/plivo.ts +14 -6
  46. package/src/providers/shared/call-status.ts +2 -1
  47. package/src/providers/shared/guarded-json-api.test.ts +106 -0
  48. package/src/providers/shared/guarded-json-api.ts +1 -1
  49. package/src/providers/telnyx.test.ts +178 -6
  50. package/src/providers/telnyx.ts +40 -3
  51. package/src/providers/twilio/api.test.ts +145 -0
  52. package/src/providers/twilio/api.ts +67 -16
  53. package/src/providers/twilio/twiml-policy.ts +6 -10
  54. package/src/providers/twilio/webhook.ts +1 -1
  55. package/src/providers/twilio.test.ts +425 -25
  56. package/src/providers/twilio.ts +230 -77
  57. package/src/providers/twilio.types.ts +17 -0
  58. package/src/realtime-defaults.ts +3 -0
  59. package/src/realtime-fast-context.test.ts +88 -0
  60. package/src/realtime-fast-context.ts +165 -0
  61. package/src/realtime-transcription.runtime.ts +4 -0
  62. package/src/realtime-voice.runtime.ts +5 -0
  63. package/src/response-generator.test.ts +277 -0
  64. package/src/response-generator.ts +186 -40
  65. package/src/response-model.test.ts +71 -0
  66. package/src/response-model.ts +23 -0
  67. package/src/runtime.test.ts +351 -0
  68. package/src/runtime.ts +254 -24
  69. package/src/telephony-audio.test.ts +61 -0
  70. package/src/telephony-audio.ts +1 -79
  71. package/src/telephony-tts.test.ts +133 -12
  72. package/src/telephony-tts.ts +155 -2
  73. package/src/test-fixtures.ts +26 -7
  74. package/src/tts-provider-voice.test.ts +34 -0
  75. package/src/tts-provider-voice.ts +21 -0
  76. package/src/tunnel.test.ts +166 -0
  77. package/src/tunnel.ts +1 -1
  78. package/src/types.ts +24 -37
  79. package/src/utils.test.ts +17 -0
  80. package/src/voice-mapping.test.ts +34 -0
  81. package/src/voice-mapping.ts +3 -2
  82. package/src/webhook/realtime-handler.test.ts +598 -0
  83. package/src/webhook/realtime-handler.ts +485 -0
  84. package/src/webhook/stale-call-reaper.test.ts +88 -0
  85. package/src/webhook/stale-call-reaper.ts +5 -0
  86. package/src/webhook/tailscale.test.ts +214 -0
  87. package/src/webhook/tailscale.ts +19 -5
  88. package/src/webhook-exposure.test.ts +33 -0
  89. package/src/webhook-exposure.ts +84 -0
  90. package/src/webhook-security.test.ts +172 -21
  91. package/src/webhook-security.ts +43 -29
  92. package/src/webhook.hangup-once.lifecycle.test.ts +135 -0
  93. package/src/webhook.test.ts +1145 -27
  94. package/src/webhook.ts +513 -100
  95. package/src/webhook.types.ts +5 -0
  96. package/src/websocket-test-support.ts +72 -0
  97. package/tsconfig.json +16 -0
  98. package/CHANGELOG.md +0 -121
  99. package/src/providers/index.ts +0 -10
  100. package/src/providers/stt-openai-realtime.test.ts +0 -42
  101. package/src/providers/stt-openai-realtime.ts +0 -311
  102. package/src/providers/tts-openai.test.ts +0 -43
  103. package/src/providers/tts-openai.ts +0 -221
@@ -0,0 +1,120 @@
1
+ import { describe, expect, it } from "vitest";
2
+ import {
3
+ VOICE_CALL_LEGACY_CONFIG_REMOVAL_VERSION,
4
+ collectVoiceCallLegacyConfigIssues,
5
+ formatVoiceCallLegacyConfigWarnings,
6
+ migrateVoiceCallLegacyConfigInput,
7
+ normalizeVoiceCallLegacyConfigInput,
8
+ parseVoiceCallPluginConfig,
9
+ } from "./config-compat.js";
10
+
11
// Exercises the legacy → canonical config shims exported by ./config-compat.js.
describe("voice-call config compatibility", () => {
  it("maps deprecated provider and twilio.from fields into canonical config", () => {
    const { provider, fromNumber } = parseVoiceCallPluginConfig({
      enabled: true,
      provider: "log",
      twilio: { from: "+15550001234" },
    });

    // The legacy provider name "log" is expected to come back as "mock".
    expect(provider).toBe("mock");
    expect(fromNumber).toBe("+15550001234");
  });

  it("moves legacy streaming OpenAI fields into streaming.providers.openai", () => {
    const legacyInput = {
      streaming: {
        enabled: true,
        sttProvider: "openai",
        openaiApiKey: "sk-test", // pragma: allowlist secret
        sttModel: "gpt-4o-transcribe",
        silenceDurationMs: 700,
        vadThreshold: 0.4,
      },
    };

    const result = normalizeVoiceCallLegacyConfigInput(legacyInput);

    expect(result).toMatchObject({
      streaming: {
        enabled: true,
        provider: "openai",
        providers: {
          openai: {
            apiKey: "sk-test",
            model: "gpt-4o-transcribe",
            silenceDurationMs: 700,
            vadThreshold: 0.4,
          },
        },
      },
    });

    // The flat legacy keys must no longer be present next to the nested ones.
    const streamingOut = result.streaming as Record<string, unknown>;
    expect(streamingOut.openaiApiKey).toBeUndefined();
    expect(streamingOut.sttModel).toBeUndefined();
  });

  it("reports doctor-oriented legacy issues and warnings", () => {
    const legacyConfig = {
      provider: "log",
      twilio: { from: "+15550001234" },
      streaming: {
        sttProvider: "openai",
        openaiApiKey: "sk-test", // pragma: allowlist secret
      },
    };

    const expectedIssues = [
      {
        path: "provider",
        replacement: "provider",
        message: 'Replace provider "log" with "mock".',
      },
      {
        path: "twilio.from",
        replacement: "fromNumber",
        message: "Move twilio.from to fromNumber.",
      },
      {
        path: "streaming.sttProvider",
        replacement: "streaming.provider",
        message: "Move streaming.sttProvider to streaming.provider.",
      },
      {
        path: "streaming.openaiApiKey",
        replacement: "streaming.providers.openai.apiKey",
        message: "Move streaming.openaiApiKey to streaming.providers.openai.apiKey.",
      },
    ];
    expect(collectVoiceCallLegacyConfigIssues(legacyConfig)).toEqual(expectedIssues);

    // One summary line first, then one line per issue, each under the config prefix.
    const warnings = formatVoiceCallLegacyConfigWarnings({
      value: legacyConfig,
      configPathPrefix: "plugins.entries.voice-call.config",
      doctorFixCommand: "openclaw doctor --fix",
    });
    expect(warnings).toEqual([
      `[voice-call] legacy config keys detected under plugins.entries.voice-call.config; runtime loading will not rewrite them, and support for the legacy shape will be removed in ${VOICE_CALL_LEGACY_CONFIG_REMOVAL_VERSION}. Run "openclaw doctor --fix".`,
      '[voice-call] plugins.entries.voice-call.config.provider: Replace provider "log" with "mock".',
      "[voice-call] plugins.entries.voice-call.config.twilio.from: Move twilio.from to fromNumber.",
      "[voice-call] plugins.entries.voice-call.config.streaming.sttProvider: Move streaming.sttProvider to streaming.provider.",
      "[voice-call] plugins.entries.voice-call.config.streaming.openaiApiKey: Move streaming.openaiApiKey to streaming.providers.openai.apiKey.",
    ]);
  });

  it("returns doctor migration change lines", () => {
    const { changes } = migrateVoiceCallLegacyConfigInput({
      value: {
        provider: "log",
        streaming: { sttProvider: "openai" },
      },
      configPathPrefix: "plugins.entries.voice-call.config",
    });

    expect(changes).toEqual([
      'Moved plugins.entries.voice-call.config.provider "log" → "mock".',
      "Moved plugins.entries.voice-call.config.streaming.sttProvider → plugins.entries.voice-call.config.streaming.provider.",
    ]);
  });
});
@@ -0,0 +1,227 @@
1
+ import { asOptionalRecord, readStringField } from "openclaw/plugin-sdk/text-runtime";
2
+ import type { VoiceCallConfig } from "./config.js";
3
+ import { VoiceCallConfigSchema } from "./config.js";
4
+
5
/**
 * Version string quoted in the legacy-config warning as the release in which
 * support for the legacy config shape will be removed.
 */
export const VOICE_CALL_LEGACY_CONFIG_REMOVAL_VERSION = "2026.6.0";

/** One deprecated key detected in a raw voice-call plugin config. */
type VoiceCallLegacyConfigIssue = {
  /** Dotted path of the legacy key, relative to the plugin config root. */
  path: string;
  /** Dotted path of the canonical key that supersedes it. */
  replacement: string;
  /** Human-readable instruction describing the required change. */
  message: string;
};

// Short local names for the SDK helpers used throughout this module.
const asObject = asOptionalRecord;
const getString = readStringField;
15
+
16
/**
 * Reads `obj[key]` and returns it only when it is a JavaScript number.
 *
 * Any other value, a missing key, or an undefined `obj` yields `undefined`.
 * The check is `typeof`-based, so `NaN` and infinities are passed through.
 */
function getNumber(obj: Record<string, unknown> | undefined, key: string): number | undefined {
  const candidate = obj?.[key];
  if (typeof candidate !== "number") {
    return undefined;
  }
  return candidate;
}
20
+
21
/**
 * Folds legacy ("compat") settings for one provider into a `providers` map.
 *
 * Settings already present under `providers[providerId]` take precedence over
 * `compatValues`. This matches how the rest of the migration resolves
 * conflicts (canonical `streaming.provider` and `fromNumber` win over their
 * legacy counterparts), so a stale legacy key can never overwrite a value the
 * user has already written in the canonical location.
 *
 * @param providersValue - Raw `providers` value from the config; it is
 *   narrowed with `asObject` before use.
 * @param providerId - Key of the provider entry that receives the compat values.
 * @param compatValues - Canonical-keyed values recovered from legacy fields.
 * @returns `asObject(providersValue)` unchanged when there is nothing to
 *   merge; otherwise a new record with the merged entry for `providerId`.
 */
function mergeProviderConfig(
  providersValue: unknown,
  providerId: string,
  compatValues: Record<string, unknown>,
): Record<string, unknown> | undefined {
  if (Object.keys(compatValues).length === 0) {
    return asObject(providersValue);
  }

  const providers = asObject(providersValue) ?? {};
  const existing = asObject(providers[providerId]) ?? {};
  return {
    ...providers,
    [providerId]: {
      // Legacy values only fill gaps: spreading `existing` last lets canonical
      // settings override anything recovered from deprecated keys.
      ...compatValues,
      ...existing,
    },
  };
}
40
+
41
/**
 * Scans a raw voice-call plugin config for deprecated keys.
 *
 * @param value - Raw config value; anything `asObject` does not accept is
 *   treated as an empty config.
 * @returns One issue per legacy key found, in a fixed order: provider,
 *   twilio.from, then the streaming keys. Empty when nothing legacy is present.
 */
export function collectVoiceCallLegacyConfigIssues(value: unknown): VoiceCallLegacyConfigIssue[] {
  const root = asObject(value) ?? {};
  const twilioSection = asObject(root.twilio);
  const streamingSection = asObject(root.streaming);

  // Each row: [legacy key is present, legacy path, canonical path].
  const relocations: Array<[boolean, string, string]> = [
    [typeof twilioSection?.from === "string", "twilio.from", "fromNumber"],
    [
      typeof streamingSection?.sttProvider === "string",
      "streaming.sttProvider",
      "streaming.provider",
    ],
    [
      typeof streamingSection?.openaiApiKey === "string",
      "streaming.openaiApiKey",
      "streaming.providers.openai.apiKey",
    ],
    [
      typeof streamingSection?.sttModel === "string",
      "streaming.sttModel",
      "streaming.providers.openai.model",
    ],
    [
      typeof streamingSection?.silenceDurationMs === "number",
      "streaming.silenceDurationMs",
      "streaming.providers.openai.silenceDurationMs",
    ],
    [
      typeof streamingSection?.vadThreshold === "number",
      "streaming.vadThreshold",
      "streaming.providers.openai.vadThreshold",
    ],
  ];

  const found: VoiceCallLegacyConfigIssue[] = [];

  // The provider rename is a value change rather than a key move, so it has
  // its own wording and is reported first.
  if (root.provider === "log") {
    found.push({
      path: "provider",
      replacement: "provider",
      message: 'Replace provider "log" with "mock".',
    });
  }

  for (const [present, path, replacement] of relocations) {
    if (present) {
      found.push({ path, replacement, message: `Move ${path} to ${replacement}.` });
    }
  }

  return found;
}
99
+
100
/**
 * Renders the legacy-key issues of a raw config as log-ready warning lines.
 *
 * @param params.value - Raw voice-call plugin config to inspect.
 * @param params.configPathPrefix - Dotted path prepended to every issue path.
 * @param params.doctorFixCommand - Command quoted in the summary line.
 * @returns An empty array when no legacy keys are found; otherwise one
 *   summary line followed by one line per issue.
 */
export function formatVoiceCallLegacyConfigWarnings(params: {
  value: unknown;
  configPathPrefix: string;
  doctorFixCommand: string;
}): string[] {
  const { value, configPathPrefix, doctorFixCommand } = params;

  const issues = collectVoiceCallLegacyConfigIssues(value);
  if (issues.length === 0) {
    return [];
  }

  const summary = `[voice-call] legacy config keys detected under ${configPathPrefix}; runtime loading will not rewrite them, and support for the legacy shape will be removed in ${VOICE_CALL_LEGACY_CONFIG_REMOVAL_VERSION}. Run "${doctorFixCommand}".`;
  const details = issues.map(
    ({ path, message }) => `[voice-call] ${configPathPrefix}.${path}: ${message}`,
  );
  return [summary, ...details];
}
117
+
118
/**
 * Rewrites a raw voice-call plugin config from the legacy key layout to the
 * canonical one and reports what was changed.
 *
 * The rewrite works on shallow copies of the top-level, `twilio` and
 * `streaming` objects. Canonical `provider`, `fromNumber` and
 * `streaming.provider` values win over their legacy counterparts.
 *
 * @param params.value - Raw config; anything `asObject` does not accept is
 *   treated as an empty config.
 * @param params.configPathPrefix - Dotted path used in the change lines;
 *   defaults to "plugins.entries.voice-call.config".
 * @returns `config` (the rewritten config), `changes` (one human-readable
 *   line per applied move) and `issues` (as reported by
 *   `collectVoiceCallLegacyConfigIssues`).
 */
export function migrateVoiceCallLegacyConfigInput(params: {
  value: unknown;
  configPathPrefix?: string;
}): {
  config: Record<string, unknown>;
  changes: string[];
  issues: VoiceCallLegacyConfigIssue[];
} {
  const source = asObject(params.value) ?? {};
  const legacyTwilio = asObject(source.twilio);
  const legacyStreaming = asObject(source.streaming);
  const prefix = params.configPathPrefix ?? "plugins.entries.voice-call.config";
  const issues = collectVoiceCallLegacyConfigIssues(source);

  // Flat legacy streaming keys mapped to their names under providers.openai.
  // Strings are carried over only when non-empty, numbers whenever present.
  const compatEntries: Array<[string, unknown]> = [
    ["apiKey", getString(legacyStreaming, "openaiApiKey") || undefined],
    ["model", getString(legacyStreaming, "sttModel") || undefined],
    ["silenceDurationMs", getNumber(legacyStreaming, "silenceDurationMs")],
    ["vadThreshold", getNumber(legacyStreaming, "vadThreshold")],
  ];
  const openaiCompat: Record<string, unknown> = Object.fromEntries(
    compatEntries.filter(([, entryValue]) => entryValue !== undefined),
  );

  const canonicalProvider = getString(legacyStreaming, "provider");
  const deprecatedProvider = getString(legacyStreaming, "sttProvider");

  let normalizedStreaming: Record<string, unknown> | undefined;
  if (legacyStreaming) {
    normalizedStreaming = {
      ...legacyStreaming,
      provider: canonicalProvider ?? deprecatedProvider,
      providers: mergeProviderConfig(legacyStreaming.providers, "openai", openaiCompat),
    };
    // Drop the flat legacy keys from the copy now that they are relocated.
    for (const legacyKey of [
      "sttProvider",
      "openaiApiKey",
      "sttModel",
      "silenceDurationMs",
      "vadThreshold",
    ]) {
      delete normalizedStreaming[legacyKey];
    }
  }

  let normalizedTwilio: Record<string, unknown> | undefined;
  if (legacyTwilio) {
    normalizedTwilio = { ...legacyTwilio };
    delete normalizedTwilio.from;
  }

  const hasLegacyFrom = typeof legacyTwilio?.from === "string";
  const config = {
    ...source,
    provider: source.provider === "log" ? "mock" : source.provider,
    fromNumber: source.fromNumber ?? (hasLegacyFrom ? legacyTwilio?.from : undefined),
    twilio: normalizedTwilio,
    streaming: normalizedStreaming,
  };

  const changes: string[] = [];
  if (source.provider === "log") {
    changes.push(`Moved ${prefix}.provider "log" → "mock".`);
  }

  // Each row: [move applies, legacy path, canonical path], in reporting order.
  const relocations: Array<[boolean, string, string]> = [
    // twilio.from is only reported when no canonical fromNumber string exists.
    [hasLegacyFrom && typeof source.fromNumber !== "string", "twilio.from", "fromNumber"],
    [
      typeof legacyStreaming?.sttProvider === "string",
      "streaming.sttProvider",
      "streaming.provider",
    ],
    [
      typeof legacyStreaming?.openaiApiKey === "string",
      "streaming.openaiApiKey",
      "streaming.providers.openai.apiKey",
    ],
    [
      typeof legacyStreaming?.sttModel === "string",
      "streaming.sttModel",
      "streaming.providers.openai.model",
    ],
    [
      typeof legacyStreaming?.silenceDurationMs === "number",
      "streaming.silenceDurationMs",
      "streaming.providers.openai.silenceDurationMs",
    ],
    [
      typeof legacyStreaming?.vadThreshold === "number",
      "streaming.vadThreshold",
      "streaming.providers.openai.vadThreshold",
    ],
  ];
  for (const [applies, fromPath, toPath] of relocations) {
    if (applies) {
      changes.push(`Moved ${prefix}.${fromPath} → ${prefix}.${toPath}.`);
    }
  }

  return { config, changes, issues };
}
220
+
221
/**
 * Returns only the rewritten config from `migrateVoiceCallLegacyConfigInput`,
 * run with its default path prefix; change lines and issues are discarded.
 */
export function normalizeVoiceCallLegacyConfigInput(value: unknown): Record<string, unknown> {
  const { config } = migrateVoiceCallLegacyConfigInput({ value });
  return config;
}
224
+
225
/**
 * Normalizes legacy keys in a raw plugin config, then parses the result with
 * `VoiceCallConfigSchema`.
 */
export function parseVoiceCallPluginConfig(value: unknown): VoiceCallConfig {
  const canonicalInput = normalizeVoiceCallLegacyConfigInput(value);
  return VoiceCallConfigSchema.parse(canonicalInput);
}
@@ -1,5 +1,7 @@
1
1
  import { afterEach, beforeEach, describe, expect, it } from "vitest";
2
2
  import {
3
+ VoiceCallConfigSchema,
4
+ resolveTwilioAuthToken,
3
5
  validateProviderConfig,
4
6
  normalizeVoiceCallConfig,
5
7
  resolveVoiceCallConfig,
@@ -11,11 +13,25 @@ function createBaseConfig(provider: "telnyx" | "twilio" | "plivo" | "mock"): Voi
11
13
  return createVoiceCallBaseConfig({ provider });
12
14
  }
13
15
 
16
/**
 * Test helper: builds an env-sourced reference object for the given id, using
 * the "default" provider (the tests pass it where a SecretRef is expected).
 */
function envRef(id: string) {
  const source = "env" as const;
  return { source, provider: "default", id };
}
19
+
20
/**
 * Test helper: returns the `tts` section together with its nested
 * `providers.elevenlabs` entry, throwing when that entry is missing or is not
 * an object.
 */
function requireElevenLabsTtsConfig(config: Pick<VoiceCallConfig, "tts">) {
  const { tts } = config;
  const elevenlabs = tts?.providers?.elevenlabs;
  if (elevenlabs && typeof elevenlabs === "object") {
    return { tts, elevenlabs };
  }
  throw new Error("voice-call config did not preserve nested elevenlabs TTS config");
}
28
+
14
29
  describe("validateProviderConfig", () => {
15
30
  const originalEnv = { ...process.env };
16
31
  const clearProviderEnv = () => {
17
32
  delete process.env.TWILIO_ACCOUNT_SID;
18
33
  delete process.env.TWILIO_AUTH_TOKEN;
34
+ delete process.env.TWILIO_FROM_NUMBER;
19
35
  delete process.env.TELNYX_API_KEY;
20
36
  delete process.env.TELNYX_CONNECTION_ID;
21
37
  delete process.env.TELNYX_PUBLIC_KEY;
@@ -54,6 +70,7 @@ describe("validateProviderConfig", () => {
54
70
  if (provider === "twilio") {
55
71
  process.env.TWILIO_ACCOUNT_SID = "AC123";
56
72
  process.env.TWILIO_AUTH_TOKEN = "secret";
73
+ process.env.TWILIO_FROM_NUMBER = "+15550001234";
57
74
  } else if (provider === "telnyx") {
58
75
  process.env.TELNYX_API_KEY = "KEY123";
59
76
  process.env.TELNYX_CONNECTION_ID = "CONN456";
@@ -69,6 +86,24 @@ describe("validateProviderConfig", () => {
69
86
  });
70
87
 
71
88
  describe("twilio provider", () => {
89
+ it("accepts SecretRef-backed auth tokens before runtime resolution", () => {
90
+ const config = VoiceCallConfigSchema.parse({
91
+ enabled: true,
92
+ provider: "twilio",
93
+ fromNumber: "+15550001234",
94
+ twilio: {
95
+ accountSid: "AC123",
96
+ authToken: envRef("TWILIO_AUTH_TOKEN"),
97
+ },
98
+ });
99
+
100
+ expect(config.twilio?.authToken).toEqual(envRef("TWILIO_AUTH_TOKEN"));
101
+ expect(validateProviderConfig(config)).toMatchObject({ valid: true, errors: [] });
102
+ expect(() => resolveTwilioAuthToken(config)).toThrow(
103
+ 'plugins.entries.voice-call.config.twilio.authToken: unresolved SecretRef "env:default:TWILIO_AUTH_TOKEN"',
104
+ );
105
+ });
106
+
72
107
  it("passes validation with mixed config and env vars", () => {
73
108
  process.env.TWILIO_AUTH_TOKEN = "secret";
74
109
  let config = createBaseConfig("twilio");
@@ -81,6 +116,20 @@ describe("validateProviderConfig", () => {
81
116
  expect(result.errors).toEqual([]);
82
117
  });
83
118
 
119
+ it("resolves the Twilio from number from environment", () => {
120
+ process.env.TWILIO_ACCOUNT_SID = "AC123";
121
+ process.env.TWILIO_AUTH_TOKEN = "secret";
122
+ process.env.TWILIO_FROM_NUMBER = "+15550001234";
123
+
124
+ const config = resolveVoiceCallConfig({
125
+ ...createBaseConfig("twilio"),
126
+ fromNumber: undefined,
127
+ });
128
+
129
+ expect(config.fromNumber).toBe("+15550001234");
130
+ expect(validateProviderConfig(config)).toMatchObject({ valid: true, errors: [] });
131
+ });
132
+
84
133
  it("fails validation when required twilio credentials are missing", () => {
85
134
  process.env.TWILIO_AUTH_TOKEN = "secret";
86
135
  const missingSid = validateProviderConfig(resolveVoiceCallConfig(createBaseConfig("twilio")));
@@ -170,6 +219,43 @@ describe("validateProviderConfig", () => {
170
219
  expect(result.errors).toEqual([]);
171
220
  });
172
221
  });
222
+
223
+ describe("realtime config", () => {
224
+ it("rejects disabled inbound policy for realtime mode", () => {
225
+ const config = createBaseConfig("twilio");
226
+ config.realtime.enabled = true;
227
+ config.inboundPolicy = "disabled";
228
+
229
+ const result = validateProviderConfig(config);
230
+
231
+ expect(result.valid).toBe(false);
232
+ expect(result.errors).toContain(
233
+ 'plugins.entries.voice-call.config.inboundPolicy must not be "disabled" when realtime.enabled is true',
234
+ );
235
+ });
236
+
237
+ it("rejects enabling realtime and streaming together", () => {
238
+ const config = createBaseConfig("twilio");
239
+ config.realtime.enabled = true;
240
+ config.streaming.enabled = true;
241
+ config.inboundPolicy = "allowlist";
242
+
243
+ const result = validateProviderConfig(config);
244
+
245
+ expect(result.valid).toBe(false);
246
+ expect(result.errors).toContain(
247
+ "plugins.entries.voice-call.config.realtime.enabled and plugins.entries.voice-call.config.streaming.enabled cannot both be true",
248
+ );
249
+ });
250
+ });
251
+ });
252
+
253
+ describe("resolveVoiceCallConfig", () => {
254
+ it("enables the pre-answer stale call reaper by default", () => {
255
+ const config = resolveVoiceCallConfig({ enabled: true, provider: "mock" });
256
+
257
+ expect(config.staleCallReaperSeconds).toBe(120);
258
+ });
173
259
  });
174
260
 
175
261
  describe("normalizeVoiceCallConfig", () => {
@@ -185,34 +271,96 @@ describe("normalizeVoiceCallConfig", () => {
185
271
 
186
272
  expect(normalized.serve.path).toBe("/voice/webhook");
187
273
  expect(normalized.streaming.streamPath).toBe("/custom-stream");
188
- expect(normalized.streaming.sttModel).toBe("gpt-4o-transcribe");
274
+ expect(normalized.streaming.provider).toBeUndefined();
275
+ expect(normalized.streaming.providers).toEqual({});
276
+ expect(normalized.realtime.streamPath).toBe("/voice/stream/realtime");
277
+ expect(normalized.realtime.toolPolicy).toBe("safe-read-only");
278
+ expect(normalized.realtime.fastContext).toEqual({
279
+ enabled: false,
280
+ timeoutMs: 800,
281
+ maxResults: 3,
282
+ sources: ["memory", "sessions"],
283
+ fallbackToConsult: false,
284
+ });
285
+ expect(normalized.realtime.instructions).toContain("openclaw_agent_consult");
189
286
  expect(normalized.tunnel.provider).toBe("none");
190
287
  expect(normalized.webhookSecurity.allowedHosts).toEqual([]);
191
288
  });
192
289
 
290
+ it("derives the realtime stream path from a custom webhook path", () => {
291
+ const normalized = normalizeVoiceCallConfig({
292
+ enabled: true,
293
+ provider: "twilio",
294
+ serve: {
295
+ path: "/custom/webhook",
296
+ },
297
+ });
298
+
299
+ expect(normalized.realtime.streamPath).toBe("/custom/stream/realtime");
300
+ });
301
+
193
302
  it("accepts partial nested TTS overrides and preserves nested objects", () => {
194
303
  const normalized = normalizeVoiceCallConfig({
195
304
  tts: {
196
305
  provider: "elevenlabs",
197
- elevenlabs: {
198
- apiKey: {
199
- source: "env",
200
- provider: "elevenlabs",
201
- id: "ELEVENLABS_API_KEY",
202
- },
203
- voiceSettings: {
204
- speed: 1.1,
306
+ providers: {
307
+ elevenlabs: {
308
+ apiKey: {
309
+ source: "env",
310
+ provider: "elevenlabs",
311
+ id: "ELEVENLABS_API_KEY",
312
+ },
313
+ voiceSettings: {
314
+ speed: 1.1,
315
+ },
205
316
  },
206
317
  },
207
318
  },
208
319
  });
209
320
 
210
- expect(normalized.tts?.provider).toBe("elevenlabs");
211
- expect(normalized.tts?.elevenlabs?.apiKey).toEqual({
321
+ const { tts, elevenlabs } = requireElevenLabsTtsConfig(normalized);
322
+ expect(tts.provider).toBe("elevenlabs");
323
+ expect(elevenlabs.apiKey).toEqual({
212
324
  source: "env",
213
325
  provider: "elevenlabs",
214
326
  id: "ELEVENLABS_API_KEY",
215
327
  });
216
- expect(normalized.tts?.elevenlabs?.voiceSettings).toEqual({ speed: 1.1 });
328
+ expect(elevenlabs.voiceSettings).toEqual({ speed: 1.1 });
329
+ });
330
+ });
331
+
332
+ describe("resolveVoiceCallConfig", () => {
333
+ it("preserves configured realtime instructions without env indirection", () => {
334
+ const resolved = resolveVoiceCallConfig({
335
+ enabled: true,
336
+ provider: "twilio",
337
+ realtime: {
338
+ enabled: true,
339
+ instructions: "Stay concise.",
340
+ },
341
+ });
342
+
343
+ expect(resolved.realtime.instructions).toBe("Stay concise.");
344
+ expect(resolved.realtime.toolPolicy).toBe("safe-read-only");
345
+ expect(resolved.realtime.provider).toBeUndefined();
346
+ });
347
+
348
+ it("leaves responseModel unset so voice responses can inherit runtime defaults", () => {
349
+ const resolved = resolveVoiceCallConfig({
350
+ enabled: true,
351
+ provider: "mock",
352
+ });
353
+
354
+ expect(resolved.responseModel).toBeUndefined();
355
+ });
356
+
357
+ it("preserves the configured voice response agent id", () => {
358
+ const resolved = resolveVoiceCallConfig({
359
+ enabled: true,
360
+ provider: "mock",
361
+ agentId: "voice",
362
+ });
363
+
364
+ expect(resolved.agentId).toBe("voice");
217
365
  });
218
366
  });