@johpaz/hive 1.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CONTRIBUTING.md +44 -0
- package/README.md +310 -0
- package/package.json +96 -0
- package/packages/cli/package.json +28 -0
- package/packages/cli/src/commands/agent-run.ts +168 -0
- package/packages/cli/src/commands/agents.ts +398 -0
- package/packages/cli/src/commands/chat.ts +142 -0
- package/packages/cli/src/commands/config.ts +50 -0
- package/packages/cli/src/commands/cron.ts +161 -0
- package/packages/cli/src/commands/dev.ts +95 -0
- package/packages/cli/src/commands/doctor.ts +133 -0
- package/packages/cli/src/commands/gateway.ts +443 -0
- package/packages/cli/src/commands/logs.ts +57 -0
- package/packages/cli/src/commands/mcp.ts +175 -0
- package/packages/cli/src/commands/message.ts +77 -0
- package/packages/cli/src/commands/onboard.ts +1868 -0
- package/packages/cli/src/commands/security.ts +144 -0
- package/packages/cli/src/commands/service.ts +50 -0
- package/packages/cli/src/commands/sessions.ts +116 -0
- package/packages/cli/src/commands/skills.ts +187 -0
- package/packages/cli/src/commands/update.ts +25 -0
- package/packages/cli/src/index.ts +185 -0
- package/packages/cli/src/utils/token.ts +6 -0
- package/packages/code-bridge/README.md +78 -0
- package/packages/code-bridge/package.json +18 -0
- package/packages/code-bridge/src/index.ts +95 -0
- package/packages/code-bridge/src/process-manager.ts +212 -0
- package/packages/code-bridge/src/schemas.ts +133 -0
- package/packages/core/package.json +46 -0
- package/packages/core/src/agent/agent-loop.ts +369 -0
- package/packages/core/src/agent/compaction.ts +140 -0
- package/packages/core/src/agent/context-compiler.ts +378 -0
- package/packages/core/src/agent/context-guard.ts +91 -0
- package/packages/core/src/agent/context.ts +138 -0
- package/packages/core/src/agent/conversation-store.ts +198 -0
- package/packages/core/src/agent/curator.ts +158 -0
- package/packages/core/src/agent/hooks.ts +166 -0
- package/packages/core/src/agent/index.ts +116 -0
- package/packages/core/src/agent/llm-client.ts +503 -0
- package/packages/core/src/agent/native-tools.ts +505 -0
- package/packages/core/src/agent/prompt-builder.ts +532 -0
- package/packages/core/src/agent/providers/index.ts +167 -0
- package/packages/core/src/agent/providers.ts +1 -0
- package/packages/core/src/agent/reflector.ts +170 -0
- package/packages/core/src/agent/service.ts +64 -0
- package/packages/core/src/agent/stuck-loop.ts +133 -0
- package/packages/core/src/agent/supervisor.ts +39 -0
- package/packages/core/src/agent/tracer.ts +102 -0
- package/packages/core/src/agent/workspace.ts +110 -0
- package/packages/core/src/canvas/canvas-manager.test.ts +161 -0
- package/packages/core/src/canvas/canvas-manager.ts +319 -0
- package/packages/core/src/canvas/canvas-tools.ts +420 -0
- package/packages/core/src/canvas/emitter.ts +115 -0
- package/packages/core/src/canvas/index.ts +2 -0
- package/packages/core/src/channels/base.ts +138 -0
- package/packages/core/src/channels/discord.ts +260 -0
- package/packages/core/src/channels/index.ts +7 -0
- package/packages/core/src/channels/manager.ts +383 -0
- package/packages/core/src/channels/slack.ts +287 -0
- package/packages/core/src/channels/telegram.ts +502 -0
- package/packages/core/src/channels/webchat.ts +128 -0
- package/packages/core/src/channels/whatsapp.ts +375 -0
- package/packages/core/src/config/index.ts +12 -0
- package/packages/core/src/config/loader.ts +529 -0
- package/packages/core/src/events/event-bus.ts +169 -0
- package/packages/core/src/gateway/index.ts +5 -0
- package/packages/core/src/gateway/initializer.ts +290 -0
- package/packages/core/src/gateway/lane-queue.ts +169 -0
- package/packages/core/src/gateway/resolver.ts +108 -0
- package/packages/core/src/gateway/router.ts +124 -0
- package/packages/core/src/gateway/server.ts +3317 -0
- package/packages/core/src/gateway/session.ts +95 -0
- package/packages/core/src/gateway/slash-commands.ts +192 -0
- package/packages/core/src/heartbeat/index.ts +157 -0
- package/packages/core/src/index.ts +19 -0
- package/packages/core/src/integrations/catalog.ts +286 -0
- package/packages/core/src/integrations/env.ts +64 -0
- package/packages/core/src/integrations/index.ts +2 -0
- package/packages/core/src/memory/index.ts +1 -0
- package/packages/core/src/memory/notes.ts +68 -0
- package/packages/core/src/plugins/api.ts +128 -0
- package/packages/core/src/plugins/index.ts +2 -0
- package/packages/core/src/plugins/loader.ts +365 -0
- package/packages/core/src/resilience/circuit-breaker.ts +225 -0
- package/packages/core/src/security/google-chat.ts +269 -0
- package/packages/core/src/security/index.ts +192 -0
- package/packages/core/src/security/pairing.ts +250 -0
- package/packages/core/src/security/rate-limit.ts +270 -0
- package/packages/core/src/security/signal.ts +321 -0
- package/packages/core/src/state/store.ts +312 -0
- package/packages/core/src/storage/bun-sqlite-store.ts +188 -0
- package/packages/core/src/storage/crypto.ts +101 -0
- package/packages/core/src/storage/db-context.ts +333 -0
- package/packages/core/src/storage/onboarding.ts +1087 -0
- package/packages/core/src/storage/schema.ts +541 -0
- package/packages/core/src/storage/seed.ts +571 -0
- package/packages/core/src/storage/sqlite.ts +387 -0
- package/packages/core/src/storage/usage.ts +212 -0
- package/packages/core/src/tools/bridge-events.ts +74 -0
- package/packages/core/src/tools/browser.ts +275 -0
- package/packages/core/src/tools/codebridge.ts +421 -0
- package/packages/core/src/tools/coordinator-tools.ts +179 -0
- package/packages/core/src/tools/cron.ts +611 -0
- package/packages/core/src/tools/exec.ts +140 -0
- package/packages/core/src/tools/fs.ts +364 -0
- package/packages/core/src/tools/index.ts +12 -0
- package/packages/core/src/tools/memory.ts +176 -0
- package/packages/core/src/tools/notify.ts +113 -0
- package/packages/core/src/tools/project-management.ts +376 -0
- package/packages/core/src/tools/project.ts +375 -0
- package/packages/core/src/tools/read.ts +158 -0
- package/packages/core/src/tools/web.ts +436 -0
- package/packages/core/src/tools/workspace.ts +171 -0
- package/packages/core/src/utils/benchmark.ts +80 -0
- package/packages/core/src/utils/crypto.ts +73 -0
- package/packages/core/src/utils/date.ts +42 -0
- package/packages/core/src/utils/index.ts +4 -0
- package/packages/core/src/utils/logger.ts +388 -0
- package/packages/core/src/utils/retry.ts +70 -0
- package/packages/core/src/voice/index.ts +583 -0
- package/packages/core/tsconfig.json +9 -0
- package/packages/mcp/package.json +26 -0
- package/packages/mcp/src/config.ts +13 -0
- package/packages/mcp/src/index.ts +1 -0
- package/packages/mcp/src/logger.ts +42 -0
- package/packages/mcp/src/manager.ts +434 -0
- package/packages/mcp/src/transports/index.ts +67 -0
- package/packages/mcp/src/transports/sse.ts +241 -0
- package/packages/mcp/src/transports/websocket.ts +159 -0
- package/packages/skills/package.json +21 -0
- package/packages/skills/src/bundled/agent_management/SKILL.md +24 -0
- package/packages/skills/src/bundled/browser_automation/SKILL.md +30 -0
- package/packages/skills/src/bundled/context_compact/SKILL.md +35 -0
- package/packages/skills/src/bundled/cron_manager/SKILL.md +52 -0
- package/packages/skills/src/bundled/file_manager/SKILL.md +76 -0
- package/packages/skills/src/bundled/http_client/SKILL.md +24 -0
- package/packages/skills/src/bundled/memory/SKILL.md +42 -0
- package/packages/skills/src/bundled/project_management/SKILL.md +26 -0
- package/packages/skills/src/bundled/shell/SKILL.md +43 -0
- package/packages/skills/src/bundled/system_notify/SKILL.md +52 -0
- package/packages/skills/src/bundled/voice/SKILL.md +25 -0
- package/packages/skills/src/bundled/web_search/SKILL.md +29 -0
- package/packages/skills/src/index.ts +1 -0
- package/packages/skills/src/loader.ts +282 -0
- package/packages/tools/package.json +43 -0
- package/packages/tools/src/browser/browser.test.ts +111 -0
- package/packages/tools/src/browser/index.ts +272 -0
- package/packages/tools/src/canvas/index.ts +220 -0
- package/packages/tools/src/cron/cron.test.ts +164 -0
- package/packages/tools/src/cron/index.ts +304 -0
- package/packages/tools/src/filesystem/filesystem.test.ts +240 -0
- package/packages/tools/src/filesystem/index.ts +379 -0
- package/packages/tools/src/git/index.ts +239 -0
- package/packages/tools/src/index.ts +4 -0
- package/packages/tools/src/shell/detect-env.ts +70 -0
- package/packages/tools/tsconfig.json +9 -0
|
@@ -0,0 +1,583 @@
|
|
|
1
|
+
import { getDb } from "../storage/sqlite";
|
|
2
|
+
import { decryptApiKey } from "../storage/crypto";
|
|
3
|
+
import { logger } from "../utils/logger";
|
|
4
|
+
|
|
5
|
+
export interface VoiceConfig {
|
|
6
|
+
voiceEnabled: boolean;
|
|
7
|
+
ttsEnabled: boolean;
|
|
8
|
+
sttProvider: string | null;
|
|
9
|
+
ttsProvider: string | null;
|
|
10
|
+
ttsVoiceId: string | null;
|
|
11
|
+
}
|
|
12
|
+
|
|
13
|
+
export interface AudioInput {
|
|
14
|
+
type: "buffer" | "url" | "base64";
|
|
15
|
+
data: Buffer | string;
|
|
16
|
+
mimeType?: string;
|
|
17
|
+
}
|
|
18
|
+
|
|
19
|
+
export interface AudioOutput {
|
|
20
|
+
type: "buffer" | "base64";
|
|
21
|
+
data: Buffer | string;
|
|
22
|
+
mimeType: string;
|
|
23
|
+
}
|
|
24
|
+
|
|
25
|
+
const log = logger.child("voice");
|
|
26
|
+
|
|
27
|
+
class VoiceService {
|
|
28
|
+
private static instance: VoiceService;
|
|
29
|
+
|
|
30
|
+
private constructor() {}
|
|
31
|
+
|
|
32
|
+
static getInstance(): VoiceService {
|
|
33
|
+
if (!VoiceService.instance) {
|
|
34
|
+
VoiceService.instance = new VoiceService();
|
|
35
|
+
}
|
|
36
|
+
return VoiceService.instance;
|
|
37
|
+
}
|
|
38
|
+
|
|
39
|
+
getChannelVoiceConfig(channelId: string): VoiceConfig {
|
|
40
|
+
const db = getDb();
|
|
41
|
+
const result = db.query(`
|
|
42
|
+
SELECT voice_enabled, tts_enabled, stt_provider, tts_provider, tts_voice_id
|
|
43
|
+
FROM channels WHERE id = ?
|
|
44
|
+
`).get(channelId) as {
|
|
45
|
+
voice_enabled: number;
|
|
46
|
+
tts_enabled: number;
|
|
47
|
+
stt_provider: string | null;
|
|
48
|
+
tts_provider: string | null;
|
|
49
|
+
tts_voice_id: string | null;
|
|
50
|
+
} | undefined;
|
|
51
|
+
|
|
52
|
+
if (!result) {
|
|
53
|
+
return {
|
|
54
|
+
voiceEnabled: false,
|
|
55
|
+
ttsEnabled: false,
|
|
56
|
+
sttProvider: null,
|
|
57
|
+
ttsProvider: null,
|
|
58
|
+
ttsVoiceId: null,
|
|
59
|
+
};
|
|
60
|
+
}
|
|
61
|
+
|
|
62
|
+
return {
|
|
63
|
+
voiceEnabled: result.voice_enabled === 1,
|
|
64
|
+
ttsEnabled: result.tts_enabled === 1,
|
|
65
|
+
sttProvider: result.stt_provider,
|
|
66
|
+
ttsProvider: result.tts_provider,
|
|
67
|
+
ttsVoiceId: result.tts_voice_id,
|
|
68
|
+
};
|
|
69
|
+
}
|
|
70
|
+
|
|
71
|
+
async transcribe(audio: AudioInput, modelId: string): Promise<string> {
|
|
72
|
+
const isGroq = modelId.startsWith("whisper");
|
|
73
|
+
const isOpenAi = modelId === "whisper-1";
|
|
74
|
+
|
|
75
|
+
if (isGroq) {
|
|
76
|
+
return this.transcribeWithGroq(audio, modelId);
|
|
77
|
+
} else if (isOpenAi) {
|
|
78
|
+
return this.transcribeWithOpenAIWhisper(audio);
|
|
79
|
+
}
|
|
80
|
+
|
|
81
|
+
log.warn(`Unknown STT provider ${modelId}, defaulting to Groq Whisper`);
|
|
82
|
+
return this.transcribeWithGroq(audio, "whisper-large-v3-turbo");
|
|
83
|
+
}
|
|
84
|
+
|
|
85
|
+
private async getProviderApiKey(providerId: string): Promise<string | null> {
|
|
86
|
+
const db = getDb();
|
|
87
|
+
const provider = db.query(`
|
|
88
|
+
SELECT api_key_encrypted, api_key_iv FROM providers WHERE id = ?
|
|
89
|
+
`).get(providerId) as { api_key_encrypted: string; api_key_iv: string } | undefined;
|
|
90
|
+
|
|
91
|
+
if (!provider?.api_key_encrypted) {
|
|
92
|
+
return null;
|
|
93
|
+
}
|
|
94
|
+
|
|
95
|
+
try {
|
|
96
|
+
return await decryptApiKey(provider.api_key_encrypted, provider.api_key_iv);
|
|
97
|
+
} catch (error) {
|
|
98
|
+
log.error(`Failed to decrypt API key for provider ${providerId}: ${(error as Error).message}`);
|
|
99
|
+
return null;
|
|
100
|
+
}
|
|
101
|
+
}
|
|
102
|
+
|
|
103
|
+
private async transcribeWithGroq(audio: AudioInput, modelId: string): Promise<string> {
|
|
104
|
+
const key = await this.getProviderApiKey("groq") || process.env.GROQ_API_KEY;
|
|
105
|
+
if (!key) {
|
|
106
|
+
throw new Error("GROQ_API_KEY not configured. Configúrala en Proveedores o en las variables de entorno.");
|
|
107
|
+
}
|
|
108
|
+
|
|
109
|
+
let audioData: ArrayBuffer | Uint8Array;
|
|
110
|
+
|
|
111
|
+
if (audio.type === "buffer") {
|
|
112
|
+
audioData = new Uint8Array((audio.data as Buffer));
|
|
113
|
+
} else if (audio.type === "base64") {
|
|
114
|
+
const buf = Buffer.from(audio.data as string, "base64");
|
|
115
|
+
audioData = new Uint8Array(buf);
|
|
116
|
+
} else if (audio.type === "url") {
|
|
117
|
+
const response = await fetch(audio.data as string);
|
|
118
|
+
const ab = await response.arrayBuffer();
|
|
119
|
+
audioData = new Uint8Array(ab);
|
|
120
|
+
} else {
|
|
121
|
+
throw new Error("Invalid audio input type");
|
|
122
|
+
}
|
|
123
|
+
|
|
124
|
+
const blob = new Blob([audioData as BlobPart], { type: audio.mimeType || "audio/ogg" });
|
|
125
|
+
const formData = new FormData();
|
|
126
|
+
formData.append("file", blob, "audio.ogg");
|
|
127
|
+
formData.append("model", modelId);
|
|
128
|
+
formData.append("response_format", "json");
|
|
129
|
+
formData.append("language", "es");
|
|
130
|
+
|
|
131
|
+
const result = await fetch("https://api.groq.com/openai/v1/audio/transcriptions", {
|
|
132
|
+
method: "POST",
|
|
133
|
+
headers: {
|
|
134
|
+
"Authorization": `Bearer ${key}`,
|
|
135
|
+
},
|
|
136
|
+
body: formData,
|
|
137
|
+
});
|
|
138
|
+
|
|
139
|
+
if (!result.ok) {
|
|
140
|
+
const error = await result.text();
|
|
141
|
+
throw new Error(`Groq Whisper transcription failed: ${error}`);
|
|
142
|
+
}
|
|
143
|
+
|
|
144
|
+
const data = await result.json() as { text: string };
|
|
145
|
+
return data.text;
|
|
146
|
+
}
|
|
147
|
+
|
|
148
|
+
private async transcribeWithOpenAIWhisper(audio: AudioInput): Promise<string> {
|
|
149
|
+
const key = await this.getProviderApiKey("openai") || process.env.OPENAI_API_KEY;
|
|
150
|
+
if (!key) {
|
|
151
|
+
throw new Error("OPENAI_API_KEY not configured. Configúrala en Proveedores o en las variables de entorno.");
|
|
152
|
+
}
|
|
153
|
+
|
|
154
|
+
let audioData: ArrayBuffer | Uint8Array;
|
|
155
|
+
|
|
156
|
+
if (audio.type === "buffer") {
|
|
157
|
+
audioData = new Uint8Array(audio.data as Buffer);
|
|
158
|
+
} else if (audio.type === "base64") {
|
|
159
|
+
const buf = Buffer.from(audio.data as string, "base64");
|
|
160
|
+
audioData = new Uint8Array(buf);
|
|
161
|
+
} else if (audio.type === "url") {
|
|
162
|
+
const response = await fetch(audio.data as string);
|
|
163
|
+
const ab = await response.arrayBuffer();
|
|
164
|
+
audioData = new Uint8Array(ab);
|
|
165
|
+
} else {
|
|
166
|
+
throw new Error("Invalid audio input type");
|
|
167
|
+
}
|
|
168
|
+
|
|
169
|
+
const blob = new Blob([audioData as BlobPart], { type: audio.mimeType || "audio/webm" });
|
|
170
|
+
const formData = new FormData();
|
|
171
|
+
formData.append("file", blob, "audio.webm");
|
|
172
|
+
|
|
173
|
+
formData.append("model", "whisper-1");
|
|
174
|
+
formData.append("response_format", "json");
|
|
175
|
+
formData.append("language", "es");
|
|
176
|
+
|
|
177
|
+
const result = await fetch("https://api.openai.com/v1/audio/transcriptions", {
|
|
178
|
+
method: "POST",
|
|
179
|
+
headers: {
|
|
180
|
+
"Authorization": `Bearer ${key}`,
|
|
181
|
+
},
|
|
182
|
+
body: formData,
|
|
183
|
+
});
|
|
184
|
+
|
|
185
|
+
if (!result.ok) {
|
|
186
|
+
const error = await result.text();
|
|
187
|
+
throw new Error(`OpenAI Whisper transcription failed: ${error}`);
|
|
188
|
+
}
|
|
189
|
+
|
|
190
|
+
const data = await result.json() as { text: string };
|
|
191
|
+
return data.text;
|
|
192
|
+
}
|
|
193
|
+
|
|
194
|
+
async speak(text: string, modelId: string, voiceId?: string): Promise<AudioOutput> {
|
|
195
|
+
const isElevenLabs = modelId.startsWith("eleven");
|
|
196
|
+
const isOpenAI = modelId.startsWith("tts-") || modelId.startsWith("gpt-");
|
|
197
|
+
const isGemini = modelId.startsWith("gemini");
|
|
198
|
+
const isQwen = modelId.startsWith("qwen");
|
|
199
|
+
|
|
200
|
+
if (isElevenLabs) {
|
|
201
|
+
return this.speakWithElevenLabs(text, modelId, voiceId);
|
|
202
|
+
} else if (isOpenAI) {
|
|
203
|
+
return this.speakWithOpenAI(text, modelId, voiceId);
|
|
204
|
+
} else if (isGemini) {
|
|
205
|
+
return this.speakWithGemini(text, modelId, voiceId);
|
|
206
|
+
} else if (isQwen) {
|
|
207
|
+
return this.speakWithQwen(text, modelId, voiceId);
|
|
208
|
+
}
|
|
209
|
+
|
|
210
|
+
log.warn(`Unknown TTS provider ${modelId}, defaulting to ElevenLabs Flash`);
|
|
211
|
+
return this.speakWithElevenLabs(text, "eleven_flash_v2_5", voiceId);
|
|
212
|
+
}
|
|
213
|
+
|
|
214
|
+
private async speakWithElevenLabs(text: string, modelId: string, voiceId?: string): Promise<AudioOutput> {
|
|
215
|
+
const apiKey = await this.getProviderApiKey("elevenlabs");
|
|
216
|
+
const key = apiKey || process.env.ELEVENLABS_API_KEY;
|
|
217
|
+
|
|
218
|
+
if (!key) {
|
|
219
|
+
throw new Error("ELEVENLABS_API_KEY not configured");
|
|
220
|
+
}
|
|
221
|
+
|
|
222
|
+
const voice = voiceId || "21m00Tcm4TlvDq8ikWAM";
|
|
223
|
+
|
|
224
|
+
const response = await fetch(`https://api.elevenlabs.io/v1/text-to-speech/${voice}`, {
|
|
225
|
+
method: "POST",
|
|
226
|
+
headers: {
|
|
227
|
+
"Content-Type": "application/json",
|
|
228
|
+
"xi-api-key": key,
|
|
229
|
+
},
|
|
230
|
+
body: JSON.stringify({
|
|
231
|
+
text,
|
|
232
|
+
model_id: modelId,
|
|
233
|
+
voice_settings: {
|
|
234
|
+
stability: 0.5,
|
|
235
|
+
similarity_boost: 0.75,
|
|
236
|
+
},
|
|
237
|
+
}),
|
|
238
|
+
});
|
|
239
|
+
|
|
240
|
+
if (!response.ok) {
|
|
241
|
+
const error = await response.text();
|
|
242
|
+
throw new Error(`ElevenLabs TTS failed: ${error}`);
|
|
243
|
+
}
|
|
244
|
+
|
|
245
|
+
const buffer = await response.arrayBuffer();
|
|
246
|
+
return {
|
|
247
|
+
type: "buffer",
|
|
248
|
+
data: Buffer.from(buffer),
|
|
249
|
+
mimeType: "audio/mpeg",
|
|
250
|
+
};
|
|
251
|
+
}
|
|
252
|
+
|
|
253
|
+
private async speakWithOpenAI(text: string, modelId: string = "gpt-4o-mini-tts", voiceId?: string): Promise<AudioOutput> {
|
|
254
|
+
const apiKey = await this.getProviderApiKey("openai-tts");
|
|
255
|
+
const key = apiKey || process.env.OPENAI_API_KEY;
|
|
256
|
+
|
|
257
|
+
if (!key) {
|
|
258
|
+
throw new Error("OPENAI_API_KEY not configured");
|
|
259
|
+
}
|
|
260
|
+
|
|
261
|
+
const voice = voiceId || "alloy";
|
|
262
|
+
|
|
263
|
+
const response = await fetch("https://api.openai.com/v1/audio/speech", {
|
|
264
|
+
method: "POST",
|
|
265
|
+
headers: {
|
|
266
|
+
"Content-Type": "application/json",
|
|
267
|
+
"Authorization": `Bearer ${key}`,
|
|
268
|
+
},
|
|
269
|
+
body: JSON.stringify({
|
|
270
|
+
model: modelId,
|
|
271
|
+
voice,
|
|
272
|
+
input: text,
|
|
273
|
+
response_format: "mp3",
|
|
274
|
+
}),
|
|
275
|
+
});
|
|
276
|
+
|
|
277
|
+
if (!response.ok) {
|
|
278
|
+
const error = await response.text();
|
|
279
|
+
throw new Error(`OpenAI TTS failed: ${error}`);
|
|
280
|
+
}
|
|
281
|
+
|
|
282
|
+
const buffer = await response.arrayBuffer();
|
|
283
|
+
return {
|
|
284
|
+
type: "buffer",
|
|
285
|
+
data: Buffer.from(buffer),
|
|
286
|
+
mimeType: "audio/mpeg",
|
|
287
|
+
};
|
|
288
|
+
}
|
|
289
|
+
|
|
290
|
+
private async speakWithGemini(text: string, modelId: string, voiceId?: string): Promise<AudioOutput> {
|
|
291
|
+
const key = process.env.GEMINI_API_KEY;
|
|
292
|
+
|
|
293
|
+
if (!key) {
|
|
294
|
+
throw new Error("GEMINI_API_KEY not configured");
|
|
295
|
+
}
|
|
296
|
+
|
|
297
|
+
const voiceName = voiceId || "Aoede";
|
|
298
|
+
|
|
299
|
+
const response = await fetch(`https://generativelanguage.googleapis.com/v1beta/models/${modelId}:generateContent?key=${key}`, {
|
|
300
|
+
method: "POST",
|
|
301
|
+
headers: {
|
|
302
|
+
"Content-Type": "application/json",
|
|
303
|
+
},
|
|
304
|
+
body: JSON.stringify({
|
|
305
|
+
contents: [{
|
|
306
|
+
parts: [{
|
|
307
|
+
text: `Genera audio de este texto: ${text}`,
|
|
308
|
+
}]
|
|
309
|
+
}],
|
|
310
|
+
generationConfig: {
|
|
311
|
+
responseModalities: ["AUDIO"],
|
|
312
|
+
speechConfig: {
|
|
313
|
+
languageCode: "es-ES",
|
|
314
|
+
voiceConfig: {
|
|
315
|
+
prebuiltVoiceConfig: {
|
|
316
|
+
voiceName,
|
|
317
|
+
},
|
|
318
|
+
},
|
|
319
|
+
},
|
|
320
|
+
},
|
|
321
|
+
}),
|
|
322
|
+
});
|
|
323
|
+
|
|
324
|
+
if (!response.ok) {
|
|
325
|
+
const error = await response.text();
|
|
326
|
+
throw new Error(`Gemini TTS failed: ${error}`);
|
|
327
|
+
}
|
|
328
|
+
|
|
329
|
+
const data = await response.json() as { candidates?: Array<{ content?: { parts?: Array<{ inlineData?: { data: string } }> } }> };
|
|
330
|
+
const audioData = data.candidates?.[0]?.content?.parts?.[0]?.inlineData?.data;
|
|
331
|
+
|
|
332
|
+
if (!audioData) {
|
|
333
|
+
throw new Error("No audio returned from Gemini");
|
|
334
|
+
}
|
|
335
|
+
|
|
336
|
+
const buffer = Buffer.from(audioData, "base64");
|
|
337
|
+
return {
|
|
338
|
+
type: "buffer",
|
|
339
|
+
data: buffer,
|
|
340
|
+
mimeType: "audio/mpeg",
|
|
341
|
+
};
|
|
342
|
+
}
|
|
343
|
+
|
|
344
|
+
private async speakWithQwen(text: string, modelId: string, voiceId?: string): Promise<AudioOutput> {
|
|
345
|
+
const key = process.env.DASHSCOPE_API_KEY;
|
|
346
|
+
|
|
347
|
+
if (!key) {
|
|
348
|
+
throw new Error("DASHSCOPE_API_KEY not configured");
|
|
349
|
+
}
|
|
350
|
+
|
|
351
|
+
const voice = voiceId || "ruoxi";
|
|
352
|
+
|
|
353
|
+
const response = await fetch("https://dashscope.aliyuncs.com/api/v1/services/audio/t2a/generation", {
|
|
354
|
+
method: "POST",
|
|
355
|
+
headers: {
|
|
356
|
+
"Content-Type": "application/json",
|
|
357
|
+
"Authorization": `Bearer ${key}`,
|
|
358
|
+
},
|
|
359
|
+
body: JSON.stringify({
|
|
360
|
+
model: modelId,
|
|
361
|
+
input: {
|
|
362
|
+
text,
|
|
363
|
+
},
|
|
364
|
+
parameters: {
|
|
365
|
+
voice,
|
|
366
|
+
format: "mp3",
|
|
367
|
+
},
|
|
368
|
+
}),
|
|
369
|
+
});
|
|
370
|
+
|
|
371
|
+
if (!response.ok) {
|
|
372
|
+
const error = await response.text();
|
|
373
|
+
throw new Error(`Qwen TTS failed: ${error}`);
|
|
374
|
+
}
|
|
375
|
+
|
|
376
|
+
const data = await response.json() as { output?: { audio?: string } };
|
|
377
|
+
const audioData = data.output?.audio;
|
|
378
|
+
|
|
379
|
+
if (!audioData) {
|
|
380
|
+
throw new Error("No audio returned from Qwen");
|
|
381
|
+
}
|
|
382
|
+
|
|
383
|
+
const buffer = Buffer.from(audioData, "base64");
|
|
384
|
+
return {
|
|
385
|
+
type: "buffer",
|
|
386
|
+
data: buffer,
|
|
387
|
+
mimeType: "audio/mpeg",
|
|
388
|
+
};
|
|
389
|
+
}
|
|
390
|
+
|
|
391
|
+
getConfiguredVoiceProviders(): { groq: boolean; elevenlabs: boolean; openai: boolean; gemini: boolean; qwen: boolean } {
|
|
392
|
+
const db = getDb();
|
|
393
|
+
const hasDbKey = (providerId: string): boolean => {
|
|
394
|
+
const row = db.query(
|
|
395
|
+
`SELECT api_key_encrypted FROM providers WHERE id = ? AND api_key_encrypted IS NOT NULL AND api_key_encrypted != ''`
|
|
396
|
+
).get(providerId) as { api_key_encrypted: string } | undefined;
|
|
397
|
+
return !!row;
|
|
398
|
+
};
|
|
399
|
+
|
|
400
|
+
return {
|
|
401
|
+
groq: hasDbKey("groq") || !!(process.env.GROQ_API_KEY),
|
|
402
|
+
elevenlabs: hasDbKey("elevenlabs") || !!(process.env.ELEVENLABS_API_KEY),
|
|
403
|
+
openai: hasDbKey("openai") || !!(process.env.OPENAI_API_KEY),
|
|
404
|
+
gemini: hasDbKey("gemini") || !!(process.env.GEMINI_API_KEY),
|
|
405
|
+
qwen: hasDbKey("qwen") || !!(process.env.DASHSCOPE_API_KEY),
|
|
406
|
+
};
|
|
407
|
+
}
|
|
408
|
+
|
|
409
|
+
getOpenAIVoices(): Array<{ id: string; name: string }> {
|
|
410
|
+
return [
|
|
411
|
+
{ id: "alloy", name: "Alloy" },
|
|
412
|
+
{ id: "echo", name: "Echo" },
|
|
413
|
+
{ id: "fable", name: "Fable" },
|
|
414
|
+
{ id: "onyx", name: "Onyx" },
|
|
415
|
+
{ id: "nova", name: "Nova" },
|
|
416
|
+
{ id: "shimmer", name: "Shimmer" },
|
|
417
|
+
{ id: "ash", name: "Ash" },
|
|
418
|
+
{ id: "ballad", name: "Ballad" },
|
|
419
|
+
{ id: "coral", name: "Coral" },
|
|
420
|
+
{ id: "sage", name: "Sage" },
|
|
421
|
+
{ id: "verse", name: "Verse" },
|
|
422
|
+
];
|
|
423
|
+
}
|
|
424
|
+
|
|
425
|
+
getGeminiVoices(): Array<{ id: string; name: string }> {
|
|
426
|
+
return [
|
|
427
|
+
{ id: "Puck", name: "Puck" },
|
|
428
|
+
{ id: "Charon", name: "Charon" },
|
|
429
|
+
{ id: "Kore", name: "Kore" },
|
|
430
|
+
{ id: "Fenrir", name: "Fenrir" },
|
|
431
|
+
{ id: "Aoede", name: "Aoede" },
|
|
432
|
+
{ id: "Orbit", name: "Orbit" },
|
|
433
|
+
{ id: "Zephyr", name: "Zephyr" },
|
|
434
|
+
{ id: "Autonoe", name: "Autonoe" },
|
|
435
|
+
{ id: "Enceladus", name: "Enceladus" },
|
|
436
|
+
{ id: "Iapetus", name: "Iapetus" },
|
|
437
|
+
{ id: "Umbriel", name: "Umbriel" },
|
|
438
|
+
{ id: "Algieba", name: "Algieba" },
|
|
439
|
+
{ id: "Despina", name: "Despina" },
|
|
440
|
+
{ id: "Erinome", name: "Erinome" },
|
|
441
|
+
{ id: "Laomedeia", name: "Laomedeia" },
|
|
442
|
+
{ id: "Achernar", name: "Achernar" },
|
|
443
|
+
{ id: "Rasalgethi", name: "Rasalgethi" },
|
|
444
|
+
{ id: "Schedar", name: "Schedar" },
|
|
445
|
+
{ id: "Sulafat", name: "Sulafat" },
|
|
446
|
+
{ id: "Vindemiatrix", name: "Vindemiatrix" },
|
|
447
|
+
{ id: "Zubenelgenubi", name: "Zubenelgenubi" },
|
|
448
|
+
{ id: "Pulcherrima", name: "Pulcherrima" },
|
|
449
|
+
{ id: "Achird", name: "Achird" },
|
|
450
|
+
{ id: "Zubeneschamali", name: "Zubeneschamali" },
|
|
451
|
+
{ id: "Sadachbia", name: "Sadachbia" },
|
|
452
|
+
{ id: "Sadaltager", name: "Sadaltager" },
|
|
453
|
+
{ id: "Sheratan", name: "Sheratan" },
|
|
454
|
+
];
|
|
455
|
+
}
|
|
456
|
+
|
|
457
|
+
getQwenVoices(): Array<{ id: string; name: string }> {
|
|
458
|
+
return [
|
|
459
|
+
{ id: "ruoxi", name: "Ruoxi (F, Chinese)" },
|
|
460
|
+
{ id: "longhua", name: "Longhua (M, Chinese)" },
|
|
461
|
+
{ id: "lingli", name: "Lingli (F, Chinese)" },
|
|
462
|
+
{ id: "zhiyan", name: "Zhiyan (F, Chinese)" },
|
|
463
|
+
{ id: "aicheng", name: "Aicheng (F, Chinese)" },
|
|
464
|
+
{ id: "aida", name: "Aida (F, Chinese)" },
|
|
465
|
+
{ id: "yucheng", name: "Yucheng (M, Chinese)" },
|
|
466
|
+
{ id: "yijia", name: "Yijia (F, Chinese)" },
|
|
467
|
+
{ id: "yinan", name: "Yinan (M, Chinese)" },
|
|
468
|
+
{ id: "sijia", name: "Sijia (F, Chinese)" },
|
|
469
|
+
{ id: "sicheng", name: "Sicheng (M, Chinese)" },
|
|
470
|
+
{ id: "siqi", name: "Siqi (F, Chinese)" },
|
|
471
|
+
{ id: "aixia", name: "Aixia (F, Chinese)" },
|
|
472
|
+
];
|
|
473
|
+
}
|
|
474
|
+
|
|
475
|
+
async getElevenLabsVoices(): Promise<Array<{ id: string; name: string; category: string }>> {
|
|
476
|
+
const apiKey = await this.getProviderApiKey("elevenlabs");
|
|
477
|
+
const key = apiKey || process.env.ELEVENLABS_API_KEY;
|
|
478
|
+
|
|
479
|
+
if (!key) {
|
|
480
|
+
throw new Error("ELEVENLABS_API_KEY not configured");
|
|
481
|
+
}
|
|
482
|
+
|
|
483
|
+
const response = await fetch("https://api.elevenlabs.io/v1/voices", {
|
|
484
|
+
headers: {
|
|
485
|
+
"xi-api-key": key,
|
|
486
|
+
},
|
|
487
|
+
});
|
|
488
|
+
|
|
489
|
+
if (!response.ok) {
|
|
490
|
+
const error = await response.text();
|
|
491
|
+
throw new Error(`Failed to fetch ElevenLabs voices: ${error}`);
|
|
492
|
+
}
|
|
493
|
+
|
|
494
|
+
const data = await response.json() as { voices: Array<{ voice_id: string; name: string; category: string }> };
|
|
495
|
+
return data.voices.map(v => ({
|
|
496
|
+
id: v.voice_id,
|
|
497
|
+
name: v.name,
|
|
498
|
+
category: v.category,
|
|
499
|
+
}));
|
|
500
|
+
}
|
|
501
|
+
|
|
502
|
+
normalizeAudioFromChannel(channelType: string, audioData: unknown): AudioInput {
|
|
503
|
+
switch (channelType) {
|
|
504
|
+
case "telegram":
|
|
505
|
+
return this.normalizeTelegramAudio(audioData);
|
|
506
|
+
case "discord":
|
|
507
|
+
return this.normalizeDiscordAudio(audioData);
|
|
508
|
+
case "whatsapp":
|
|
509
|
+
return this.normalizeWhatsAppAudio(audioData);
|
|
510
|
+
case "slack":
|
|
511
|
+
return this.normalizeSlackAudio(audioData);
|
|
512
|
+
case "webchat":
|
|
513
|
+
return this.normalizeWebChatAudio(audioData);
|
|
514
|
+
default:
|
|
515
|
+
throw new Error(`Unknown channel type: ${channelType}`);
|
|
516
|
+
}
|
|
517
|
+
}
|
|
518
|
+
|
|
519
|
+
private normalizeTelegramAudio(audioData: unknown): AudioInput {
|
|
520
|
+
const data = audioData as { fileId?: string; buffer?: Buffer; url?: string };
|
|
521
|
+
|
|
522
|
+
if (data.buffer) {
|
|
523
|
+
return { type: "buffer", data: data.buffer, mimeType: "audio/ogg" };
|
|
524
|
+
}
|
|
525
|
+
if (data.url) {
|
|
526
|
+
return { type: "url", data: data.url, mimeType: "audio/ogg" };
|
|
527
|
+
}
|
|
528
|
+
throw new Error("Telegram audio missing buffer or URL");
|
|
529
|
+
}
|
|
530
|
+
|
|
531
|
+
private normalizeDiscordAudio(audioData: unknown): AudioInput {
|
|
532
|
+
const data = audioData as { buffer?: Buffer; url?: string; mimeType?: string };
|
|
533
|
+
|
|
534
|
+
if (data.buffer) {
|
|
535
|
+
return { type: "buffer", data: data.buffer, mimeType: data.mimeType || "audio/webm" };
|
|
536
|
+
}
|
|
537
|
+
if (data.url) {
|
|
538
|
+
return { type: "url", data: data.url, mimeType: data.mimeType || "audio/webm" };
|
|
539
|
+
}
|
|
540
|
+
throw new Error("Discord audio missing buffer or URL");
|
|
541
|
+
}
|
|
542
|
+
|
|
543
|
+
private normalizeWhatsAppAudio(audioData: unknown): AudioInput {
|
|
544
|
+
const data = audioData as { mediaId?: string; buffer?: Buffer; url?: string };
|
|
545
|
+
|
|
546
|
+
if (data.buffer) {
|
|
547
|
+
return { type: "buffer", data: data.buffer, mimeType: "audio/ogg" };
|
|
548
|
+
}
|
|
549
|
+
if (data.url) {
|
|
550
|
+
return { type: "url", data: data.url, mimeType: "audio/ogg" };
|
|
551
|
+
}
|
|
552
|
+
if (data.mediaId) {
|
|
553
|
+
return { type: "url", data: `https://wa.me/${data.mediaId}`, mimeType: "audio/ogg" };
|
|
554
|
+
}
|
|
555
|
+
throw new Error("WhatsApp audio missing buffer, URL, or mediaId");
|
|
556
|
+
}
|
|
557
|
+
|
|
558
|
+
private normalizeSlackAudio(audioData: unknown): AudioInput {
|
|
559
|
+
const data = audioData as { buffer?: Buffer; url?: string; mimeType?: string };
|
|
560
|
+
|
|
561
|
+
if (data.buffer) {
|
|
562
|
+
return { type: "buffer", data: data.buffer, mimeType: data.mimeType || "audio/webm" };
|
|
563
|
+
}
|
|
564
|
+
if (data.url) {
|
|
565
|
+
return { type: "url", data: data.url, mimeType: data.mimeType || "audio/webm" };
|
|
566
|
+
}
|
|
567
|
+
throw new Error("Slack audio missing buffer or URL");
|
|
568
|
+
}
|
|
569
|
+
|
|
570
|
+
private normalizeWebChatAudio(audioData: unknown): AudioInput {
|
|
571
|
+
const data = audioData as { base64?: string; buffer?: Buffer };
|
|
572
|
+
|
|
573
|
+
if (data.base64) {
|
|
574
|
+
return { type: "base64", data: data.base64, mimeType: "audio/webm" };
|
|
575
|
+
}
|
|
576
|
+
if (data.buffer) {
|
|
577
|
+
return { type: "buffer", data: data.buffer, mimeType: "audio/webm" };
|
|
578
|
+
}
|
|
579
|
+
throw new Error("WebChat audio missing base64 or buffer");
|
|
580
|
+
}
|
|
581
|
+
}
|
|
582
|
+
|
|
583
|
+
export const voiceService = VoiceService.getInstance();
|
|
@@ -0,0 +1,26 @@
|
|
|
1
|
+
{
|
|
2
|
+
"name": "@johpaz/hive-mcp",
|
|
3
|
+
"version": "1.1.0",
|
|
4
|
+
"private": true,
|
|
5
|
+
"description": "Hive MCP Client — Model Context Protocol client layer",
|
|
6
|
+
"main": "./src/index.ts",
|
|
7
|
+
"license": "MIT",
|
|
8
|
+
"files": [
|
|
9
|
+
"src/"
|
|
10
|
+
],
|
|
11
|
+
"scripts": {
|
|
12
|
+
"test": "bun test"
|
|
13
|
+
},
|
|
14
|
+
"dependencies": {
|
|
15
|
+
"@modelcontextprotocol/sdk": "latest",
|
|
16
|
+
"zod": "latest"
|
|
17
|
+
},
|
|
18
|
+
"devDependencies": {
|
|
19
|
+
"typescript": "latest",
|
|
20
|
+
"@types/bun": "latest"
|
|
21
|
+
},
|
|
22
|
+
"exports": {
|
|
23
|
+
".": "./src/index.ts",
|
|
24
|
+
"./transports": "./src/transports/index.ts"
|
|
25
|
+
}
|
|
26
|
+
}
|
|
@@ -0,0 +1,13 @@
|
|
|
1
|
+
export interface MCPConfig {
|
|
2
|
+
servers?: Record<string, MCPServerConfig>;
|
|
3
|
+
}
|
|
4
|
+
|
|
5
|
+
export interface MCPServerConfig {
|
|
6
|
+
transport: "stdio" | "sse" | "websocket";
|
|
7
|
+
enabled?: boolean;
|
|
8
|
+
command?: string;
|
|
9
|
+
args?: string[];
|
|
10
|
+
env?: Record<string, string>;
|
|
11
|
+
url?: string;
|
|
12
|
+
headers?: Record<string, string>;
|
|
13
|
+
}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
export * from "./manager.ts";
|
|
@@ -0,0 +1,42 @@
|
|
|
1
|
+
export type LogLevel = "debug" | "info" | "warn" | "error";
|
|
2
|
+
export type LogHandler = (level: LogLevel, context: string, message: string, data?: Record<string, unknown>) => void;
|
|
3
|
+
|
|
4
|
+
class Logger {
|
|
5
|
+
private context: string;
|
|
6
|
+
private level: LogLevel = "info";
|
|
7
|
+
private handler: LogHandler | null = null;
|
|
8
|
+
|
|
9
|
+
constructor(context: string, handler: LogHandler | null = null) {
|
|
10
|
+
this.context = context;
|
|
11
|
+
this.handler = handler;
|
|
12
|
+
}
|
|
13
|
+
|
|
14
|
+
setHandler(handler: LogHandler | null): void {
|
|
15
|
+
this.handler = handler;
|
|
16
|
+
}
|
|
17
|
+
|
|
18
|
+
private log(level: LogLevel, message: string, data?: Record<string, unknown>): void {
|
|
19
|
+
if (this.handler) {
|
|
20
|
+
this.handler(level, this.context, message, data);
|
|
21
|
+
return;
|
|
22
|
+
}
|
|
23
|
+
|
|
24
|
+
// Silent by default if no handler is set, to avoid standard console pollution.
|
|
25
|
+
// The consumer (e.g., Hive Agent) should set a handler to bridge these logs.
|
|
26
|
+
}
|
|
27
|
+
|
|
28
|
+
debug(message: string, data?: Record<string, unknown>): void { this.log("debug", message, data); }
|
|
29
|
+
info(message: string, data?: Record<string, unknown>): void { this.log("info", message, data); }
|
|
30
|
+
warn(message: string, data?: Record<string, unknown>): void { this.log("warn", message, data); }
|
|
31
|
+
error(message: string, data?: Record<string, unknown>): void { this.log("error", message, data); }
|
|
32
|
+
|
|
33
|
+
child(context: string): Logger {
|
|
34
|
+
return new Logger(`${this.context}:${context}`, this.handler);
|
|
35
|
+
}
|
|
36
|
+
|
|
37
|
+
setLevel(level: LogLevel): void {
|
|
38
|
+
this.level = level;
|
|
39
|
+
}
|
|
40
|
+
}
|
|
41
|
+
|
|
42
|
+
export const logger = new Logger("mcp");
|