npm - @iletai/nzb - Versions diffs - 1.3.3 → 1.3.4 - Mend

@iletai/nzb 1.3.3 → 1.3.4

This diff compares the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.

Files changed (4) hide show

package/dist/config.js CHANGED Viewed

@@ -14,6 +14,7 @@ const configSchema = z.object({
     SHOW_REASONING: z.string().optional(),
     LOG_CHANNEL_ID: z.string().optional(),
     NODE_EXTRA_CA_CERTS: z.string().optional(),
+    OPENAI_API_KEY: z.string().optional(),
 });
 const raw = configSchema.parse(process.env);
 // Apply NODE_EXTRA_CA_CERTS from .env if not already set via environment.
@@ -43,6 +44,7 @@ export const config = {
     apiPort: parsedPort,
     logChannelId: parsedLogChannelId,
     workerTimeoutMs: parsedWorkerTimeout,
+    openaiApiKey: raw.OPENAI_API_KEY,
     get copilotModel() {
         return _copilotModel;
     },

package/dist/setup.js CHANGED Viewed

@@ -215,6 +215,20 @@ ${BOLD}╔═══════════════════════
     else {
         console.log(`\n${DIM}  Skipping Google. You can always set it up later with: nzb setup${RESET}\n`);
     }
+    // ── Voice / Whisper Setup ────────────────────────────────
+    console.log(`${BOLD}━━━ Voice Message Setup (optional) ━━━${RESET}\n`);
+    console.log(`NZB can transcribe voice messages using OpenAI's Whisper API.`);
+    console.log(`You need an OpenAI API key from ${CYAN}https://platform.openai.com/api-keys${RESET}`);
+    console.log();
+    const existingOpenaiKey = existing.OPENAI_API_KEY;
+    const openaiKey = await ask(rl, `  OpenAI API Key ${existingOpenaiKey ? `${DIM}(Enter to keep existing)${RESET}` : `${DIM}(Enter to skip)${RESET}`}: `);
+    const finalOpenaiKey = openaiKey.trim() || existingOpenaiKey || "";
+    if (finalOpenaiKey) {
+        console.log(`\n${GREEN}  ✓ Whisper transcription enabled${RESET}\n`);
+    }
+    else {
+        console.log(`\n${DIM}  Skipping voice. Voice messages will be saved but not transcribed.${RESET}\n`);
+    }
     // ── Model picker ─────────────────────────────────────────
     console.log(`\n${BOLD}━━━ Default Model ━━━${RESET}\n`);
     console.log(`${DIM}Fetching available models from Copilot...${RESET}`);
@@ -241,6 +255,8 @@ ${BOLD}╔═══════════════════════
         lines.push(`AUTHORIZED_USER_ID=${userId}`);
     lines.push(`API_PORT=${apiPort}`);
     lines.push(`COPILOT_MODEL=${model}`);
+    if (finalOpenaiKey)
+        lines.push(`OPENAI_API_KEY=${finalOpenaiKey}`);
     writeFileSync(ENV_PATH, lines.join("\n") + "\n");
     // ── Done ─────────────────────────────────────────────────
     console.log(`

package/dist/telegram/bot.js CHANGED Viewed

@@ -736,6 +736,110 @@ export function createBot() {
             });
         }
     });
+    // Handle voice messages — download, transcribe via Whisper, send to AI
+    bot.on("message:voice", async (ctx) => {
+        const chatId = ctx.chat.id;
+        const userMessageId = ctx.message.message_id;
+        const duration = ctx.message.voice.duration;
+        void logInfo(`🎤 Voice received: ${duration}s`);
+        try {
+            await ctx.react("👀");
+        }
+        catch { }
+        // Limit voice duration to 5 minutes
+        if (duration > 300) {
+            await ctx.reply("❌ Voice too long (max 5 min).", { reply_parameters: { message_id: userMessageId } });
+            return;
+        }
+        try {
+            const file = await ctx.api.getFile(ctx.message.voice.file_id);
+            const filePath = file.file_path;
+            if (!filePath) {
+                await ctx.reply("❌ Could not download voice.", { reply_parameters: { message_id: userMessageId } });
+                return;
+            }
+            const url = `https://api.telegram.org/file/bot${config.telegramBotToken}/${filePath}`;
+            const { mkdtempSync, writeFileSync } = await import("fs");
+            const { join } = await import("path");
+            const { tmpdir } = await import("os");
+            const tmpDir = mkdtempSync(join(tmpdir(), "nzb-voice-"));
+            const ext = filePath.split(".").pop() || "oga";
+            const localPath = join(tmpDir, `voice.${ext}`);
+            const response = await fetch(url);
+            const buffer = Buffer.from(await response.arrayBuffer());
+            writeFileSync(localPath, buffer);
+            let prompt;
+            if (config.openaiApiKey) {
+                // Transcribe using OpenAI Whisper API
+                try {
+                    const formData = new FormData();
+                    formData.append("file", new Blob([buffer], { type: "audio/ogg" }), `voice.${ext}`);
+                    formData.append("model", "whisper-1");
+                    const whisperResp = await fetch("https://api.openai.com/v1/audio/transcriptions", {
+                        method: "POST",
+                        headers: { Authorization: `Bearer ${config.openaiApiKey}` },
+                        body: formData,
+                    });
+                    if (!whisperResp.ok) {
+                        const errText = await whisperResp.text();
+                        throw new Error(`Whisper API ${whisperResp.status}: ${errText.slice(0, 200)}`);
+                    }
+                    const result = (await whisperResp.json());
+                    const transcript = result.text?.trim();
+                    if (!transcript) {
+                        prompt = `[User sent a voice message (${duration}s) but transcription was empty. File saved at: ${localPath}]`;
+                    }
+                    else {
+                        prompt = `[Voice message transcribed (${duration}s)]: ${transcript}`;
+                    }
+                }
+                catch (whisperErr) {
+                    console.error("[nzb] Whisper transcription failed:", whisperErr instanceof Error ? whisperErr.message : whisperErr);
+                    prompt = `[User sent a voice message (${duration}s), saved at: ${localPath}. Transcription failed: ${whisperErr instanceof Error ? whisperErr.message : String(whisperErr)}]`;
+                }
+            }
+            else {
+                prompt = `[User sent a voice message (${duration}s), saved at: ${localPath}. No OPENAI_API_KEY configured for transcription. You can tell the user to set it up in ~/.nzb/.env]`;
+            }
+            sendToOrchestrator(prompt, { type: "telegram", chatId, messageId: userMessageId }, (text, done) => {
+                if (done) {
+                    const formatted = toTelegramMarkdown(text);
+                    const chunks = chunkMessage(formatted);
+                    const fallbackChunks = chunkMessage(text);
+                    void (async () => {
+                        for (let i = 0; i < chunks.length; i++) {
+                            if (i > 0)
+                                await new Promise((r) => setTimeout(r, 300));
+                            const pageTag = chunks.length > 1 ? `📄 ${i + 1}/${chunks.length}\n` : "";
+                            try {
+                                await ctx.api.sendMessage(chatId, pageTag + chunks[i], {
+                                    parse_mode: "MarkdownV2",
+                                    reply_parameters: i === 0 ? { message_id: userMessageId } : undefined,
+                                });
+                            }
+                            catch {
+                                try {
+                                    await ctx.api.sendMessage(chatId, pageTag + (fallbackChunks[i] ?? chunks[i]), {
+                                        reply_parameters: i === 0 ? { message_id: userMessageId } : undefined,
+                                    });
+                                }
+                                catch { }
+                            }
+                        }
+                        try {
+                            await ctx.api.setMessageReaction(chatId, userMessageId, [{ type: "emoji", emoji: "👍" }]);
+                        }
+                        catch { }
+                    })();
+                }
+            });
+        }
+        catch (err) {
+            await ctx.reply(`❌ Error processing voice: ${err instanceof Error ? err.message : String(err)}`, {
+                reply_parameters: { message_id: userMessageId },
+            });
+        }
+    });
     return bot;
 }
 export async function startBot() {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
 	"name": "@iletai/nzb",
-	"version": "1.3.3",
+	"version": "1.3.4",
 	"description": "NZB — a personal AI assistant for developers, built on the GitHub Copilot SDK",
 	"bin": {
 		"nzb": "dist/cli.js"