npm - @luanpoppe/ai - Versions diffs - 1.0.8 → 1.0.10 - Mend

@luanpoppe/ai 1.0.8 → 1.0.10

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (24) hide show

package/dist/@types/audio.d.ts +1 -0
package/dist/@types/audio.d.ts.map +1 -1
package/dist/@types/audio.js +15 -0
package/dist/@types/audio.js.map +1 -1
package/dist/index.d.ts +3 -3
package/dist/index.d.ts.map +1 -1
package/dist/langchain/audio-transcription.d.ts +8 -3
package/dist/langchain/audio-transcription.d.ts.map +1 -1
package/dist/langchain/audio-transcription.js +49 -42
package/dist/langchain/audio-transcription.js.map +1 -1
package/dist/langchain/messages.js +1 -1
package/dist/langchain/messages.js.map +1 -1
package/dist/utils/files-utils.d.ts +2 -2
package/dist/utils/files-utils.d.ts.map +1 -1
package/dist/utils/files-utils.js +10 -2
package/dist/utils/files-utils.js.map +1 -1
package/docs/LANGCHAIN_WHISPER_WINDOWS_BUG.md +209 -0
package/package.json +2 -1
package/src/@types/audio.ts +15 -0
package/src/index.ts +5 -2
package/src/langchain/audio-transcription.ts +69 -46
package/src/langchain/messages.ts +1 -1
package/src/utils/files-utils.ts +16 -3
package/tests/unit/langchain/audio-transcription.test.ts +137 -244

package/dist/@types/audio.d.ts CHANGED Viewed

@@ -1,3 +1,4 @@
 export type AudioBuffer = Buffer | ArrayBuffer | Uint8Array;
 export type AudioMimeType = "audio/mpeg" | "audio/mp3" | "audio/wav" | "audio/wave" | "audio/x-wav" | "audio/mp4" | "audio/m4a" | "audio/webm" | "audio/ogg" | "audio/flac" | "audio/aac" | "audio/opus";
+export declare const MIME_TO_EXTENSION: Record<AudioMimeType, string>;
 //# sourceMappingURL=audio.d.ts.map

package/dist/@types/audio.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"audio.d.ts","sourceRoot":"","sources":["../../src/@types/audio.ts"],"names":[],"mappings":"AAAA,MAAM,MAAM,WAAW,GAAG,MAAM,GAAG,WAAW,GAAG,UAAU,CAAC;AAE5D,MAAM,MAAM,aAAa,GACrB,YAAY,GACZ,WAAW,GACX,WAAW,GACX,YAAY,GACZ,aAAa,GACb,WAAW,GACX,WAAW,GACX,YAAY,GACZ,WAAW,GACX,YAAY,GACZ,WAAW,GACX,YAAY,CAAC"}
1	+ {"version":3,"file":"audio.d.ts","sourceRoot":"","sources":["../../src/@types/audio.ts"],"names":[],"mappings":"AAAA,MAAM,MAAM,WAAW,GAAG,MAAM,GAAG,WAAW,GAAG,UAAU,CAAC;AAE5D,MAAM,MAAM,aAAa,GACrB,YAAY,GACZ,WAAW,GACX,WAAW,GACX,YAAY,GACZ,aAAa,GACb,WAAW,GACX,WAAW,GACX,YAAY,GACZ,WAAW,GACX,YAAY,GACZ,WAAW,GACX,YAAY,CAAC;AAEjB,eAAO,MAAM,iBAAiB,EAAE,MAAM,CAAC,aAAa,EAAE,MAAM,CAa3D,CAAC"}

package/dist/@types/audio.js CHANGED Viewed

@@ -1,3 +1,18 @@
 "use strict";
 Object.defineProperty(exports, "__esModule", { value: true });
+exports.MIME_TO_EXTENSION = void 0;
+exports.MIME_TO_EXTENSION = {
+    "audio/mpeg": "mp3",
+    "audio/mp3": "mp3",
+    "audio/wav": "wav",
+    "audio/wave": "wav",
+    "audio/x-wav": "wav",
+    "audio/mp4": "mp4",
+    "audio/m4a": "m4a",
+    "audio/webm": "webm",
+    "audio/ogg": "ogg",
+    "audio/flac": "flac",
+    "audio/aac": "aac",
+    "audio/opus": "opus",
+};
 //# sourceMappingURL=audio.js.map

package/dist/@types/audio.js.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"audio.js","sourceRoot":"","sources":["../../src/@types/audio.ts"],"names":[],"mappings":""}
1	+ {"version":3,"file":"audio.js","sourceRoot":"","sources":["../../src/@types/audio.ts"],"names":[],"mappings":";;;AAgBa,QAAA,iBAAiB,GAAkC;IAC9D,YAAY,EAAE,KAAK;IACnB,WAAW,EAAE,KAAK;IAClB,WAAW,EAAE,KAAK;IAClB,YAAY,EAAE,KAAK;IACnB,aAAa,EAAE,KAAK;IACpB,WAAW,EAAE,KAAK;IAClB,WAAW,EAAE,KAAK;IAClB,YAAY,EAAE,MAAM;IACpB,WAAW,EAAE,KAAK;IAClB,YAAY,EAAE,MAAM;IACpB,WAAW,EAAE,KAAK;IAClB,YAAY,EAAE,MAAM;CACrB,CAAC"}

package/dist/index.d.ts CHANGED Viewed

@@ -2,7 +2,7 @@ import { LangchainModels, LLMModelConfig } from "./langchain/models";
 import { AIModelNames } from "./@types/model-names";
 import z from "zod";
 import { MessageInput } from "./langchain/messages";
-import { AgentMiddleware, BaseMessage } from "langchain";
+import { AgentMiddleware, BaseMessage, createAgent } from "langchain";
 import { ClientTool, ServerTool } from "@langchain/core/tools";
 import { LangchainMessages } from "./langchain/messages";
 import { LangchainTools } from "./langchain/tools";
@@ -44,7 +44,7 @@ export declare class Langchain {
      */
     private normalizeSchemaForOpenAI;
     getRawAgent(params: LangchainCallParams, outputSchema?: z.ZodSchema | undefined): {
-        agent: import("langchain").ReactAgent<import("langchain").AgentTypeConfig<Record<string, any>, import("@langchain/core/utils/types").InteropZodObject | import("langchain").AnyAnnotationRoot | undefined, import("@langchain/core/utils/types").InteropZodObject | import("langchain").AnyAnnotationRoot, readonly AgentMiddleware<any, any, any, readonly (ClientTool | ServerTool)[]>[], readonly (ClientTool | ServerTool)[]>>;
+        agent: ReturnType<typeof createAgent>;
     };
     private getModel;
     private standardAgent;
@@ -55,5 +55,5 @@ export { LangchainAudioTranscription } from "./langchain/audio-transcription";
 export { AudioUtils } from "./utils/audio-utils";
 export type { AudioBuffer, AudioMimeType } from "./@types/audio";
 export type { AudioContentBlock, HumanMessageWithAudioOptions, } from "./langchain/messages";
-export type { WhisperTranscriptionOptions } from "./langchain/audio-transcription";
+export type { WhisperModel, WhisperTranscriptionOptions, } from "./langchain/audio-transcription";
 //# sourceMappingURL=index.d.ts.map

package/dist/index.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../src/index.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,eAAe,EAAE,cAAc,EAAE,MAAM,oBAAoB,CAAC;AACrE,OAAO,EAAE,YAAY,EAAE,MAAM,sBAAsB,CAAC;AACpD,OAAO,CAAC,MAAM,KAAK,CAAC;AACpB,OAAO,EAAE,YAAY,EAAE,MAAM,sBAAsB,CAAC;AACpD,OAAO,EACL,eAAe,EACf,WAAW,~~EAIZ~~,MAAM,WAAW,CAAC;AACnB,OAAO,EAAE,UAAU,EAAE,UAAU,EAAE,MAAM,uBAAuB,CAAC;AAC/D,OAAO,EAAE,iBAAiB,EAAE,MAAM,sBAAsB,CAAC;AACzD,OAAO,EAAE,cAAc,EAAE,MAAM,mBAAmB,CAAC;AAEnD,KAAK,oBAAoB,GAAG;IAC1B,iBAAiB,CAAC,EAAE,MAAM,CAAC;IAC3B,YAAY,CAAC,EAAE,MAAM,CAAC;IACtB,gBAAgB,CAAC,EAAE,MAAM,CAAC;CAC3B,CAAC;AAEF,MAAM,MAAM,mBAAmB,GAAG;IAChC,KAAK,CAAC,EAAE;QACN,UAAU,CAAC,EAAE,eAAe,EAAE,CAAC;QAC/B,KAAK,CAAC,EAAE,CAAC,UAAU,GAAG,UAAU,CAAC,EAAE,CAAC;KACrC,CAAC;IAEF,WAAW,CAAC,EAAE,IAAI,CAAC,cAAc,EAAE,QAAQ,GAAG,OAAO,CAAC,CAAC;IAEvD,OAAO,EAAE,YAAY,CAAC;IACtB,QAAQ,EAAE,YAAY,EAAE,CAAC;IACzB,YAAY,CAAC,EAAE,MAAM,CAAC;IACtB,UAAU,CAAC,EAAE,MAAM,CAAC;CACrB,CAAC;AAEF,MAAM,MAAM,mBAAmB,GAAG,OAAO,CAAC;IACxC,IAAI,EAAE,MAAM,CAAC;IACb,QAAQ,EAAE,WAAW,EAAE,CAAC;CACzB,CAAC,CAAC;AAEH,MAAM,MAAM,mCAAmC,CAAC,CAAC,SAAS,CAAC,CAAC,SAAS,IACnE,mBAAmB,GAAG;IACpB,YAAY,EAAE,CAAC,CAAC;CACjB,CAAC;AAEJ,MAAM,MAAM,mCAAmC,CAAC,CAAC,IAAI,OAAO,CAAC;IAC3D,QAAQ,EAAE,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC;CACtB,CAAC,CAAC;AAEH,qBAAa,SAAS;IACR,OAAO,CAAC,MAAM;gBAAN,MAAM,EAAE,oBAAoB;IAE1C,IAAI,CAAC,MAAM,EAAE,mBAAmB,GAAG,mBAAmB;IAiBtD,oBAAoB,CAAC,CAAC,SAAS,CAAC,CAAC,SAAS,EAC9C,MAAM,EAAE,mCAAmC,CAAC,CAAC,CAAC,GAC7C,mCAAmC,CAAC,OAAO,MAAM,CAAC,YAAY,CAAC;IAwBlE;;;;OAIG;IACH,OAAO,CAAC,wBAAwB;IAoChC,WAAW,CACT,MAAM,EAAE,mBAAmB,EAC3B,YAAY,CAAC,EAAE,CAAC,CAAC,SAAS,GAAG,SAAS~~;;;IAUxC~~,OAAO,CAAC,QAAQ;IAiChB,OAAO,CAAC,aAAa;IAkBrB,OAAO,CAAC,mBAAmB;CAU5B;AAED,OAAO,EAAE,eAAe,EAAE,iBAAiB,EAAE,cAAc,EAAE,CAAC;AAC9D,OAAO,EAAE,2BAA2B,EAAE,MAAM,iCAAiC,CAAC;AAC9E,OAAO,EAAE,UAAU,EAAE,MAAM,qBAAqB,CAAC;AACjD,YAAY,EAAE,WAAW,EAAE,aAAa,EAAE,MAAM,gBAAgB,CAAC;AACjE,YAAY,EACV,iBAAiB,EACjB,4BAA4B,GAC7B,MAAM,sBAAsB,CAAC;AAC9B,YAAY,~~EAAE~~,2BAA2B,~~EAAE~~,MAAM,iCAAi
C,CAAC"}
1	+ {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../src/index.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,eAAe,EAAE,cAAc,EAAE,MAAM,oBAAoB,CAAC;AACrE,OAAO,EAAE,YAAY,EAAE,MAAM,sBAAsB,CAAC;AACpD,OAAO,CAAC,MAAM,KAAK,CAAC;AACpB,OAAO,EAAE,YAAY,EAAE,MAAM,sBAAsB,CAAC;AACpD,OAAO,EACL,eAAe,EACf,WAAW,EACX,WAAW,EAGZ,MAAM,WAAW,CAAC;AACnB,OAAO,EAAE,UAAU,EAAE,UAAU,EAAE,MAAM,uBAAuB,CAAC;AAC/D,OAAO,EAAE,iBAAiB,EAAE,MAAM,sBAAsB,CAAC;AACzD,OAAO,EAAE,cAAc,EAAE,MAAM,mBAAmB,CAAC;AAEnD,KAAK,oBAAoB,GAAG;IAC1B,iBAAiB,CAAC,EAAE,MAAM,CAAC;IAC3B,YAAY,CAAC,EAAE,MAAM,CAAC;IACtB,gBAAgB,CAAC,EAAE,MAAM,CAAC;CAC3B,CAAC;AAEF,MAAM,MAAM,mBAAmB,GAAG;IAChC,KAAK,CAAC,EAAE;QACN,UAAU,CAAC,EAAE,eAAe,EAAE,CAAC;QAC/B,KAAK,CAAC,EAAE,CAAC,UAAU,GAAG,UAAU,CAAC,EAAE,CAAC;KACrC,CAAC;IAEF,WAAW,CAAC,EAAE,IAAI,CAAC,cAAc,EAAE,QAAQ,GAAG,OAAO,CAAC,CAAC;IAEvD,OAAO,EAAE,YAAY,CAAC;IACtB,QAAQ,EAAE,YAAY,EAAE,CAAC;IACzB,YAAY,CAAC,EAAE,MAAM,CAAC;IACtB,UAAU,CAAC,EAAE,MAAM,CAAC;CACrB,CAAC;AAEF,MAAM,MAAM,mBAAmB,GAAG,OAAO,CAAC;IACxC,IAAI,EAAE,MAAM,CAAC;IACb,QAAQ,EAAE,WAAW,EAAE,CAAC;CACzB,CAAC,CAAC;AAEH,MAAM,MAAM,mCAAmC,CAAC,CAAC,SAAS,CAAC,CAAC,SAAS,IACnE,mBAAmB,GAAG;IACpB,YAAY,EAAE,CAAC,CAAC;CACjB,CAAC;AAEJ,MAAM,MAAM,mCAAmC,CAAC,CAAC,IAAI,OAAO,CAAC;IAC3D,QAAQ,EAAE,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC;CACtB,CAAC,CAAC;AAEH,qBAAa,SAAS;IACR,OAAO,CAAC,MAAM;gBAAN,MAAM,EAAE,oBAAoB;IAE1C,IAAI,CAAC,MAAM,EAAE,mBAAmB,GAAG,mBAAmB;IAiBtD,oBAAoB,CAAC,CAAC,SAAS,CAAC,CAAC,SAAS,EAC9C,MAAM,EAAE,mCAAmC,CAAC,CAAC,CAAC,GAC7C,mCAAmC,CAAC,OAAO,MAAM,CAAC,YAAY,CAAC;IAwBlE;;;;OAIG;IACH,OAAO,CAAC,wBAAwB;IAoChC,WAAW,CACT,MAAM,EAAE,mBAAmB,EAC3B,YAAY,CAAC,EAAE,CAAC,CAAC,SAAS,GAAG,SAAS,GACrC;QAAE,KAAK,EAAE,UAAU,CAAC,OAAO,WAAW,CAAC,CAAA;KAAE;IAS5C,OAAO,CAAC,QAAQ;IAiChB,OAAO,CAAC,aAAa;IAkBrB,OAAO,CAAC,mBAAmB;CAU5B;AAED,OAAO,EAAE,eAAe,EAAE,iBAAiB,EAAE,cAAc,EAAE,CAAC;AAC9D,OAAO,EAAE,2BAA2B,EAAE,MAAM,iCAAiC,CAAC;AAC9E,OAAO,EAAE,UAAU,EAAE,MAAM,qBAAqB,CAAC;AACjD,YAAY,EAAE,WAAW,EAAE,aAAa,EAAE,MAAM,gBAAgB,CAAC;AACjE,YAAY,EACV,iBAAiB,EACjB,4BAA4B,GAC7B,MAAM,sB
AAsB,CAAC;AAC9B,YAAY,EACV,YAAY,EACZ,2BAA2B,GAC5B,MAAM,iCAAiC,CAAC"}

package/dist/langchain/audio-transcription.d.ts CHANGED Viewed

@@ -1,13 +1,18 @@
-import type { AudioBuffer } from "../@types/audio";
+import type { AudioBuffer, AudioMimeType } from "../@types/audio";
+/** Modelos disponíveis na API de transcrição OpenAI (Speech-to-Text) */
+export type WhisperModel = "whisper-1" | "gpt-4o-transcribe" | "gpt-4o-mini-transcribe" | "gpt-4o-mini-transcribe-2025-12-15" | "gpt-4o-transcribe-diarize";
 export type WhisperTranscriptionOptions = {
-    language?: string;
+    /** Modelo de transcrição. Padrão: "whisper-1". gpt-4o-transcribe e gpt-4o-mini-transcribe têm maior qualidade. */
+    model?: WhisperModel;
+    languageIn2Digits?: string;
     prompt?: string;
     responseFormat?: "json" | "text" | "srt" | "verbose_json" | "vtt";
     temperature?: number;
     timestampGranularities?: ("word" | "segment")[];
+    /** Formato do áudio: extensão ("mp3", "wav", "webm") ou MIME type ("audio/wav", "audio/webm") */
+    format?: string | AudioMimeType;
 };
 export declare class LangchainAudioTranscription {
-    private static extractTextFromDocs;
     static transcribeWithWhisper(audioBuffer: AudioBuffer, options?: WhisperTranscriptionOptions, openAIApiKey?: string): Promise<string>;
     static transcribeFileWithWhisper(filePath: string, options?: WhisperTranscriptionOptions, openAIApiKey?: string): Promise<string>;
 }

package/dist/langchain/audio-transcription.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"audio-transcription.d.ts","sourceRoot":"","sources":["../../src/langchain/audio-transcription.ts"],"names":[],"mappings":"~~AAEA~~,OAAO,KAAK,EAAE,WAAW,EAAE,MAAM,iBAAiB,CAAC;~~AAInD~~,MAAM,MAAM,2BAA2B,GAAG;IACxC,~~QAAQ~~,CAAC,EAAE,MAAM,CAAC;~~IAClB~~,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,cAAc,CAAC,EAAE,MAAM,GAAG,MAAM,GAAG,KAAK,GAAG,cAAc,GAAG,KAAK,CAAC;IAClE,WAAW,CAAC,EAAE,MAAM,CAAC;IACrB,sBAAsB,CAAC,EAAE,CAAC,MAAM,GAAG,SAAS,CAAC,EAAE,CAAC;~~CACjD~~,~~CAAC~~;~~AAEF~~,~~qBAAa~~,~~2BAA2B;IACtC~~,~~OAAO~~,~~CAAC,~~MAAM,CAAC,~~mBAAmB~~;~~WAYrB~~,qBAAqB,CAChC,WAAW,EAAE,WAAW,EACxB,OAAO,GAAE,2BAAgC,EACzC,YAAY,CAAC,EAAE,MAAM,GACpB,OAAO,CAAC,MAAM,CAAC;~~WAsCL~~,yBAAyB,CACpC,QAAQ,EAAE,MAAM,EAChB,OAAO,GAAE,2BAAgC,EACzC,YAAY,CAAC,EAAE,MAAM,GACpB,OAAO,CAAC,MAAM,CAAC;~~CAQnB~~"}
1	+ {"version":3,"file":"audio-transcription.d.ts","sourceRoot":"","sources":["../../src/langchain/audio-transcription.ts"],"names":[],"mappings":"AAIA,OAAO,KAAK,EAAE,WAAW,EAAE,aAAa,EAAE,MAAM,iBAAiB,CAAC;AAGlE,wEAAwE;AACxE,MAAM,MAAM,YAAY,GACpB,WAAW,GACX,mBAAmB,GACnB,wBAAwB,GACxB,mCAAmC,GACnC,2BAA2B,CAAC;AAEhC,MAAM,MAAM,2BAA2B,GAAG;IACxC,kHAAkH;IAClH,KAAK,CAAC,EAAE,YAAY,CAAC;IACrB,iBAAiB,CAAC,EAAE,MAAM,CAAC;IAC3B,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,cAAc,CAAC,EAAE,MAAM,GAAG,MAAM,GAAG,KAAK,GAAG,cAAc,GAAG,KAAK,CAAC;IAClE,WAAW,CAAC,EAAE,MAAM,CAAC;IACrB,sBAAsB,CAAC,EAAE,CAAC,MAAM,GAAG,SAAS,CAAC,EAAE,CAAC;IAChD,iGAAiG;IACjG,MAAM,CAAC,EAAE,MAAM,GAAG,aAAa,CAAC;CACjC,CAAC;AAgBF,qBAAa,2BAA2B;WACzB,qBAAqB,CAChC,WAAW,EAAE,WAAW,EACxB,OAAO,GAAE,2BAAgC,EACzC,YAAY,CAAC,EAAE,MAAM,GACpB,OAAO,CAAC,MAAM,CAAC;WAwCL,yBAAyB,CACpC,QAAQ,EAAE,MAAM,EAChB,OAAO,GAAE,2BAAgC,EACzC,YAAY,CAAC,EAAE,MAAM,GACpB,OAAO,CAAC,MAAM,CAAC;CAcnB"}

package/dist/langchain/audio-transcription.js CHANGED Viewed

@@ -32,62 +32,69 @@ var __importStar = (this && this.__importStar) || (function () {
         return result;
     };
 })();
+var __importDefault = (this && this.__importDefault) || function (mod) {
+    return (mod && mod.__esModule) ? mod : { "default": mod };
+};
 Object.defineProperty(exports, "__esModule", { value: true });
 exports.LangchainAudioTranscription = void 0;
 const fs = __importStar(require("fs"));
-const openai_whisper_audio_1 = require("@langchain/community/document_loaders/fs/openai_whisper_audio");
-const files_utils_1 = require("../utils/files-utils");
+const path = __importStar(require("path"));
+const openai_1 = __importDefault(require("openai"));
+const openai_2 = require("openai");
+const audio_1 = require("../@types/audio");
+function getExtension(format) {
+    if (!format)
+        return "mp3";
+    if (format.startsWith("audio/")) {
+        return audio_1.MIME_TO_EXTENSION[format] ?? "mp3";
+    }
+    return format.replace(/^\./, "");
+}
+function toBuffer(audioBuffer) {
+    if (audioBuffer instanceof Buffer)
+        return audioBuffer;
+    if (audioBuffer instanceof ArrayBuffer)
+        return Buffer.from(audioBuffer);
+    return Buffer.from(audioBuffer);
+}
 class LangchainAudioTranscription {
-    static extractTextFromDocs(docs) {
-        if (docs.length === 0) {
-            throw new Error("Nenhum documento foi retornado pela transcrição");
+    static async transcribeWithWhisper(audioBuffer, options = {}, openAIApiKey) {
+        if (openAIApiKey) {
+            process.env.OPENAI_API_KEY = openAIApiKey;
         }
-        const firstDoc = docs[0];
-        if (!firstDoc) {
-            throw new Error("Documento vazio retornado pela transcrição");
+        const buffer = toBuffer(audioBuffer);
+        const extension = getExtension(options.format);
+        const fileName = `whisper-${Date.now()}.${extension}`;
+        const file = await (0, openai_2.toFile)(buffer, fileName);
+        const openai = new openai_1.default();
+        const transcriptionParams = {
+            file,
+            model: options.model ?? "whisper-1",
+            response_format: options.responseFormat ?? "text",
+        };
+        if (options.languageIn2Digits) {
+            transcriptionParams.language = options.languageIn2Digits;
         }
-        // LangChain.js usa pageContent (camelCase), não page_content
-        return firstDoc.pageContent;
-    }
-    static async transcribeWithWhisper(audioBuffer, options = {}, openAIApiKey) {
-        const tempFilePath = files_utils_1.FilesUtils.createTempFile(audioBuffer, "whisper");
-        try {
-            // Configura a API key se fornecida
-            if (openAIApiKey) {
-                process.env.OPENAI_API_KEY = openAIApiKey;
-            }
-            const transcriptionParams = {
-                response_format: options.responseFormat || "text",
-            };
-            if (options.language) {
-                transcriptionParams.language = options.language;
-            }
-            if (options.prompt) {
-                transcriptionParams.prompt = options.prompt;
-            }
-            if (options.temperature !== undefined) {
-                transcriptionParams.temperature = options.temperature;
-            }
-            if (options.timestampGranularities) {
-                transcriptionParams.timestamp_granularities =
-                    options.timestampGranularities;
-            }
-            const loader = new openai_whisper_audio_1.OpenAIWhisperAudio(tempFilePath, {
-                transcriptionCreateParams: transcriptionParams,
-            });
-            const docs = await loader.load();
-            return this.extractTextFromDocs(docs);
+        if (options.prompt) {
+            transcriptionParams.prompt = options.prompt;
+        }
+        if (options.temperature !== undefined) {
+            transcriptionParams.temperature = options.temperature;
         }
-        finally {
-            files_utils_1.FilesUtils.cleanupTempFile(tempFilePath);
+        if (options.timestampGranularities) {
+            transcriptionParams.timestamp_granularities =
+                options.timestampGranularities;
         }
+        const response = await openai.audio.transcriptions.create(transcriptionParams);
+        return typeof response === "string" ? response : response.text;
     }
     static async transcribeFileWithWhisper(filePath, options = {}, openAIApiKey) {
         if (!fs.existsSync(filePath)) {
             throw new Error(`Arquivo não encontrado: ${filePath}`);
         }
         const audioBuffer = fs.readFileSync(filePath);
-        return this.transcribeWithWhisper(audioBuffer, options, openAIApiKey);
+        const format = options.format ?? (path.extname(filePath).replace(/^\./, "") || "mp3");
+        return this.transcribeWithWhisper(audioBuffer, { ...options, format }, openAIApiKey);
     }
 }
 exports.LangchainAudioTranscription = LangchainAudioTranscription;

package/dist/langchain/audio-transcription.js.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"audio-transcription.js","sourceRoot":"","sources":["../../src/langchain/audio-transcription.ts"],"names":[],"mappings":"~~;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;AACA~~,uCAAyB;~~AAEzB~~,~~wGAAmG~~;~~AACnG~~,~~sDAAkD~~;~~AAUlD~~,~~MAAa~~,~~2BAA2B~~;~~IAC9B~~,~~MAAM~~,CAAC,~~mBAAmB~~,CAAC,~~IAAgB~~;~~QACjD~~,~~IAAI~~,~~IAAI~~,CAAC,MAAM,~~KAAK~~,CAAC,EAAE,CAAC;~~YACtB~~,~~MAAM~~,~~IAAI~~,~~KAAK,~~CAAC,~~iDAAiD~~,CAAC,CAAC;~~QACrE~~,CAAC;~~QACD~~,MAAM,~~QAAQ~~,~~GAAG~~,~~IAAI~~,CAAC,CAAC,CAAC,CAAC;~~QACzB~~,IAAI,~~CAAC~~,~~QAAQ~~,~~EAAE~~,CAAC;~~YACd~~,~~MAAM,~~IAAI,~~KAAK~~,CAAC,~~4CAA4C~~,CAAC,CAAC~~;QAChE~~,CAAC;~~QACD~~,~~6DAA6D;QAC7D,~~OAAO,~~QAAQ~~,CAAC,~~WAAW~~,CAAC;~~IAC9B~~,CAAC;~~IAED~~,MAAM,CAAC,KAAK,CAAC,qBAAqB,CAChC,WAAwB,EACxB,UAAuC,EAAE,EACzC,YAAqB;QAErB,~~MAAM~~,YAAY,~~GAAG~~,~~wBAAU~~,CAAC,cAAc,CAAC,WAAW,~~EAAE~~,SAAS,CAAC,CAAC;~~QAEvE~~,IAAI,CAAC~~;YACH~~,~~mCAAmC;YACnC~~,IAAI,~~YAAY~~,EAAE,CAAC;~~gBACjB~~,~~OAAO~~,~~CAAC~~,GAAG,~~CAAC~~,~~cAAc~~,~~GAAG~~,~~YAAY~~,CAAC;~~YAC5C~~,CAAC;~~YAED~~,MAAM,mBAAmB,~~GAAQ~~;~~gBAC/B~~,eAAe,EAAE,OAAO,CAAC,cAAc,IAAI,MAAM;~~aAClD~~,CAAC;~~YAEF~~,IAAI,OAAO,CAAC,~~QAAQ~~,EAAE,CAAC;~~gBACrB~~,mBAAmB,CAAC,QAAQ,GAAG,OAAO,CAAC,~~QAAQ~~,CAAC;~~YAClD~~,CAAC;~~YACD~~,IAAI,OAAO,CAAC,MAAM,EAAE,CAAC;~~gBACnB~~,mBAAmB,CAAC,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC;~~YAC9C~~,CAAC;~~YACD~~,IAAI,OAAO,CAAC,WAAW,KAAK,SAAS,EAAE,CAAC;~~gBACtC~~,mBAAmB,CAAC,WAAW,GAAG,OAAO,CAAC,WAAW,CAAC;~~YACxD~~,CAAC;~~YACD~~,IAAI,OAAO,CAAC,sBAAsB,EAAE,CAAC;~~gBACnC~~,mBAAmB,CAAC,uBAAuB;~~oBACzC~~,OAAO,CAAC,sBAAsB,CAAC;~~YACnC~~,CAAC;~~YAED~~,MAAM,~~MAAM~~,GAAG,~~IAAI~~,~~yCAAkB~~,CAAC,~~YAAY~~,~~EAAE;gBAClD~~,~~yBAAyB~~,~~EAAE,mBAAmB;aAC/C,~~CAAC,~~CAAC;YAEH,~~MAAM,~~IAAI~~,~~GAAe~~,~~MAAM~~,~~MAAM,~~CAAC~~,IAAI,EAAE,CAAC~~;~~YAC7C~~,OAAO,~~IAAI~~,~~CAAC~~,~~mBAAmB~~,~~CAAC~~,~~IAAI,~~CAAC,CAAC~~;QACxC~~,CAAC~~;gBAAS~~,CAAC~~;YACT~~,~~wBAAU,~~CAAC,~~eAAe,~~CAAC,~~YAAY~~,CAAC,~~CAAC;QAC3C~~,CAAC;~~IACH~~,CAAC;IAED,MAAM,CAAC,KAAK,CAAC,yBAAyB,CA
CpC,QAAgB,EAChB,UAAuC,EAAE,EACzC,YAAqB;QAErB,IAAI,CAAC,EAAE,CAAC,UAAU,CAAC,QAAQ,CAAC,EAAE,CAAC;YAC7B,MAAM,IAAI,KAAK,CAAC,2BAA2B,QAAQ,EAAE,CAAC,CAAC;QACzD,CAAC;QAED,MAAM,WAAW,GAAG,EAAE,CAAC,YAAY,CAAC,QAAQ,CAAC,CAAC;QAC9C,OAAO,IAAI,CAAC,~~qBAAqB~~,CAAC,WAAW,EAAE,OAAO,EAAE,YAAY,~~CAAC~~,CAAC;~~IACxE~~,CAAC;CACF;~~AAnED~~,~~kEAmEC~~"}
1	+ {"version":3,"file":"audio-transcription.js","sourceRoot":"","sources":["../../src/langchain/audio-transcription.ts"],"names":[],"mappings":";;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;AAAA,uCAAyB;AACzB,2CAA6B;AAC7B,oDAA4B;AAC5B,mCAAgC;AAEhC,2CAAoD;AAsBpD,SAAS,YAAY,CAAC,MAA+B;IACnD,IAAI,CAAC,MAAM;QAAE,OAAO,KAAK,CAAC;IAC1B,IAAI,MAAM,CAAC,UAAU,CAAC,QAAQ,CAAC,EAAE,CAAC;QAChC,OAAO,yBAAiB,CAAC,MAAuB,CAAC,IAAI,KAAK,CAAC;IAC7D,CAAC;IACD,OAAO,MAAM,CAAC,OAAO,CAAC,KAAK,EAAE,EAAE,CAAC,CAAC;AACnC,CAAC;AAED,SAAS,QAAQ,CAAC,WAAwB;IACxC,IAAI,WAAW,YAAY,MAAM;QAAE,OAAO,WAAW,CAAC;IACtD,IAAI,WAAW,YAAY,WAAW;QAAE,OAAO,MAAM,CAAC,IAAI,CAAC,WAAW,CAAC,CAAC;IACxE,OAAO,MAAM,CAAC,IAAI,CAAC,WAAyB,CAAC,CAAC;AAChD,CAAC;AAED,MAAa,2BAA2B;IACtC,MAAM,CAAC,KAAK,CAAC,qBAAqB,CAChC,WAAwB,EACxB,UAAuC,EAAE,EACzC,YAAqB;QAErB,IAAI,YAAY,EAAE,CAAC;YACjB,OAAO,CAAC,GAAG,CAAC,cAAc,GAAG,YAAY,CAAC;QAC5C,CAAC;QAED,MAAM,MAAM,GAAG,QAAQ,CAAC,WAAW,CAAC,CAAC;QACrC,MAAM,SAAS,GAAG,YAAY,CAAC,OAAO,CAAC,MAAM,CAAC,CAAC;QAC/C,MAAM,QAAQ,GAAG,WAAW,IAAI,CAAC,GAAG,EAAE,IAAI,SAAS,EAAE,CAAC;QAEtD,MAAM,IAAI,GAAG,MAAM,IAAA,eAAM,EAAC,MAAM,EAAE,QAAQ,CAAC,CAAC;QAE5C,MAAM,MAAM,GAAG,IAAI,gBAAM,EAAE,CAAC;QAE5B,MAAM,mBAAmB,GAA2C;YAClE,IAAI;YACJ,KAAK,EAAE,OAAO,CAAC,KAAK,IAAI,WAAW;YACnC,eAAe,EAAE,OAAO,CAAC,cAAc,IAAI,MAAM;SAClD,CAAC;QAEF,IAAI,OAAO,CAAC,iBAAiB,EAAE,CAAC;YAC9B,mBAAmB,CAAC,QAAQ,GAAG,OAAO,CAAC,iBAAiB,CAAC;QAC3D,CAAC;QACD,IAAI,OAAO,CAAC,MAAM,EAAE,CAAC;YACnB,mBAAmB,CAAC,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC;QAC9C,CAAC;QACD,IAAI,OAAO,CAAC,WAAW,KAAK,SAAS,EAAE,CAAC;YACtC,mBAAmB,CAAC,WAAW,GAAG,OAAO,CAAC,WAAW,CAAC;QACxD,CAAC;QACD,IAAI,OAAO,CAAC,sBAAsB,EAAE,CAAC;YACnC,mBAAmB,CAAC,uBAAuB;gBACzC,OAAO,CAAC,sBAAsB,CAAC;QACnC,CAAC;QAED,MAAM,QAAQ,GAAG,MAAM,MAAM,CAAC,KAAK,CAAC,cAAc,CAAC,MAAM,CACvD,mBAAmB,CACpB,CAAC;QAEF,OAAO,OAAO,QAAQ,KAAK,QAAQ,CAAC,CAAC,CAAC,QAAQ,CAAC,CAAC,CAAC,QAAQ,CAAC,IAAI,CAAC;IACjE,CAAC;IAED,MAAM,CAAC,KAAK,CAAC,yBAAyB,CACpC,QAAgB,EAChB,UAAuC,EAAE,EACzC,YAAqB;QAErB,IAAI,CAAC,EAAE,CAAC,UAAU,CAAC,QAAQ,CAAC,EAAE,CAAC;YAC7B,MAAM,IAAI,KAAK,C
AAC,2BAA2B,QAAQ,EAAE,CAAC,CAAC;QACzD,CAAC;QAED,MAAM,WAAW,GAAG,EAAE,CAAC,YAAY,CAAC,QAAQ,CAAC,CAAC;QAC9C,MAAM,MAAM,GACV,OAAO,CAAC,MAAM,IAAI,CAAC,IAAI,CAAC,OAAO,CAAC,QAAQ,CAAC,CAAC,OAAO,CAAC,KAAK,EAAE,EAAE,CAAC,IAAI,KAAK,CAAC,CAAC;QACzE,OAAO,IAAI,CAAC,qBAAqB,CAC/B,WAAW,EACX,EAAE,GAAG,OAAO,EAAE,MAAM,EAAE,EACtB,YAAY,CACb,CAAC;IACJ,CAAC;CACF;AA/DD,kEA+DC"}

package/dist/langchain/messages.js CHANGED Viewed

@@ -57,7 +57,7 @@ class LangchainMessages {
             // Prepara opções de transcrição - só inclui language se não houver mimeType
             // Com exactOptionalPropertyTypes: true, não podemos passar undefined explicitamente
             const transcriptionOptions = mimeType
-                ? {}
+                ? { format: mimeType }
                 : { language: "pt" };
             const transcribedText = await audio_transcription_1.LangchainAudioTranscription.transcribeWithWhisper(audioBuffer, transcriptionOptions, openAIApiKey);
             // Combina o texto original (se fornecido) com a transcrição

package/dist/langchain/messages.js.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"messages.js","sourceRoot":"","sources":["../../src/langchain/messages.ts"],"names":[],"mappings":";;;AAAA,yCAAmE;AACnE,sDAAkD;AAElD,+DAAoE;AAuBpE,MAAa,iBAAiB;IAC5B,MAAM,CAAC,MAAM,CAAC,OAAe;QAC3B,OAAO,IAAI,yBAAa,CAAC,OAAO,CAAC,CAAC;IACpC,CAAC;IAED,MAAM,CAAC,KAAK,CAAC,OAAe;QAC1B,OAAO,IAAI,wBAAY,CAAC,OAAO,CAAC,CAAC;IACnC,CAAC;IAED,MAAM,CAAC,KAAK,CAAC,UAAU,CACrB,OAAqC;QAErC,MAAM,EAAE,KAAK,EAAE,IAAI,EAAE,QAAQ,GAAG,MAAM,EAAE,YAAY,EAAE,GAAG,OAAO,CAAC;QACjE,MAAM,EAAE,MAAM,EAAE,QAAQ,EAAE,QAAQ,EAAE,GAAG,KAAK,CAAC;QAE7C,OAAO,IAAI,CAAC,2BAA2B,CACrC,MAAM,EACN,IAAI,EACJ,QAAQ,EACR,QAAQ,EACR,QAAQ,EACR,YAAY,CACb,CAAC;IACJ,CAAC;IAED,MAAM,CAAC,EAAE,CAAC,OAAe;QACvB,OAAO,IAAI,qBAAS,CAAC,OAAO,CAAC,CAAC;IAChC,CAAC;IAEO,MAAM,CAAC,KAAK,CAAC,2BAA2B,CAC9C,WAAwB,EACxB,IAAa,EACb,QAAwB,EACxB,QAAiB,EACjB,WAAyC,MAAM,EAC/C,YAAqB;QAErB,gFAAgF;QAChF,IAAI,QAAQ,KAAK,QAAQ;YACvB,OAAO,MAAM,IAAI,CAAC,kBAAkB,CAClC,WAAW,EACX,QAAQ,EACR,IAAI,EACJ,YAAY,CACb,CAAC;QAEJ,4GAA4G;QAC5G,MAAM,UAAU,GAAG,wBAAU,CAAC,cAAc,CAAC,WAAW,CAAC,CAAC;QAC1D,MAAM,gBAAgB,GACpB,QAAQ,IAAI,wBAAU,CAAC,mBAAmB,CAAC,WAAW,EAAE,QAAQ,CAAC,CAAC;QAEpE,MAAM,OAAO,GAAe,EAAE,CAAC;QAE/B,6EAA6E;QAC7E,iGAAiG;QACjG,IAAI,IAAI,EAAE,CAAC;YACT,OAAO,CAAC,IAAI,CAAC;gBACX,IAAI,EAAE,MAAM;gBACZ,IAAI,EAAE,IAAI;aACX,CAAC,CAAC;QACL,CAAC;QAED,wEAAwE;QACxE,gEAAgE;QAChE,MAAM,UAAU,GAAsB;YACpC,IAAI,EAAE,OAAO;YACb,WAAW,EAAE,QAAQ;YACrB,IAAI,EAAE,UAAU;YAChB,SAAS,EAAE,gBAAgB;SAC5B,CAAC;QACF,OAAO,CAAC,IAAI,CAAC,UAAU,CAAC,CAAC;QAEzB,2DAA2D;QAC3D,mEAAmE;QACnE,OAAO,IAAI,wBAAY,CAAC;YACtB,OAAO,EAAE,OAAc;SACjB,CAAC,CAAC;IACZ,CAAC;IAEO,MAAM,CAAC,KAAK,CAAC,kBAAkB,CACrC,WAAwB,EACxB,QAAwB,EACxB,IAAa,EACb,YAAqB;QAErB,IAAI,CAAC,YAAY;YACf,MAAM,IAAI,KAAK,CACb,mIAAmI,CACpI,CAAC;QAEJ,IAAI,CAAC;YACH,4EAA4E;YAC5E,oFAAoF;YACpF,MAAM,oBAAoB,GAAG,QAAQ;gBACnC,CAAC,~~CAAE~~,~~EAA4B~~;~~gBAC/B~~,CAAC,CAAC,EAAE,QAAQ,EAAE,IAAI,EAAE,CAAC;YAEvB,MAAM,eAAe,GACnB,MAAM,iDAA2B,CAAC,qBAAqB,CACrD,WAAW,EACX,oBAAoB,EACpB,YAAY,CACb,CAAC;YAEJ,4DAA4D;YAC5D,MAAM,SAAS,GAAG,IAAI;gBACpB,CAAC,CAA
C,GAAG,IAAI,yBAAyB,eAAe,EAAE;gBACnD,CAAC,CAAC,qBAAqB,eAAe,EAAE,CAAC;YAE3C,0DAA0D;YAC1D,OAAO,IAAI,wBAAY,CAAC,SAAS,CAAC,CAAC;QACrC,CAAC;QAAC,OAAO,KAAK,EAAE,CAAC;YACf,kDAAkD;YAClD,yEAAyE;YACzE,MAAM,IAAI,KAAK,CACb,wDACE,KAAK,YAAY,KAAK,CAAC,CAAC,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,KAAK,CACvD,IAAI;gBACF,mGAAmG,CACtG,CAAC;QACJ,CAAC;IACH,CAAC;CACF;AA1HD,8CA0HC"}
1	+ {"version":3,"file":"messages.js","sourceRoot":"","sources":["../../src/langchain/messages.ts"],"names":[],"mappings":";;;AAAA,yCAAmE;AACnE,sDAAkD;AAElD,+DAAoE;AAuBpE,MAAa,iBAAiB;IAC5B,MAAM,CAAC,MAAM,CAAC,OAAe;QAC3B,OAAO,IAAI,yBAAa,CAAC,OAAO,CAAC,CAAC;IACpC,CAAC;IAED,MAAM,CAAC,KAAK,CAAC,OAAe;QAC1B,OAAO,IAAI,wBAAY,CAAC,OAAO,CAAC,CAAC;IACnC,CAAC;IAED,MAAM,CAAC,KAAK,CAAC,UAAU,CACrB,OAAqC;QAErC,MAAM,EAAE,KAAK,EAAE,IAAI,EAAE,QAAQ,GAAG,MAAM,EAAE,YAAY,EAAE,GAAG,OAAO,CAAC;QACjE,MAAM,EAAE,MAAM,EAAE,QAAQ,EAAE,QAAQ,EAAE,GAAG,KAAK,CAAC;QAE7C,OAAO,IAAI,CAAC,2BAA2B,CACrC,MAAM,EACN,IAAI,EACJ,QAAQ,EACR,QAAQ,EACR,QAAQ,EACR,YAAY,CACb,CAAC;IACJ,CAAC;IAED,MAAM,CAAC,EAAE,CAAC,OAAe;QACvB,OAAO,IAAI,qBAAS,CAAC,OAAO,CAAC,CAAC;IAChC,CAAC;IAEO,MAAM,CAAC,KAAK,CAAC,2BAA2B,CAC9C,WAAwB,EACxB,IAAa,EACb,QAAwB,EACxB,QAAiB,EACjB,WAAyC,MAAM,EAC/C,YAAqB;QAErB,gFAAgF;QAChF,IAAI,QAAQ,KAAK,QAAQ;YACvB,OAAO,MAAM,IAAI,CAAC,kBAAkB,CAClC,WAAW,EACX,QAAQ,EACR,IAAI,EACJ,YAAY,CACb,CAAC;QAEJ,4GAA4G;QAC5G,MAAM,UAAU,GAAG,wBAAU,CAAC,cAAc,CAAC,WAAW,CAAC,CAAC;QAC1D,MAAM,gBAAgB,GACpB,QAAQ,IAAI,wBAAU,CAAC,mBAAmB,CAAC,WAAW,EAAE,QAAQ,CAAC,CAAC;QAEpE,MAAM,OAAO,GAAe,EAAE,CAAC;QAE/B,6EAA6E;QAC7E,iGAAiG;QACjG,IAAI,IAAI,EAAE,CAAC;YACT,OAAO,CAAC,IAAI,CAAC;gBACX,IAAI,EAAE,MAAM;gBACZ,IAAI,EAAE,IAAI;aACX,CAAC,CAAC;QACL,CAAC;QAED,wEAAwE;QACxE,gEAAgE;QAChE,MAAM,UAAU,GAAsB;YACpC,IAAI,EAAE,OAAO;YACb,WAAW,EAAE,QAAQ;YACrB,IAAI,EAAE,UAAU;YAChB,SAAS,EAAE,gBAAgB;SAC5B,CAAC;QACF,OAAO,CAAC,IAAI,CAAC,UAAU,CAAC,CAAC;QAEzB,2DAA2D;QAC3D,mEAAmE;QACnE,OAAO,IAAI,wBAAY,CAAC;YACtB,OAAO,EAAE,OAAc;SACjB,CAAC,CAAC;IACZ,CAAC;IAEO,MAAM,CAAC,KAAK,CAAC,kBAAkB,CACrC,WAAwB,EACxB,QAAwB,EACxB,IAAa,EACb,YAAqB;QAErB,IAAI,CAAC,YAAY;YACf,MAAM,IAAI,KAAK,CACb,mIAAmI,CACpI,CAAC;QAEJ,IAAI,CAAC;YACH,4EAA4E;YAC5E,oFAAoF;YACpF,MAAM,oBAAoB,GAAG,QAAQ;gBACnC,CAAC,CAAC,EAAE,MAAM,EAAE,QAAQ,EAAE;gBACtB,CAAC,CAAC,EAAE,QAAQ,EAAE,IAAI,EAAE,CAAC;YAEvB,MAAM,eAAe,GACnB,MAAM,iDAA2B,CAAC,qBAAqB,CACrD,WAAW,EACX,oBAAoB,EACpB,YAAY,CACb,CAAC;YAEJ,4DAA4D;YAC5D,MAAM,SAAS,GAAG,IAAI;gBACpB,C
AAC,CAAC,GAAG,IAAI,yBAAyB,eAAe,EAAE;gBACnD,CAAC,CAAC,qBAAqB,eAAe,EAAE,CAAC;YAE3C,0DAA0D;YAC1D,OAAO,IAAI,wBAAY,CAAC,SAAS,CAAC,CAAC;QACrC,CAAC;QAAC,OAAO,KAAK,EAAE,CAAC;YACf,kDAAkD;YAClD,yEAAyE;YACzE,MAAM,IAAI,KAAK,CACb,wDACE,KAAK,YAAY,KAAK,CAAC,CAAC,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,KAAK,CACvD,IAAI;gBACF,mGAAmG,CACtG,CAAC;QACJ,CAAC;IACH,CAAC;CACF;AA1HD,8CA0HC"}

package/dist/utils/files-utils.d.ts CHANGED Viewed

@@ -1,6 +1,6 @@
-import type { AudioBuffer } from "../@types/audio";
+import { type AudioBuffer, type AudioMimeType } from "../@types/audio";
 export declare class FilesUtils {
-    static createTempFile(audioBuffer: AudioBuffer, prefix?: string): string;
+    static createTempFile(audioBuffer: AudioBuffer, prefix?: string, format?: string | AudioMimeType): string;
     static cleanupTempFile(filePath: string): void;
 }
 //# sourceMappingURL=files-utils.d.ts.map

package/dist/utils/files-utils.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"files-utils.d.ts","sourceRoot":"","sources":["../../src/utils/files-utils.ts"],"names":[],"mappings":"AAGA,OAAO,KAAK,~~EAAE,~~WAAW,~~EAAE~~,MAAM,iBAAiB,CAAC;~~AAEnD~~,qBAAa,UAAU;IACrB,MAAM,CAAC,cAAc,CACnB,WAAW,EAAE,WAAW,EACxB,MAAM,GAAE,MAAgB,~~GACvB~~,MAAM;~~IAsBT~~,MAAM,CAAC,eAAe,CAAC,QAAQ,EAAE,MAAM,GAAG,IAAI;CAS/C"}
1	+ {"version":3,"file":"files-utils.d.ts","sourceRoot":"","sources":["../../src/utils/files-utils.ts"],"names":[],"mappings":"AAGA,OAAO,EAEL,KAAK,WAAW,EAChB,KAAK,aAAa,EACnB,MAAM,iBAAiB,CAAC;AAEzB,qBAAa,UAAU;IACrB,MAAM,CAAC,cAAc,CACnB,WAAW,EAAE,WAAW,EACxB,MAAM,GAAE,MAAgB,EACxB,MAAM,CAAC,EAAE,MAAM,GAAG,aAAa,GAC9B,MAAM;IA8BT,MAAM,CAAC,eAAe,CAAC,QAAQ,EAAE,MAAM,GAAG,IAAI;CAS/C"}

package/dist/utils/files-utils.js CHANGED Viewed

@@ -37,10 +37,18 @@ exports.FilesUtils = void 0;
 const fs = __importStar(require("fs"));
 const path = __importStar(require("path"));
 const os = __importStar(require("os"));
+const audio_1 = require("../@types/audio");
 class FilesUtils {
-    static createTempFile(audioBuffer, prefix = "audio") {
+    static createTempFile(audioBuffer, prefix = "audio", format) {
+        const extension = format
+            ? format.startsWith("audio/")
+                ? audio_1.MIME_TO_EXTENSION[format] ?? "mp3"
+                : format.replace(/^\./, "")
+            : "mp3";
         const tempDir = os.tmpdir();
-        const tempFilePath = path.join(tempDir, `${prefix}-${Date.now()}-${Math.random().toString(36).substring(7)}.mp3`);
+        const tempFilePath = path.join(tempDir, `${prefix}-${Date.now()}-${Math.random()
+            .toString(36)
+            .substring(7)}.${extension}`);
         // Converte o buffer para Buffer se necessário
         let buffer;
         if (audioBuffer instanceof Buffer) {

package/dist/utils/files-utils.js.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"files-utils.js","sourceRoot":"","sources":["../../src/utils/files-utils.ts"],"names":[],"mappings":";;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;AAAA,uCAAyB;AACzB,2CAA6B;AAC7B,uCAAyB;~~AAGzB~~,MAAa,UAAU;IACrB,MAAM,CAAC,cAAc,CACnB,WAAwB,EACxB,SAAiB,OAAO;~~QAExB~~,MAAM,OAAO,GAAG,EAAE,CAAC,MAAM,EAAE,CAAC;QAC5B,MAAM,YAAY,GAAG,IAAI,CAAC,IAAI,CAC5B,OAAO,EACP,GAAG,MAAM,IAAI,IAAI,CAAC,GAAG,EAAE,IAAI,IAAI,CAAC,MAAM,EAAE,~~CAAC,~~QAAQ,CAAC,EAAE,CAAC,~~CAAC,~~SAAS,CAAC,CAAC,CAAC,~~MAAM~~,~~CACzE~~,CAAC;QAEF,8CAA8C;QAC9C,IAAI,MAAc,CAAC;QACnB,IAAI,WAAW,YAAY,MAAM,EAAE,CAAC;YAClC,MAAM,GAAG,WAAW,CAAC;QACvB,CAAC;aAAM,IAAI,WAAW,YAAY,WAAW,EAAE,CAAC;YAC9C,MAAM,GAAG,MAAM,CAAC,IAAI,CAAC,WAAW,CAAC,CAAC;QACpC,CAAC;aAAM,CAAC;YACN,MAAM,GAAG,MAAM,CAAC,IAAI,CAAC,WAAW,CAAC,CAAC;QACpC,CAAC;QAED,+BAA+B;QAC/B,EAAE,CAAC,aAAa,CAAC,YAAY,EAAE,MAAM,CAAC,CAAC;QACvC,OAAO,YAAY,CAAC;IACtB,CAAC;IAED,MAAM,CAAC,eAAe,CAAC,QAAgB;QACrC,IAAI,EAAE,CAAC,UAAU,CAAC,QAAQ,CAAC,EAAE,CAAC;YAC5B,IAAI,CAAC;gBACH,EAAE,CAAC,UAAU,CAAC,QAAQ,CAAC,CAAC;YAC1B,CAAC;YAAC,OAAO,KAAK,EAAE,CAAC;gBACf,OAAO,CAAC,IAAI,CAAC,uCAAuC,KAAK,EAAE,CAAC,CAAC;YAC/D,CAAC;QACH,CAAC;IACH,CAAC;CACF;~~AAnCD~~,~~gCAmCC~~"}
1	+ {"version":3,"file":"files-utils.js","sourceRoot":"","sources":["../../src/utils/files-utils.ts"],"names":[],"mappings":";;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;AAAA,uCAAyB;AACzB,2CAA6B;AAC7B,uCAAyB;AACzB,2CAIyB;AAEzB,MAAa,UAAU;IACrB,MAAM,CAAC,cAAc,CACnB,WAAwB,EACxB,SAAiB,OAAO,EACxB,MAA+B;QAE/B,MAAM,SAAS,GAAG,MAAM;YACtB,CAAC,CAAC,MAAM,CAAC,UAAU,CAAC,QAAQ,CAAC;gBAC3B,CAAC,CAAC,yBAAiB,CAAC,MAAuB,CAAC,IAAI,KAAK;gBACrD,CAAC,CAAC,MAAM,CAAC,OAAO,CAAC,KAAK,EAAE,EAAE,CAAC;YAC7B,CAAC,CAAC,KAAK,CAAC;QAEV,MAAM,OAAO,GAAG,EAAE,CAAC,MAAM,EAAE,CAAC;QAC5B,MAAM,YAAY,GAAG,IAAI,CAAC,IAAI,CAC5B,OAAO,EACP,GAAG,MAAM,IAAI,IAAI,CAAC,GAAG,EAAE,IAAI,IAAI,CAAC,MAAM,EAAE;aACrC,QAAQ,CAAC,EAAE,CAAC;aACZ,SAAS,CAAC,CAAC,CAAC,IAAI,SAAS,EAAE,CAC/B,CAAC;QAEF,8CAA8C;QAC9C,IAAI,MAAc,CAAC;QACnB,IAAI,WAAW,YAAY,MAAM,EAAE,CAAC;YAClC,MAAM,GAAG,WAAW,CAAC;QACvB,CAAC;aAAM,IAAI,WAAW,YAAY,WAAW,EAAE,CAAC;YAC9C,MAAM,GAAG,MAAM,CAAC,IAAI,CAAC,WAAW,CAAC,CAAC;QACpC,CAAC;aAAM,CAAC;YACN,MAAM,GAAG,MAAM,CAAC,IAAI,CAAC,WAAW,CAAC,CAAC;QACpC,CAAC;QAED,+BAA+B;QAC/B,EAAE,CAAC,aAAa,CAAC,YAAY,EAAE,MAAM,CAAC,CAAC;QACvC,OAAO,YAAY,CAAC;IACtB,CAAC;IAED,MAAM,CAAC,eAAe,CAAC,QAAgB;QACrC,IAAI,EAAE,CAAC,UAAU,CAAC,QAAQ,CAAC,EAAE,CAAC;YAC5B,IAAI,CAAC;gBACH,EAAE,CAAC,UAAU,CAAC,QAAQ,CAAC,CAAC;YAC1B,CAAC;YAAC,OAAO,KAAK,EAAE,CAAC;gBACf,OAAO,CAAC,IAAI,CAAC,uCAAuC,KAAK,EAAE,CAAC,CAAC;YAC/D,CAAC;QACH,CAAC;IACH,CAAC;CACF;AA5CD,gCA4CC"}

package/docs/LANGCHAIN_WHISPER_WINDOWS_BUG.md ADDED Viewed

@@ -0,0 +1,209 @@
+# Bug do LangChain no Windows: Transcrição de Áudio com Whisper - 2026-02-02
+## Resumo
+O loader `OpenAIWhisperAudio` do LangChain passa o **caminho completo do arquivo** (ex: `C:\Users\...\whisper-xxx.webm`) para a API da OpenAI. No Windows, isso pode causar falhas no envio multipart devido a backslashes e caracteres especiais no path.
+---
+## Passo a passo: O que acontece quando você transcreve áudio
+### 1. Seu código chama a transcrição
+```typescript
+// No seu código (@luanpoppe/ai)
+const tempFilePath = FilesUtils.createTempFile(audioBuffer, "whisper", options.format);
+// tempFilePath = "C:\Users\luan\AppData\Local\Temp\whisper-1738512345-abc123.webm"
+const loader = new OpenAIWhisperAudio(tempFilePath, { ... });
+const docs = await loader.load();
+```
+Você cria um arquivo temporário e passa o **caminho completo** para o loader do LangChain.
+---
+### 2. O LangChain lê o arquivo
+O `OpenAIWhisperAudio` estende `BufferLoader`. Internamente, ele:
+1. Lê o conteúdo do arquivo em memória (um `Buffer`)
+2. Guarda o caminho original em `metadata.source`
+```javascript
+// Dentro do BufferLoader (simplificado)
+metadata = {
+  source:
+    "C:\\Users\\luan\\AppData\\Local\\Temp\\whisper-1738512345-abc123.webm",
+};
+```
+---
+### 3. O LangChain chama a API da OpenAI
+O método `parse()` do loader faz algo assim:
+```javascript
+// Código atual do LangChain (com o bug)
+const fileName = metadata.source === "blob" ? metadata.blobType : metadata.source;
+// fileName = "C:\Users\luan\AppData\Local\Temp\whisper-1738512345-abc123.webm"
+const transcriptionResponse = await this.openAIClient.audio.transcriptions.create({
+  file: await toFile(raw, fileName),  // ← O problema está aqui!
+  model: "whisper-1",
+  ...
+});
+```
+O segundo parâmetro de `toFile(raw, fileName)` deveria ser **apenas o nome do arquivo** (ex: `whisper-1738512345-abc123.webm`), mas o LangChain passa o **caminho completo**.
+---
+### 4. O que a API da OpenAI espera
+A função `toFile` da OpenAI usa o segundo parâmetro para:
+- Definir o nome do arquivo no formulário multipart (Content-Disposition)
+- Ajudar a API a identificar o formato do áudio pela extensão
+O formato multipart espera algo como:
+```
+Content-Disposition: form-data; name="file"; filename="whisper-xxx.webm"
+```
+Com o caminho completo do Windows:
+```
+Content-Disposition: form-data; name="file"; filename="C:\Users\luan\AppData\Local\Temp\whisper-xxx.webm"
+```
+Os backslashes (`\`) e o path longo podem causar:
+- Parsing incorreto do header
+- Erros de encoding
+- Rejeição pela API
+---
+## Por que não dá para resolver no seu código (enquanto usar o loader do LangChain)?
+### O fluxo de dados
+```
+Seu código                    LangChain (biblioteca)              API OpenAI
+    |                                |                                  |
+    |  tempFilePath (path completo)  |                                  |
+    | ----------------------------->|                                  |
+    |                                |  Lê arquivo, guarda em metadata   |
+    |                                |  metadata.source = path completo  |
+    |                                |                                  |
+    |                                |  toFile(buffer, metadata.source)  |
+    |                                |  ↑ usa path completo internamente |
+    |                                | --------------------------------->|
+    |                                |                    Envio multipart|
+```
+### Onde está o controle?
+| Etapa                   | Quem controla | O que você pode fazer                                             |
+| ----------------------- | ------------- | ----------------------------------------------------------------- |
+| Criar arquivo temp      | **Você**      | Escolher onde criar (ex: `os.tmpdir()`)                           |
+| Path passado ao loader  | **Você**      | Só pode passar um path – o loader precisa dele para ler o arquivo |
+| Valor usado em `toFile` | **LangChain** | Você não tem acesso – é interno ao loader                         |
+| Chamada à API           | **LangChain** | Você não controla                                                 |
+### O problema central
+O loader **precisa** do path completo para **ler o arquivo** do disco. Não há como passar “só o nome” – o LangChain precisa do path para fazer `fs.readFile` (ou equivalente).
+Depois de ler, o loader usa o mesmo `metadata.source` (o path) como nome do arquivo no `toFile`. A decisão de usar `metadata.source` em vez de `path.basename(metadata.source)` está **dentro do LangChain**, não no seu código.
+### Por que não dá para “enganar” o loader?
+**Tentativa 1: Criar o arquivo em um path curto**
+```typescript
+// Ex: ./whisper-temp.webm
+const tempFilePath = path.join(process.cwd(), "whisper-temp.webm");
+```
+Ainda assim, `metadata.source` será algo como `C:\projeto\whisper-temp.webm`. O path continua completo; o LangChain continua passando ele para `toFile`.
+**Tentativa 2: Passar um Blob em vez de path**
+O loader aceita `string | Blob`. Se você passar um Blob, `metadata.source === "blob"` e ele usa `metadata.blobType` (ex: `"audio/webm"`). O Blob não tem path, então não há problema de Windows.
+Porém: o LangChain não expõe uma forma simples de criar o loader a partir de um Buffer/Blob com controle total do fluxo. E o `BufferLoader` espera um Blob do browser ou um path de arquivo – em Node.js, o uso típico é com path.
+**Tentativa 3: Wrapper ou monkey-patch**
+Você poderia tentar interceptar ou substituir o loader, mas:
+- Embora seja o seu código que instancia o loader, a chamada a `toFile` acontece dentro do método `parse()` dele
+- Você não controla o que é passado para `toFile`
+- Faria seu código depender de detalhes internos do LangChain, frágeis a atualizações
+---
+## Correção sugerida (no LangChain)
+No arquivo `openai_whisper_audio.ts` do LangChain:
+```typescript
+// Antes (com bug)
+const fileName =
+  metadata.source === "blob" ? metadata.blobType : metadata.source;
+// Depois (corrigido)
+const fileName =
+  metadata.source === "blob"
+    ? metadata.blobType
+    : path.basename(metadata.source);
+```
+Assim, quando `metadata.source` for um path de arquivo, só o nome do arquivo (ex: `whisper-xxx.webm`) é enviado para `toFile`.
+---
+## Suas opções práticas
+1. **Abrir um PR no LangChain** com essa correção e aguardar o merge.
+2. **Usar `pnpm patch`** (ou `patch-package`, em projetos npm/yarn – ele não suporta pnpm) para aplicar essa alteração automaticamente no `node_modules` após cada instalação.
+3. **Usar a API da OpenAI diretamente** (sem o loader do LangChain) e controlar o nome do arquivo no `toFile`.
+---
+## Diagrama do fluxo
+```
+┌─────────────────────────────────────────────────────────────────────────┐
+│ SEU CÓDIGO                                                               │
+│                                                                          │
+│  createTempFile() → "C:\Users\...\Temp\whisper-xxx.webm"                 │
+│           │                                                              │
+│           ▼                                                              │
+│  new OpenAIWhisperAudio(tempFilePath)                                     │
+└─────────────────────────────────────────────────────────────────────────┘
+                                    │
+                                    │ path completo
+                                    ▼
+┌─────────────────────────────────────────────────────────────────────────┐
+│ LANGCHAIN (você não controla)                                            │
+│                                                                          │
+│  1. Lê arquivo do path                                                   │
+│  2. metadata.source = path  ← guarda path completo                      │
+│  3. fileName = metadata.source  ← BUG: usa path completo                │
+│  4. toFile(buffer, fileName)  ← envia path para OpenAI                  │
+└─────────────────────────────────────────────────────────────────────────┘
+                                    │
+                                    │ multipart com filename = path
+                                    ▼
+┌─────────────────────────────────────────────────────────────────────────┐
+│ API OPENAI                                                               │
+│                                                                          │
+│  Recebe: filename="C:\Users\...\whisper-xxx.webm"                        │
+│  Problema: backslashes, path longo → pode falhar no Windows              │
+└─────────────────────────────────────────────────────────────────────────┘
+```

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@luanpoppe/ai",
-  "version": "1.0.8",
+  "version": "1.0.10",
   "description": "",
   "main": "dist/index.js",
   "keywords": [],
@@ -8,6 +8,7 @@
   "license": "ISC",
   "dependencies": {
     "@langchain/community": "^1.1.10",
+    "openai": "^6.17.0",
     "@langchain/core": "^1.1.16",
     "@langchain/google-genai": "^2.1.12",
     "@langchain/openai": "^1.2.3",

package/src/@types/audio.ts CHANGED Viewed

@@ -13,3 +13,18 @@ export type AudioMimeType =
   | "audio/flac"
   | "audio/aac"
   | "audio/opus";
+export const MIME_TO_EXTENSION: Record<AudioMimeType, string> = {
+  "audio/mpeg": "mp3",
+  "audio/mp3": "mp3",
+  "audio/wav": "wav",
+  "audio/wave": "wav",
+  "audio/x-wav": "wav",
+  "audio/mp4": "mp4",
+  "audio/m4a": "m4a",
+  "audio/webm": "webm",
+  "audio/ogg": "ogg",
+  "audio/flac": "flac",
+  "audio/aac": "aac",
+  "audio/opus": "opus",
+};

package/src/index.ts CHANGED Viewed

@@ -137,7 +137,7 @@ export class Langchain {
   getRawAgent(
     params: LangchainCallParams,
     outputSchema?: z.ZodSchema | undefined
-  ) {
+  ): { agent: ReturnType<typeof createAgent> } {
     const agent = createAgent({
       ...this.standardAgent(params),
       responseFormat: outputSchema as any,
@@ -217,4 +217,7 @@ export type {
   AudioContentBlock,
   HumanMessageWithAudioOptions,
 } from "./langchain/messages";
-export type { WhisperTranscriptionOptions } from "./langchain/audio-transcription";
+export type {
+  WhisperModel,
+  WhisperTranscriptionOptions,
+} from "./langchain/audio-transcription";

package/src/langchain/audio-transcription.ts CHANGED Viewed

@@ -1,70 +1,87 @@
-import { Document } from "@langchain/core/documents";
 import * as fs from "fs";
-import type { AudioBuffer } from "../@types/audio";
-import { OpenAIWhisperAudio } from "@langchain/community/document_loaders/fs/openai_whisper_audio";
-import { FilesUtils } from "../utils/files-utils";
+import * as path from "path";
+import OpenAI from "openai";
+import { toFile } from "openai";
+import type { AudioBuffer, AudioMimeType } from "../@types/audio";
+import { MIME_TO_EXTENSION } from "../@types/audio";
+/** Modelos disponíveis na API de transcrição OpenAI (Speech-to-Text) */
+export type WhisperModel =
+  | "whisper-1"
+  | "gpt-4o-transcribe"
+  | "gpt-4o-mini-transcribe"
+  | "gpt-4o-mini-transcribe-2025-12-15"
+  | "gpt-4o-transcribe-diarize";
 export type WhisperTranscriptionOptions = {
-  language?: string;
+  /** Modelo de transcrição. Padrão: "whisper-1". gpt-4o-transcribe e gpt-4o-mini-transcribe têm maior qualidade. */
+  model?: WhisperModel;
+  languageIn2Digits?: string;
   prompt?: string;
   responseFormat?: "json" | "text" | "srt" | "verbose_json" | "vtt";
   temperature?: number;
   timestampGranularities?: ("word" | "segment")[];
+  /** Formato do áudio: extensão ("mp3", "wav", "webm") ou MIME type ("audio/wav", "audio/webm") */
+  format?: string | AudioMimeType;
 };
-export class LangchainAudioTranscription {
-  private static extractTextFromDocs(docs: Document[]): string {
-    if (docs.length === 0) {
-      throw new Error("Nenhum documento foi retornado pela transcrição");
-    }
-    const firstDoc = docs[0];
-    if (!firstDoc) {
-      throw new Error("Documento vazio retornado pela transcrição");
-    }
-    // LangChain.js usa pageContent (camelCase), não page_content
-    return firstDoc.pageContent;
+function getExtension(format?: string | AudioMimeType): string {
+  if (!format) return "mp3";
+  if (format.startsWith("audio/")) {
+    return MIME_TO_EXTENSION[format as AudioMimeType] ?? "mp3";
   }
+  return format.replace(/^\./, "");
+}
+function toBuffer(audioBuffer: AudioBuffer): Buffer {
+  if (audioBuffer instanceof Buffer) return audioBuffer;
+  if (audioBuffer instanceof ArrayBuffer) return Buffer.from(audioBuffer);
+  return Buffer.from(audioBuffer as Uint8Array);
+}
+export class LangchainAudioTranscription {
   static async transcribeWithWhisper(
     audioBuffer: AudioBuffer,
     options: WhisperTranscriptionOptions = {},
     openAIApiKey?: string
   ): Promise<string> {
-    const tempFilePath = FilesUtils.createTempFile(audioBuffer, "whisper");
+    if (openAIApiKey) {
+      process.env.OPENAI_API_KEY = openAIApiKey;
+    }
-    try {
-      // Configura a API key se fornecida
-      if (openAIApiKey) {
-        process.env.OPENAI_API_KEY = openAIApiKey;
-      }
+    const buffer = toBuffer(audioBuffer);
+    const extension = getExtension(options.format);
+    const fileName = `whisper-${Date.now()}.${extension}`;
-      const transcriptionParams: any = {
-        response_format: options.responseFormat || "text",
-      };
+    const file = await toFile(buffer, fileName);
-      if (options.language) {
-        transcriptionParams.language = options.language;
-      }
-      if (options.prompt) {
-        transcriptionParams.prompt = options.prompt;
-      }
-      if (options.temperature !== undefined) {
-        transcriptionParams.temperature = options.temperature;
-      }
-      if (options.timestampGranularities) {
-        transcriptionParams.timestamp_granularities =
-          options.timestampGranularities;
-      }
+    const openai = new OpenAI();
-      const loader = new OpenAIWhisperAudio(tempFilePath, {
-        transcriptionCreateParams: transcriptionParams,
-      });
+    const transcriptionParams: OpenAI.Audio.TranscriptionCreateParams = {
+      file,
+      model: options.model ?? "whisper-1",
+      response_format: options.responseFormat ?? "text",
+    };
-      const docs: Document[] = await loader.load();
-      return this.extractTextFromDocs(docs);
-    } finally {
-      FilesUtils.cleanupTempFile(tempFilePath);
+    if (options.languageIn2Digits) {
+      transcriptionParams.language = options.languageIn2Digits;
+    }
+    if (options.prompt) {
+      transcriptionParams.prompt = options.prompt;
+    }
+    if (options.temperature !== undefined) {
+      transcriptionParams.temperature = options.temperature;
     }
+    if (options.timestampGranularities) {
+      transcriptionParams.timestamp_granularities =
+        options.timestampGranularities;
+    }
+    const response = await openai.audio.transcriptions.create(
+      transcriptionParams
+    );
+    return typeof response === "string" ? response : response.text;
   }
   static async transcribeFileWithWhisper(
@@ -77,6 +94,12 @@ export class LangchainAudioTranscription {
     }
     const audioBuffer = fs.readFileSync(filePath);
-    return this.transcribeWithWhisper(audioBuffer, options, openAIApiKey);
+    const format =
+      options.format ?? (path.extname(filePath).replace(/^\./, "") || "mp3");
+    return this.transcribeWithWhisper(
+      audioBuffer,
+      { ...options, format },
+      openAIApiKey
+    );
   }
 }

package/src/langchain/messages.ts CHANGED Viewed

@@ -118,7 +118,7 @@ export class LangchainMessages {
       // Prepara opções de transcrição - só inclui language se não houver mimeType
       // Com exactOptionalPropertyTypes: true, não podemos passar undefined explicitamente
       const transcriptionOptions = mimeType
-        ? ({} as { language?: string })
+        ? { format: mimeType }
         : { language: "pt" };
       const transcribedText =

package/src/utils/files-utils.ts CHANGED Viewed

@@ -1,17 +1,30 @@
 import * as fs from "fs";
 import * as path from "path";
 import * as os from "os";
-import type { AudioBuffer } from "../@types/audio";
+import {
+  MIME_TO_EXTENSION,
+  type AudioBuffer,
+  type AudioMimeType,
+} from "../@types/audio";
 export class FilesUtils {
   static createTempFile(
     audioBuffer: AudioBuffer,
-    prefix: string = "audio"
+    prefix: string = "audio",
+    format?: string | AudioMimeType
   ): string {
+    const extension = format
+      ? format.startsWith("audio/")
+        ? MIME_TO_EXTENSION[format as AudioMimeType] ?? "mp3"
+        : format.replace(/^\./, "")
+      : "mp3";
     const tempDir = os.tmpdir();
     const tempFilePath = path.join(
       tempDir,
-      `${prefix}-${Date.now()}-${Math.random().toString(36).substring(7)}.mp3`
+      `${prefix}-${Date.now()}-${Math.random()
+        .toString(36)
+        .substring(7)}.${extension}`
     );
     // Converte o buffer para Buffer se necessário

package/tests/unit/langchain/audio-transcription.test.ts CHANGED Viewed

@@ -1,287 +1,180 @@
 import { describe, it, expect, vi, beforeEach } from "vitest";
-import { LangchainAudioTranscription } from "../../../src/langchain/audio-transcription";
+import { LangchainAudioTranscription } from "../../../src/langchain/audio-transcription.js";
 import * as fs from "fs";
-import * as os from "os";
-import * as path from "path";
-// Mock do fs e os - cria arquivos reais no sistema de arquivos temporário
-import * as realFs from "fs";
-import * as realOs from "os";
-import * as realPath from "path";
-// Calcula tempDir usando os módulos reais (antes dos mocks)
-const tempDir = realPath.join(realOs.tmpdir(), "langchain-audio-test");
-// Garante que o diretório temporário existe
-if (!realFs.existsSync(tempDir)) {
-  realFs.mkdirSync(tempDir, { recursive: true });
-}
-vi.mock("fs", () => {
-  // Usa require para acessar o módulo real diretamente
-  const actualFs = require("fs");
-  const writeFileSyncSpy = vi.fn((filePath: string, data: Buffer) => {
-    // Cria o arquivo real no sistema de arquivos
-    actualFs.writeFileSync(filePath, data);
-  });
-  const readFileSyncSpy = vi.fn((filePath: string) => {
-    if (actualFs.existsSync(filePath)) {
-      return actualFs.readFileSync(filePath);
-    }
-    return Buffer.from("fake audio data");
-  });
-  const existsSyncSpy = vi.fn((filePath: string) => {
-    return actualFs.existsSync(filePath) || filePath.startsWith("/path/to/");
-  });
-  const unlinkSyncSpy = vi.fn((filePath: string) => {
-    if (actualFs.existsSync(filePath)) {
-      actualFs.unlinkSync(filePath);
-    }
-  });
-  return {
-    ...actualFs,
-    writeFileSync: writeFileSyncSpy,
-    readFileSync: readFileSyncSpy,
-    existsSync: existsSyncSpy,
-    unlinkSync: unlinkSyncSpy,
-  };
+const mockTranscriptionsCreate = vi.fn().mockResolvedValue({
+  text: "Texto transcrito do áudio",
 });
-vi.mock("os", () => {
-  // Calcula tempDir dentro do mock usando os módulos reais
-  const realOs = require("os");
-  const realPath = require("path");
-  const tempDirValue = realPath.join(realOs.tmpdir(), "langchain-audio-test");
+vi.mock("openai", () => {
   return {
-    tmpdir: vi.fn(() => tempDirValue),
+    default: class MockOpenAI {
+      audio = {
+        transcriptions: {
+          create: mockTranscriptionsCreate,
+        },
+      };
+    },
+    toFile: async (buffer: Buffer, filename: string) => {
+      return new File([new Uint8Array(buffer)], filename, {
+        type: "audio/mpeg",
+      });
+    },
   };
 });
-// Mock do módulo - precisa interceptar o require() dinâmico
-// Como o código usa require() dinâmico dentro de try-catch, precisamos garantir
-// que o mock seja aplicado antes do código ser executado
-vi.mock("@langchain/community/document_loaders/fs/openai_whisper_audio", () => {
-  // Importa o fs mockado para verificar arquivos
-  const fs = require("fs");
-  class MockOpenAIWhisperAudio {
-    constructor(public filePath: string, public options?: any) {
-      // Verifica se o arquivo existe usando o fs mockado
-      // O arquivo já deve ter sido criado pelo writeFileSync antes desta chamada
-      if (!fs.existsSync(filePath)) {
-        // Se não existe, lança o mesmo erro que o loader real lançaria
-        const error: any = new Error(`ENOENT: no such file or directory, open '${filePath}'`);
-        error.code = "ENOENT";
-        error.errno = -4058;
-        error.syscall = "open";
-        error.path = filePath;
-        throw error;
-      }
-    }
-    async load() {
-      return [
-        {
-          pageContent: "Texto transcrito do áudio",
-          metadata: {},
-        },
-      ];
-    }
-  }
+vi.mock("fs", () => {
+  const actualFs = require("fs");
   return {
-    OpenAIWhisperAudio: MockOpenAIWhisperAudio,
+    ...actualFs,
+    existsSync: vi.fn((filePath: string) => {
+      return actualFs.existsSync(filePath) || filePath.startsWith("/path/to/");
+    }),
+    readFileSync: vi.fn((filePath: string) => {
+      if (actualFs.existsSync(filePath)) {
+        return actualFs.readFileSync(filePath);
+      }
+      return Buffer.from("fake audio data");
+    }),
   };
 });
-// Mock também precisa interceptar o require() dinâmico usado no código
-// Vamos mockar o módulo de forma que o require() pegue o mock
 describe("LangchainAudioTranscription", () => {
   beforeEach(() => {
     vi.clearAllMocks();
-    // Limpa arquivos temporários criados nos testes anteriores
-    if (realFs.existsSync(tempDir)) {
-      const files = realFs.readdirSync(tempDir);
-      files.forEach((file) => {
-        const filePath = realPath.join(tempDir, file);
-        try {
-          realFs.unlinkSync(filePath);
-        } catch (error) {
-          // Ignora erros ao remover arquivos
-        }
-      });
-    }
-  });
-  afterAll(() => {
-    // Limpa diretório temporário após todos os testes
-    if (realFs.existsSync(tempDir)) {
-      try {
-        realFs.rmSync(tempDir, { recursive: true, force: true });
-      } catch (error) {
-        // Ignora erros ao remover diretório
-      }
-    }
+    mockTranscriptionsCreate.mockResolvedValue({
+      text: "Texto transcrito do áudio",
+    });
   });
   describe("transcribeWithWhisper", () => {
     it("deve transcrever áudio usando Whisper", async () => {
-      // Mocka diretamente o módulo após ser carregado
-      const audioModulePath = "@langchain/community/document_loaders/fs/openai_whisper_audio";
-      const audioModule = require(audioModulePath);
-      class MockLoader {
-        constructor(public filePath: string) {
-          // Usa o fs mockado importado
-          if (!fs.existsSync(filePath)) {
-            throw new Error(`ENOENT: no such file or directory, open '${filePath}'`);
-          }
-        }
-        async load() {
-          return [{ pageContent: "Texto transcrito do áudio", metadata: {} }];
-        }
-      }
-      // Substitui temporariamente a classe
-      const originalLoader = audioModule.OpenAIWhisperAudio;
-      audioModule.OpenAIWhisperAudio = MockLoader;
-      // Recarrega o módulo para pegar o mock
-      vi.resetModules();
-      const transcriptionModule = await import("../../../src/langchain/audio-transcription");
-      // Força a reimportação do loader mockado
-      const newAudioModule = require(audioModulePath);
-      newAudioModule.OpenAIWhisperAudio = MockLoader;
-      try {
-        const audioBuffer = Buffer.from("fake audio data");
-        const result = await transcriptionModule.LangchainAudioTranscription.transcribeWithWhisper(
-          audioBuffer
-        );
-        expect(result).toBe("Texto transcrito do áudio");
-        expect(vi.mocked(fs.writeFileSync)).toHaveBeenCalled();
-        expect(vi.mocked(fs.unlinkSync)).toHaveBeenCalled();
-      } finally {
-        // Restaura o loader original
-        audioModule.OpenAIWhisperAudio = originalLoader;
-      }
+      const audioBuffer = Buffer.from("fake audio data");
+      const result = await LangchainAudioTranscription.transcribeWithWhisper(
+        audioBuffer
+      );
+      expect(result).toBe("Texto transcrito do áudio");
+      expect(mockTranscriptionsCreate).toHaveBeenCalledWith(
+        expect.objectContaining({
+          model: "whisper-1",
+          response_format: "text",
+        })
+      );
     });
     it("deve aceitar opções de transcrição", async () => {
-      const audioModulePath = "@langchain/community/document_loaders/fs/openai_whisper_audio";
-      const audioModule = require(audioModulePath);
-      class MockLoader {
-        constructor(public filePath: string) {
-          // Usa o fs mockado importado
-          if (!fs.existsSync(filePath)) {
-            throw new Error(`ENOENT: no such file or directory, open '${filePath}'`);
-          }
-        }
-        async load() {
-          return [{ pageContent: "Texto transcrito do áudio", metadata: {} }];
-        }
-      }
-      const originalLoader = audioModule.OpenAIWhisperAudio;
-      audioModule.OpenAIWhisperAudio = MockLoader;
-      vi.resetModules();
-      const transcriptionModule = await import("../../../src/langchain/audio-transcription");
-      const newAudioModule = require(audioModulePath);
-      newAudioModule.OpenAIWhisperAudio = MockLoader;
-      try {
-        const audioBuffer = Buffer.from("fake audio data");
-        await transcriptionModule.LangchainAudioTranscription.transcribeWithWhisper(audioBuffer, {
-          language: "pt",
-          responseFormat: "json",
-        });
+      const audioBuffer = Buffer.from("fake audio data");
-        expect(vi.mocked(fs.writeFileSync)).toHaveBeenCalled();
-      } finally {
-        audioModule.OpenAIWhisperAudio = originalLoader;
-      }
+      await LangchainAudioTranscription.transcribeWithWhisper(audioBuffer, {
+        languageIn2Digits: "pt",
+        responseFormat: "json",
+      });
+      expect(mockTranscriptionsCreate).toHaveBeenCalledWith(
+        expect.objectContaining({
+          language: "pt",
+          response_format: "json",
+        })
+      );
     });
-    it("deve limpar arquivo temporário mesmo em caso de erro", async () => {
+    it("deve aceitar modelo customizado", async () => {
       const audioBuffer = Buffer.from("fake audio data");
-      // Mocka o módulo antes de importar
-      vi.doMock("@langchain/community/document_loaders/fs/openai_whisper_audio", () => {
-        const fs = require("fs");
-        class MockLoaderWithError {
-          constructor(public filePath: string) {
-            if (!fs.existsSync(filePath)) {
-              throw new Error(`ENOENT: no such file or directory, open '${filePath}'`);
-            }
-          }
-          async load() {
-            throw new Error("Erro de transcrição");
-          }
-        }
-        return { OpenAIWhisperAudio: MockLoaderWithError };
+      await LangchainAudioTranscription.transcribeWithWhisper(audioBuffer, {
+        model: "gpt-4o-transcribe",
       });
-      vi.resetModules();
-      const transcriptionModule = await import("../../../src/langchain/audio-transcription");
+      expect(mockTranscriptionsCreate).toHaveBeenCalledWith(
+        expect.objectContaining({
+          model: "gpt-4o-transcribe",
+        })
+      );
+    });
+    it("deve usar whisper-1 como padrão quando model não é informado", async () => {
+      const audioBuffer = Buffer.from("fake audio data");
+      await LangchainAudioTranscription.transcribeWithWhisper(audioBuffer);
+      expect(mockTranscriptionsCreate).toHaveBeenCalledWith(
+        expect.objectContaining({
+          model: "whisper-1",
+        })
+      );
+    });
+    it("deve aceitar formato de áudio nas opções (extensão)", async () => {
+      const audioBuffer = Buffer.from("fake wav audio data");
+      const result = await LangchainAudioTranscription.transcribeWithWhisper(
+        audioBuffer,
+        { format: "wav" }
+      );
+      expect(result).toBe("Texto transcrito do áudio");
+      expect(mockTranscriptionsCreate).toHaveBeenCalledWith(
+        expect.objectContaining({
+          file: expect.anything(),
+        })
+      );
+      const createCall = mockTranscriptionsCreate.mock.calls[0]?.[0];
+      expect(createCall?.file).toBeDefined();
+      const file = createCall?.file as { name?: string };
+      expect(file?.name).toMatch(/\.wav$/);
+    });
+    it("deve aceitar MIME type como formato", async () => {
+      const audioBuffer = Buffer.from("fake webm audio data");
+      const result = await LangchainAudioTranscription.transcribeWithWhisper(
+        audioBuffer,
+        { format: "audio/webm" }
+      );
+      expect(result).toBe("Texto transcrito do áudio");
+      const createCall = mockTranscriptionsCreate.mock.calls[0]?.[0];
+      const file = createCall?.file as { name?: string };
+      expect(file?.name).toMatch(/\.webm$/);
+    });
+    it("deve propagar erro da API", async () => {
+      mockTranscriptionsCreate.mockRejectedValueOnce(
+        new Error("Erro de transcrição")
+      );
+      const audioBuffer = Buffer.from("fake audio data");
       await expect(
-        transcriptionModule.LangchainAudioTranscription.transcribeWithWhisper(audioBuffer)
+        LangchainAudioTranscription.transcribeWithWhisper(audioBuffer)
       ).rejects.toThrow("Erro de transcrição");
-      // Verifica que tentou remover o arquivo temporário
-      expect(vi.mocked(fs.unlinkSync)).toHaveBeenCalled();
     });
   });
   describe("transcribeFileWithWhisper", () => {
     it("deve transcrever arquivo usando Whisper", async () => {
-      // Limpa o mock anterior e cria um novo mock
-      vi.doUnmock("@langchain/community/document_loaders/fs/openai_whisper_audio");
-      vi.doMock("@langchain/community/document_loaders/fs/openai_whisper_audio", () => {
-        const fs = require("fs");
-        class MockLoader {
-          constructor(public filePath: string) {
-            if (!fs.existsSync(filePath)) {
-              throw new Error(`ENOENT: no such file or directory, open '${filePath}'`);
-            }
-          }
-          async load() {
-            return [{ pageContent: "Texto transcrito do áudio", metadata: {} }];
-          }
-        }
-        return { OpenAIWhisperAudio: MockLoader };
-      });
-      vi.resetModules();
-      const transcriptionModule = await import("../../../src/langchain/audio-transcription");
-      const fs = require("fs");
       const filePath = "/path/to/audio.mp3";
       const result =
-        await transcriptionModule.LangchainAudioTranscription.transcribeFileWithWhisper(filePath);
+        await LangchainAudioTranscription.transcribeFileWithWhisper(filePath);
+      expect(result).toBe("Texto transcrito do áudio");
+      expect(vi.mocked(fs.readFileSync)).toHaveBeenCalledWith(filePath);
+      expect(mockTranscriptionsCreate).toHaveBeenCalled();
+    });
+    it("deve extrair formato da extensão do arquivo quando format não é informado", async () => {
+      const filePath = "/path/to/audio.wav";
+      const result =
+        await LangchainAudioTranscription.transcribeFileWithWhisper(filePath);
       expect(result).toBe("Texto transcrito do áudio");
-      // Verifica que readFileSync foi chamado (pode não ser spy após resetModules)
-      expect(fs.readFileSync).toBeDefined();
+      const createCall = mockTranscriptionsCreate.mock.calls[0]?.[0];
+      const file = createCall?.file as { name?: string };
+      expect(file?.name).toMatch(/\.wav$/);
     });
     it("deve lançar erro se arquivo não existir", async () => {