hume 0.13.6 → 0.13.8
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.mock/definition/empathic-voice/__package__.yml +669 -657
- package/.mock/definition/empathic-voice/chat.yml +27 -27
- package/.mock/definition/empathic-voice/chatWebhooks.yml +2 -2
- package/.mock/definition/tts/__package__.yml +93 -88
- package/api/resources/empathicVoice/types/AssistantEnd.d.ts +2 -2
- package/api/resources/empathicVoice/types/AssistantInput.d.ts +2 -2
- package/api/resources/empathicVoice/types/AssistantMessage.d.ts +8 -8
- package/api/resources/empathicVoice/types/AssistantProsody.d.ts +6 -6
- package/api/resources/empathicVoice/types/AudioConfiguration.d.ts +2 -2
- package/api/resources/empathicVoice/types/AudioInput.d.ts +6 -6
- package/api/resources/empathicVoice/types/AudioOutput.d.ts +4 -4
- package/api/resources/empathicVoice/types/BuiltinToolConfig.d.ts +1 -1
- package/api/resources/empathicVoice/types/ChatMessage.d.ts +2 -2
- package/api/resources/empathicVoice/types/ChatMetadata.d.ts +8 -8
- package/api/resources/empathicVoice/types/Context.d.ts +6 -6
- package/api/resources/empathicVoice/types/LanguageModelType.d.ts +7 -1
- package/api/resources/empathicVoice/types/LanguageModelType.js +6 -0
- package/api/resources/empathicVoice/types/PauseAssistantMessage.d.ts +2 -2
- package/api/resources/empathicVoice/types/ResumeAssistantMessage.d.ts +2 -2
- package/api/resources/empathicVoice/types/ReturnConfig.d.ts +2 -2
- package/api/resources/empathicVoice/types/SessionSettings.d.ts +27 -27
- package/api/resources/empathicVoice/types/Tool.d.ts +6 -6
- package/api/resources/empathicVoice/types/ToolCallMessage.d.ts +6 -6
- package/api/resources/empathicVoice/types/ToolErrorMessage.d.ts +16 -16
- package/api/resources/empathicVoice/types/ToolResponseMessage.d.ts +8 -8
- package/api/resources/empathicVoice/types/UserInput.d.ts +2 -2
- package/api/resources/empathicVoice/types/UserInterruption.d.ts +4 -4
- package/api/resources/empathicVoice/types/UserMessage.d.ts +12 -12
- package/api/resources/empathicVoice/types/WebSocketError.d.ts +10 -10
- package/api/resources/empathicVoice/types/WebhookEventChatEnded.d.ts +8 -8
- package/api/resources/empathicVoice/types/WebhookEventChatStarted.d.ts +6 -6
- package/api/resources/empathicVoice/types/index.d.ts +16 -16
- package/api/resources/empathicVoice/types/index.js +16 -16
- package/api/resources/index.d.ts +1 -1
- package/api/resources/index.js +2 -2
- package/api/resources/tts/client/Client.d.ts +6 -6
- package/api/resources/tts/client/Client.js +35 -35
- package/api/resources/tts/types/OctaveVersion.d.ts +4 -0
- package/api/resources/tts/types/OctaveVersion.js +5 -0
- package/api/resources/tts/types/PostedTts.d.ts +9 -8
- package/api/resources/tts/types/PostedUtterance.d.ts +6 -6
- package/api/resources/tts/types/ReturnGeneration.d.ts +5 -5
- package/api/resources/tts/types/ReturnTts.d.ts +1 -1
- package/api/resources/tts/types/Snippet.d.ts +6 -6
- package/api/resources/tts/types/SnippetAudioChunk.d.ts +12 -11
- package/api/resources/tts/types/index.d.ts +1 -0
- package/api/resources/tts/types/index.js +1 -0
- package/dist/api/resources/empathicVoice/types/AssistantEnd.d.ts +2 -2
- package/dist/api/resources/empathicVoice/types/AssistantInput.d.ts +2 -2
- package/dist/api/resources/empathicVoice/types/AssistantMessage.d.ts +8 -8
- package/dist/api/resources/empathicVoice/types/AssistantProsody.d.ts +6 -6
- package/dist/api/resources/empathicVoice/types/AudioConfiguration.d.ts +2 -2
- package/dist/api/resources/empathicVoice/types/AudioInput.d.ts +6 -6
- package/dist/api/resources/empathicVoice/types/AudioOutput.d.ts +4 -4
- package/dist/api/resources/empathicVoice/types/BuiltinToolConfig.d.ts +1 -1
- package/dist/api/resources/empathicVoice/types/ChatMessage.d.ts +2 -2
- package/dist/api/resources/empathicVoice/types/ChatMetadata.d.ts +8 -8
- package/dist/api/resources/empathicVoice/types/Context.d.ts +6 -6
- package/dist/api/resources/empathicVoice/types/LanguageModelType.d.ts +7 -1
- package/dist/api/resources/empathicVoice/types/LanguageModelType.js +6 -0
- package/dist/api/resources/empathicVoice/types/PauseAssistantMessage.d.ts +2 -2
- package/dist/api/resources/empathicVoice/types/ResumeAssistantMessage.d.ts +2 -2
- package/dist/api/resources/empathicVoice/types/ReturnConfig.d.ts +2 -2
- package/dist/api/resources/empathicVoice/types/SessionSettings.d.ts +27 -27
- package/dist/api/resources/empathicVoice/types/Tool.d.ts +6 -6
- package/dist/api/resources/empathicVoice/types/ToolCallMessage.d.ts +6 -6
- package/dist/api/resources/empathicVoice/types/ToolErrorMessage.d.ts +16 -16
- package/dist/api/resources/empathicVoice/types/ToolResponseMessage.d.ts +8 -8
- package/dist/api/resources/empathicVoice/types/UserInput.d.ts +2 -2
- package/dist/api/resources/empathicVoice/types/UserInterruption.d.ts +4 -4
- package/dist/api/resources/empathicVoice/types/UserMessage.d.ts +12 -12
- package/dist/api/resources/empathicVoice/types/WebSocketError.d.ts +10 -10
- package/dist/api/resources/empathicVoice/types/WebhookEventChatEnded.d.ts +8 -8
- package/dist/api/resources/empathicVoice/types/WebhookEventChatStarted.d.ts +6 -6
- package/dist/api/resources/empathicVoice/types/index.d.ts +16 -16
- package/dist/api/resources/empathicVoice/types/index.js +16 -16
- package/dist/api/resources/index.d.ts +1 -1
- package/dist/api/resources/index.js +2 -2
- package/dist/api/resources/tts/client/Client.d.ts +6 -6
- package/dist/api/resources/tts/client/Client.js +35 -35
- package/dist/api/resources/tts/types/OctaveVersion.d.ts +4 -0
- package/dist/api/resources/tts/types/OctaveVersion.js +5 -0
- package/dist/api/resources/tts/types/PostedTts.d.ts +9 -8
- package/dist/api/resources/tts/types/PostedUtterance.d.ts +6 -6
- package/dist/api/resources/tts/types/ReturnGeneration.d.ts +5 -5
- package/dist/api/resources/tts/types/ReturnTts.d.ts +1 -1
- package/dist/api/resources/tts/types/Snippet.d.ts +6 -6
- package/dist/api/resources/tts/types/SnippetAudioChunk.d.ts +12 -11
- package/dist/api/resources/tts/types/index.d.ts +1 -0
- package/dist/api/resources/tts/types/index.js +1 -0
- package/dist/serialization/resources/empathicVoice/types/AssistantEnd.d.ts +1 -1
- package/dist/serialization/resources/empathicVoice/types/AssistantEnd.js +1 -1
- package/dist/serialization/resources/empathicVoice/types/AssistantInput.d.ts +1 -1
- package/dist/serialization/resources/empathicVoice/types/AssistantInput.js +1 -1
- package/dist/serialization/resources/empathicVoice/types/AssistantMessage.d.ts +2 -2
- package/dist/serialization/resources/empathicVoice/types/AssistantMessage.js +2 -2
- package/dist/serialization/resources/empathicVoice/types/AssistantProsody.d.ts +2 -2
- package/dist/serialization/resources/empathicVoice/types/AssistantProsody.js +2 -2
- package/dist/serialization/resources/empathicVoice/types/AudioConfiguration.d.ts +1 -1
- package/dist/serialization/resources/empathicVoice/types/AudioConfiguration.js +1 -1
- package/dist/serialization/resources/empathicVoice/types/AudioInput.d.ts +1 -1
- package/dist/serialization/resources/empathicVoice/types/AudioInput.js +1 -1
- package/dist/serialization/resources/empathicVoice/types/AudioOutput.d.ts +2 -2
- package/dist/serialization/resources/empathicVoice/types/AudioOutput.js +2 -2
- package/dist/serialization/resources/empathicVoice/types/BuiltinToolConfig.d.ts +1 -1
- package/dist/serialization/resources/empathicVoice/types/BuiltinToolConfig.js +1 -1
- package/dist/serialization/resources/empathicVoice/types/ChatMessage.d.ts +1 -1
- package/dist/serialization/resources/empathicVoice/types/ChatMessage.js +1 -1
- package/dist/serialization/resources/empathicVoice/types/ChatMetadata.d.ts +2 -2
- package/dist/serialization/resources/empathicVoice/types/ChatMetadata.js +2 -2
- package/dist/serialization/resources/empathicVoice/types/Context.d.ts +1 -1
- package/dist/serialization/resources/empathicVoice/types/Context.js +1 -1
- package/dist/serialization/resources/empathicVoice/types/LanguageModelType.d.ts +1 -1
- package/dist/serialization/resources/empathicVoice/types/LanguageModelType.js +6 -0
- package/dist/serialization/resources/empathicVoice/types/PauseAssistantMessage.d.ts +1 -1
- package/dist/serialization/resources/empathicVoice/types/PauseAssistantMessage.js +1 -1
- package/dist/serialization/resources/empathicVoice/types/ResumeAssistantMessage.d.ts +1 -1
- package/dist/serialization/resources/empathicVoice/types/ResumeAssistantMessage.js +1 -1
- package/dist/serialization/resources/empathicVoice/types/ReturnConfig.d.ts +1 -1
- package/dist/serialization/resources/empathicVoice/types/ReturnConfig.js +1 -1
- package/dist/serialization/resources/empathicVoice/types/SessionSettings.d.ts +8 -8
- package/dist/serialization/resources/empathicVoice/types/SessionSettings.js +8 -8
- package/dist/serialization/resources/empathicVoice/types/Tool.d.ts +3 -3
- package/dist/serialization/resources/empathicVoice/types/Tool.js +3 -3
- package/dist/serialization/resources/empathicVoice/types/ToolCallMessage.d.ts +3 -3
- package/dist/serialization/resources/empathicVoice/types/ToolCallMessage.js +3 -3
- package/dist/serialization/resources/empathicVoice/types/ToolErrorMessage.d.ts +6 -6
- package/dist/serialization/resources/empathicVoice/types/ToolErrorMessage.js +6 -6
- package/dist/serialization/resources/empathicVoice/types/ToolResponseMessage.d.ts +2 -2
- package/dist/serialization/resources/empathicVoice/types/ToolResponseMessage.js +2 -2
- package/dist/serialization/resources/empathicVoice/types/UserInput.d.ts +1 -1
- package/dist/serialization/resources/empathicVoice/types/UserInput.js +1 -1
- package/dist/serialization/resources/empathicVoice/types/UserInterruption.d.ts +1 -1
- package/dist/serialization/resources/empathicVoice/types/UserInterruption.js +1 -1
- package/dist/serialization/resources/empathicVoice/types/UserMessage.d.ts +3 -3
- package/dist/serialization/resources/empathicVoice/types/UserMessage.js +3 -3
- package/dist/serialization/resources/empathicVoice/types/WebSocketError.d.ts +3 -3
- package/dist/serialization/resources/empathicVoice/types/WebSocketError.js +3 -3
- package/dist/serialization/resources/empathicVoice/types/WebhookEventChatEnded.d.ts +4 -4
- package/dist/serialization/resources/empathicVoice/types/WebhookEventChatEnded.js +4 -4
- package/dist/serialization/resources/empathicVoice/types/WebhookEventChatStarted.d.ts +3 -3
- package/dist/serialization/resources/empathicVoice/types/WebhookEventChatStarted.js +3 -3
- package/dist/serialization/resources/empathicVoice/types/index.d.ts +16 -16
- package/dist/serialization/resources/empathicVoice/types/index.js +16 -16
- package/dist/serialization/resources/index.d.ts +1 -1
- package/dist/serialization/resources/index.js +2 -2
- package/dist/serialization/resources/tts/types/OctaveVersion.d.ts +10 -0
- package/dist/serialization/resources/tts/types/OctaveVersion.js +41 -0
- package/dist/serialization/resources/tts/types/PostedTts.d.ts +5 -3
- package/dist/serialization/resources/tts/types/PostedTts.js +5 -3
- package/dist/serialization/resources/tts/types/PostedUtterance.d.ts +2 -2
- package/dist/serialization/resources/tts/types/PostedUtterance.js +2 -2
- package/dist/serialization/resources/tts/types/ReturnGeneration.d.ts +3 -3
- package/dist/serialization/resources/tts/types/ReturnGeneration.js +3 -3
- package/dist/serialization/resources/tts/types/ReturnTts.d.ts +1 -1
- package/dist/serialization/resources/tts/types/ReturnTts.js +1 -1
- package/dist/serialization/resources/tts/types/Snippet.d.ts +3 -3
- package/dist/serialization/resources/tts/types/Snippet.js +3 -3
- package/dist/serialization/resources/tts/types/SnippetAudioChunk.d.ts +7 -6
- package/dist/serialization/resources/tts/types/SnippetAudioChunk.js +7 -6
- package/dist/serialization/resources/tts/types/index.d.ts +1 -0
- package/dist/serialization/resources/tts/types/index.js +1 -0
- package/dist/version.d.ts +1 -1
- package/dist/version.js +1 -1
- package/dist/wrapper/index.d.ts +1 -1
- package/dist/wrapper/index.js +53 -3
- package/package.json +1 -1
- package/reference.md +706 -706
- package/serialization/resources/empathicVoice/types/AssistantEnd.d.ts +1 -1
- package/serialization/resources/empathicVoice/types/AssistantEnd.js +1 -1
- package/serialization/resources/empathicVoice/types/AssistantInput.d.ts +1 -1
- package/serialization/resources/empathicVoice/types/AssistantInput.js +1 -1
- package/serialization/resources/empathicVoice/types/AssistantMessage.d.ts +2 -2
- package/serialization/resources/empathicVoice/types/AssistantMessage.js +2 -2
- package/serialization/resources/empathicVoice/types/AssistantProsody.d.ts +2 -2
- package/serialization/resources/empathicVoice/types/AssistantProsody.js +2 -2
- package/serialization/resources/empathicVoice/types/AudioConfiguration.d.ts +1 -1
- package/serialization/resources/empathicVoice/types/AudioConfiguration.js +1 -1
- package/serialization/resources/empathicVoice/types/AudioInput.d.ts +1 -1
- package/serialization/resources/empathicVoice/types/AudioInput.js +1 -1
- package/serialization/resources/empathicVoice/types/AudioOutput.d.ts +2 -2
- package/serialization/resources/empathicVoice/types/AudioOutput.js +2 -2
- package/serialization/resources/empathicVoice/types/BuiltinToolConfig.d.ts +1 -1
- package/serialization/resources/empathicVoice/types/BuiltinToolConfig.js +1 -1
- package/serialization/resources/empathicVoice/types/ChatMessage.d.ts +1 -1
- package/serialization/resources/empathicVoice/types/ChatMessage.js +1 -1
- package/serialization/resources/empathicVoice/types/ChatMetadata.d.ts +2 -2
- package/serialization/resources/empathicVoice/types/ChatMetadata.js +2 -2
- package/serialization/resources/empathicVoice/types/Context.d.ts +1 -1
- package/serialization/resources/empathicVoice/types/Context.js +1 -1
- package/serialization/resources/empathicVoice/types/LanguageModelType.d.ts +1 -1
- package/serialization/resources/empathicVoice/types/LanguageModelType.js +6 -0
- package/serialization/resources/empathicVoice/types/PauseAssistantMessage.d.ts +1 -1
- package/serialization/resources/empathicVoice/types/PauseAssistantMessage.js +1 -1
- package/serialization/resources/empathicVoice/types/ResumeAssistantMessage.d.ts +1 -1
- package/serialization/resources/empathicVoice/types/ResumeAssistantMessage.js +1 -1
- package/serialization/resources/empathicVoice/types/ReturnConfig.d.ts +1 -1
- package/serialization/resources/empathicVoice/types/ReturnConfig.js +1 -1
- package/serialization/resources/empathicVoice/types/SessionSettings.d.ts +8 -8
- package/serialization/resources/empathicVoice/types/SessionSettings.js +8 -8
- package/serialization/resources/empathicVoice/types/Tool.d.ts +3 -3
- package/serialization/resources/empathicVoice/types/Tool.js +3 -3
- package/serialization/resources/empathicVoice/types/ToolCallMessage.d.ts +3 -3
- package/serialization/resources/empathicVoice/types/ToolCallMessage.js +3 -3
- package/serialization/resources/empathicVoice/types/ToolErrorMessage.d.ts +6 -6
- package/serialization/resources/empathicVoice/types/ToolErrorMessage.js +6 -6
- package/serialization/resources/empathicVoice/types/ToolResponseMessage.d.ts +2 -2
- package/serialization/resources/empathicVoice/types/ToolResponseMessage.js +2 -2
- package/serialization/resources/empathicVoice/types/UserInput.d.ts +1 -1
- package/serialization/resources/empathicVoice/types/UserInput.js +1 -1
- package/serialization/resources/empathicVoice/types/UserInterruption.d.ts +1 -1
- package/serialization/resources/empathicVoice/types/UserInterruption.js +1 -1
- package/serialization/resources/empathicVoice/types/UserMessage.d.ts +3 -3
- package/serialization/resources/empathicVoice/types/UserMessage.js +3 -3
- package/serialization/resources/empathicVoice/types/WebSocketError.d.ts +3 -3
- package/serialization/resources/empathicVoice/types/WebSocketError.js +3 -3
- package/serialization/resources/empathicVoice/types/WebhookEventChatEnded.d.ts +4 -4
- package/serialization/resources/empathicVoice/types/WebhookEventChatEnded.js +4 -4
- package/serialization/resources/empathicVoice/types/WebhookEventChatStarted.d.ts +3 -3
- package/serialization/resources/empathicVoice/types/WebhookEventChatStarted.js +3 -3
- package/serialization/resources/empathicVoice/types/index.d.ts +16 -16
- package/serialization/resources/empathicVoice/types/index.js +16 -16
- package/serialization/resources/index.d.ts +1 -1
- package/serialization/resources/index.js +2 -2
- package/serialization/resources/tts/types/OctaveVersion.d.ts +10 -0
- package/serialization/resources/tts/types/OctaveVersion.js +41 -0
- package/serialization/resources/tts/types/PostedTts.d.ts +5 -3
- package/serialization/resources/tts/types/PostedTts.js +5 -3
- package/serialization/resources/tts/types/PostedUtterance.d.ts +2 -2
- package/serialization/resources/tts/types/PostedUtterance.js +2 -2
- package/serialization/resources/tts/types/ReturnGeneration.d.ts +3 -3
- package/serialization/resources/tts/types/ReturnGeneration.js +3 -3
- package/serialization/resources/tts/types/ReturnTts.d.ts +1 -1
- package/serialization/resources/tts/types/ReturnTts.js +1 -1
- package/serialization/resources/tts/types/Snippet.d.ts +3 -3
- package/serialization/resources/tts/types/Snippet.js +3 -3
- package/serialization/resources/tts/types/SnippetAudioChunk.d.ts +7 -6
- package/serialization/resources/tts/types/SnippetAudioChunk.js +7 -6
- package/serialization/resources/tts/types/index.d.ts +1 -0
- package/serialization/resources/tts/types/index.js +1 -0
- package/version.d.ts +1 -1
- package/version.js +1 -1
- package/wrapper/index.d.ts +1 -1
- package/wrapper/index.js +53 -3
package/api/resources/index.d.ts
CHANGED
package/api/resources/index.js
CHANGED
@@ -33,7 +33,7 @@ var __importStar = (this && this.__importStar) || (function () {
     };
 })();
 Object.defineProperty(exports, "__esModule", { value: true });
-exports.expressionMeasurement = exports.
-exports.empathicVoice = __importStar(require("./empathicVoice"));
+exports.expressionMeasurement = exports.empathicVoice = exports.tts = void 0;
 exports.tts = __importStar(require("./tts"));
+exports.empathicVoice = __importStar(require("./empathicVoice"));
 exports.expressionMeasurement = __importStar(require("./expressionMeasurement"));
package/api/resources/tts/client/Client.d.ts
CHANGED

@@ -70,6 +70,12 @@ export declare class Tts {
      */
     synthesizeFile(request: Hume.tts.PostedTts, requestOptions?: Tts.RequestOptions): core.HttpResponsePromise<stream.Readable>;
     private __synthesizeFile;
+    /**
+     * Streams synthesized speech using the specified voice. If no voice is provided, a novel voice will be generated dynamically. Optionally, additional context can be included to influence the speech's style and prosody.
+     * @throws {@link Hume.tts.UnprocessableEntityError}
+     */
+    synthesizeFileStreaming(request: Hume.tts.PostedTts, requestOptions?: Tts.RequestOptions): core.HttpResponsePromise<stream.Readable>;
+    private __synthesizeFileStreaming;
     /**
      * Streams synthesized speech using the specified voice. If no voice is provided, a novel voice will be generated dynamically. Optionally, additional context can be included to influence the speech's style and prosody.
      *
@@ -77,12 +83,6 @@ export declare class Tts {
      */
     synthesizeJsonStreaming(request: Hume.tts.PostedTts, requestOptions?: Tts.RequestOptions): core.HttpResponsePromise<core.Stream<Hume.tts.SnippetAudioChunk>>;
     private __synthesizeJsonStreaming;
-    /**
-     * Streams synthesized speech using the specified voice. If no voice is provided, a novel voice will be generated dynamically. Optionally, additional context can be included to influence the speech's style and prosody.
-     * @throws {@link Hume.tts.UnprocessableEntityError}
-     */
-    synthesizeFileStreaming(request: Hume.tts.PostedTts, requestOptions?: Tts.RequestOptions): core.HttpResponsePromise<stream.Readable>;
-    private __synthesizeFileStreaming;
     protected _getCustomAuthorizationHeaders(): Promise<{
         "X-Hume-Api-Key": string | undefined;
     }>;
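The reordering above accompanies the functional addition in this release: a new `synthesizeFileStreaming` method that POSTs to `v0/tts/stream/file` and resolves to a raw `stream.Readable` rather than a parsed chunk stream. A minimal usage sketch (the client setup, env var, and output filename are illustrative assumptions, not part of the diff):

```ts
import * as fs from "node:fs";
import { HumeClient } from "hume";

const hume = new HumeClient({ apiKey: process.env.HUME_API_KEY });

// Sketch: pipe the streamed audio bytes straight to disk.
async function streamToFile(): Promise<void> {
    const audio = await hume.tts.synthesizeFileStreaming({
        utterances: [{ text: "Hello from Octave." }],
    });
    audio.pipe(fs.createWriteStream("speech.mp3")); // raw audio bytes, not JSON chunks
}
```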
package/api/resources/tts/client/Client.js
CHANGED

@@ -218,47 +218,28 @@ class Tts {
     }
     /**
      * Streams synthesized speech using the specified voice. If no voice is provided, a novel voice will be generated dynamically. Optionally, additional context can be included to influence the speech's style and prosody.
-     *
-     * The response is a stream of JSON objects including audio encoded in base64.
+     * @throws {@link Hume.tts.UnprocessableEntityError}
      */
-
-        return core.HttpResponsePromise.fromPromise(this.
+    synthesizeFileStreaming(request, requestOptions) {
+        return core.HttpResponsePromise.fromPromise(this.__synthesizeFileStreaming(request, requestOptions));
     }
-
+    __synthesizeFileStreaming(request, requestOptions) {
         return __awaiter(this, void 0, void 0, function* () {
             var _a, _b, _c, _d;
             const _response = yield ((_a = this._options.fetcher) !== null && _a !== void 0 ? _a : core.fetcher)({
-                url: (0, url_join_1.default)((_c = (_b = (yield core.Supplier.get(this._options.baseUrl))) !== null && _b !== void 0 ? _b : (yield core.Supplier.get(this._options.environment))) !== null && _c !== void 0 ? _c : environments.HumeEnvironment.Production, "v0/tts/stream/
+                url: (0, url_join_1.default)((_c = (_b = (yield core.Supplier.get(this._options.baseUrl))) !== null && _b !== void 0 ? _b : (yield core.Supplier.get(this._options.environment))) !== null && _c !== void 0 ? _c : environments.HumeEnvironment.Production, "v0/tts/stream/file"),
                 method: "POST",
                 headers: (0, headers_js_1.mergeHeaders)((_d = this._options) === null || _d === void 0 ? void 0 : _d.headers, (0, headers_js_1.mergeOnlyDefinedHeaders)(Object.assign({}, (yield this._getCustomAuthorizationHeaders()))), requestOptions === null || requestOptions === void 0 ? void 0 : requestOptions.headers),
                 contentType: "application/json",
                 requestType: "json",
                 body: serializers.tts.PostedTts.jsonOrThrow(request, { unrecognizedObjectKeys: "strip" }),
-                responseType: "
+                responseType: "streaming",
                 timeoutMs: (requestOptions === null || requestOptions === void 0 ? void 0 : requestOptions.timeoutInSeconds) != null ? requestOptions.timeoutInSeconds * 1000 : 60000,
                 maxRetries: requestOptions === null || requestOptions === void 0 ? void 0 : requestOptions.maxRetries,
                 abortSignal: requestOptions === null || requestOptions === void 0 ? void 0 : requestOptions.abortSignal,
             });
             if (_response.ok) {
-                return {
-                    data: new core.Stream({
-                        stream: _response.body,
-                        parse: (data) => __awaiter(this, void 0, void 0, function* () {
-                            return serializers.tts.SnippetAudioChunk.parseOrThrow(data, {
-                                unrecognizedObjectKeys: "passthrough",
-                                allowUnrecognizedUnionMembers: true,
-                                allowUnrecognizedEnumValues: true,
-                                breadcrumbsPrefix: ["response"],
-                            });
-                        }),
-                        signal: requestOptions === null || requestOptions === void 0 ? void 0 : requestOptions.abortSignal,
-                        eventShape: {
-                            type: "json",
-                            messageTerminator: "\n",
-                        },
-                    }),
-                    rawResponse: _response.rawResponse,
-                };
+                return { data: _response.body, rawResponse: _response.rawResponse };
             }
             if (_response.error.reason === "status-code") {
                 switch (_response.error.statusCode) {
@@ -285,7 +266,7 @@ class Tts {
                         rawResponse: _response.rawResponse,
                     });
                 case "timeout":
-                    throw new errors.HumeTimeoutError("Timeout exceeded when calling POST /v0/tts/stream/
+                    throw new errors.HumeTimeoutError("Timeout exceeded when calling POST /v0/tts/stream/file.");
                 case "unknown":
                     throw new errors.HumeError({
                         message: _response.error.errorMessage,
@@ -296,28 +277,47 @@ class Tts {
     }
     /**
      * Streams synthesized speech using the specified voice. If no voice is provided, a novel voice will be generated dynamically. Optionally, additional context can be included to influence the speech's style and prosody.
-     *
+     *
+     * The response is a stream of JSON objects including audio encoded in base64.
      */
-
-        return core.HttpResponsePromise.fromPromise(this.
+    synthesizeJsonStreaming(request, requestOptions) {
+        return core.HttpResponsePromise.fromPromise(this.__synthesizeJsonStreaming(request, requestOptions));
     }
-
+    __synthesizeJsonStreaming(request, requestOptions) {
         return __awaiter(this, void 0, void 0, function* () {
             var _a, _b, _c, _d;
             const _response = yield ((_a = this._options.fetcher) !== null && _a !== void 0 ? _a : core.fetcher)({
-                url: (0, url_join_1.default)((_c = (_b = (yield core.Supplier.get(this._options.baseUrl))) !== null && _b !== void 0 ? _b : (yield core.Supplier.get(this._options.environment))) !== null && _c !== void 0 ? _c : environments.HumeEnvironment.Production, "v0/tts/stream/
+                url: (0, url_join_1.default)((_c = (_b = (yield core.Supplier.get(this._options.baseUrl))) !== null && _b !== void 0 ? _b : (yield core.Supplier.get(this._options.environment))) !== null && _c !== void 0 ? _c : environments.HumeEnvironment.Production, "v0/tts/stream/json"),
                 method: "POST",
                 headers: (0, headers_js_1.mergeHeaders)((_d = this._options) === null || _d === void 0 ? void 0 : _d.headers, (0, headers_js_1.mergeOnlyDefinedHeaders)(Object.assign({}, (yield this._getCustomAuthorizationHeaders()))), requestOptions === null || requestOptions === void 0 ? void 0 : requestOptions.headers),
                 contentType: "application/json",
                 requestType: "json",
                 body: serializers.tts.PostedTts.jsonOrThrow(request, { unrecognizedObjectKeys: "strip" }),
-                responseType: "
+                responseType: "sse",
                 timeoutMs: (requestOptions === null || requestOptions === void 0 ? void 0 : requestOptions.timeoutInSeconds) != null ? requestOptions.timeoutInSeconds * 1000 : 60000,
                 maxRetries: requestOptions === null || requestOptions === void 0 ? void 0 : requestOptions.maxRetries,
                 abortSignal: requestOptions === null || requestOptions === void 0 ? void 0 : requestOptions.abortSignal,
             });
             if (_response.ok) {
-                return {
+                return {
+                    data: new core.Stream({
+                        stream: _response.body,
+                        parse: (data) => __awaiter(this, void 0, void 0, function* () {
+                            return serializers.tts.SnippetAudioChunk.parseOrThrow(data, {
+                                unrecognizedObjectKeys: "passthrough",
+                                allowUnrecognizedUnionMembers: true,
+                                allowUnrecognizedEnumValues: true,
+                                breadcrumbsPrefix: ["response"],
+                            });
+                        }),
+                        signal: requestOptions === null || requestOptions === void 0 ? void 0 : requestOptions.abortSignal,
+                        eventShape: {
+                            type: "json",
+                            messageTerminator: "\n",
+                        },
+                    }),
+                    rawResponse: _response.rawResponse,
+                };
             }
             if (_response.error.reason === "status-code") {
                 switch (_response.error.statusCode) {
@@ -344,7 +344,7 @@ class Tts {
                         rawResponse: _response.rawResponse,
                    });
                 case "timeout":
-                    throw new errors.HumeTimeoutError("Timeout exceeded when calling POST /v0/tts/stream/
+                    throw new errors.HumeTimeoutError("Timeout exceeded when calling POST /v0/tts/stream/json.");
                 case "unknown":
                     throw new errors.HumeError({
                         message: _response.error.errorMessage,
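Net effect: `synthesizeJsonStreaming` keeps the `core.Stream`-wrapped, newline-delimited JSON parsing (now requested with `responseType: "sse"`), while the new `synthesizeFileStreaming` hands back the raw body. A consumption sketch for the JSON variant, reusing the client from the earlier sketch (the base64 decode is caller-side, and async iteration over `core.Stream` is assumed per the usual Fern-generated SDK behavior):

```ts
// Sketch: iterate parsed Hume.tts.SnippetAudioChunk values as they arrive.
async function streamChunks(): Promise<void> {
    const chunks = await hume.tts.synthesizeJsonStreaming({
        utterances: [{ text: "Streaming example." }],
    });
    for await (const chunk of chunks) {
        const audioBytes = Buffer.from(chunk.audio, "base64"); // per-chunk base64 audio
        console.log(`chunk ${chunk.chunkIndex}: ${audioBytes.length} bytes (last: ${chunk.isLastChunk})`);
    }
}
```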
package/api/resources/tts/types/PostedTts.d.ts
CHANGED

@@ -5,16 +5,10 @@ import * as Hume from "../../../index";
 export interface PostedTts {
     /** Utterances to use as context for generating consistent speech style and prosody across multiple requests. These will not be converted to speech output. */
     context?: Hume.tts.PostedContext;
-    /**
-     * A list of **Utterances** to be converted to speech output.
-     *
-     * An **Utterance** is a unit of input for [Octave](/docs/text-to-speech-tts/overview), and includes input `text`, an optional `description` to serve as the prompt for how the speech should be delivered, an optional `voice` specification, and additional controls to guide delivery for `speed` and `trailing_silence`.
-     */
-    utterances: Hume.tts.PostedUtterance[];
-    /** Number of generations of the audio to produce. */
-    numGenerations?: number;
     /** Specifies the output audio file format. */
     format?: Hume.tts.Format;
+    /** Number of generations of the audio to produce. */
+    numGenerations?: number;
     /**
      * Controls how audio output is segmented in the response.
      *
@@ -27,6 +21,13 @@ export interface PostedTts {
     splitUtterances?: boolean;
     /** If enabled, the audio for all the chunks of a generation, once concatenated together, will constitute a single audio file. Otherwise, if disabled, each chunk's audio will be its own audio file, each with its own headers (if applicable). */
     stripHeaders?: boolean;
+    /**
+     * A list of **Utterances** to be converted to speech output.
+     *
+     * An **Utterance** is a unit of input for [Octave](/docs/text-to-speech-tts/overview), and includes input `text`, an optional `description` to serve as the prompt for how the speech should be delivered, an optional `voice` specification, and additional controls to guide delivery for `speed` and `trailing_silence`.
+     */
+    utterances: Hume.tts.PostedUtterance[];
+    version?: Hume.tts.OctaveVersion;
     /**
      * Enables ultra-low latency streaming, significantly reducing the time until the first audio chunk is received. Recommended for real-time applications requiring immediate audio playback. For further details, see our documentation on [instant mode](/docs/text-to-speech-tts/overview#ultra-low-latency-streaming-instant-mode).
      * - A [voice](/reference/text-to-speech-tts/synthesize-json-streaming#request.body.utterances.voice) must be specified when instant mode is enabled. Dynamic voice generation is not supported with this mode.
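Aside from the alphabetized field order, the substantive change here is the new optional `version` field typed as the freshly added `Hume.tts.OctaveVersion`. The diff does not show the enum's members, so the literal below is a placeholder cast; the utterance fields mirror the reordered `PostedUtterance` interface shown next:

```ts
import { Hume } from "hume";

// Sketch: a PostedTts request pinning the Octave model version.
// "2" is an assumed value; see OctaveVersion.d.ts for the actual members.
const request: Hume.tts.PostedTts = {
    numGenerations: 1,
    utterances: [
        { text: "Versioned synthesis.", description: "calm, measured", speed: 1.0, trailingSilence: 0.5 },
    ],
    version: "2" as Hume.tts.OctaveVersion,
};
```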
package/api/resources/tts/types/PostedUtterance.d.ts
CHANGED

@@ -3,8 +3,6 @@
  */
 import * as Hume from "../../../index";
 export interface PostedUtterance {
-    /** The input text to be synthesized into speech. */
-    text: string;
     /**
      * Natural language instructions describing how the synthesized speech should sound, including but not limited to tone, intonation, pacing, and accent.
      *
@@ -13,14 +11,16 @@ export interface PostedUtterance {
      * - **Voice not specified**: the description will serve as a voice prompt for generating a voice. See our [prompting guide](/docs/text-to-speech-tts/prompting) for design tips.
      */
     description?: string;
+    /** Speed multiplier for the synthesized speech. Extreme values below 0.75 and above 1.5 may sometimes cause instability to the generated output. */
+    speed?: number;
+    /** The input text to be synthesized into speech. */
+    text: string;
+    /** Duration of trailing silence (in seconds) to add to this utterance */
+    trailingSilence?: number;
     /**
      * The `name` or `id` associated with a **Voice** from the **Voice Library** to be used as the speaker for this and all subsequent `utterances`, until the `voice` field is updated again.
      *
      * See our [voices guide](/docs/text-to-speech-tts/voices) for more details on generating and specifying **Voices**.
      */
     voice?: Hume.tts.PostedUtteranceVoice;
-    /** Speed multiplier for the synthesized speech. Extreme values below 0.75 and above 1.5 may sometimes cause instability to the generated output. */
-    speed?: number;
-    /** Duration of trailing silence (in seconds) to add to this utterance */
-    trailingSilence?: number;
 }
package/api/resources/tts/types/ReturnGeneration.d.ts
CHANGED

@@ -3,15 +3,15 @@
  */
 import * as Hume from "../../../index";
 export interface ReturnGeneration {
-    /**
-
+    /** The generated audio output in the requested format, encoded as a base64 string. */
+    audio: string;
     /** Duration of the generated audio in seconds. */
     duration: number;
+    encoding: Hume.tts.AudioEncoding;
     /** Size of the generated audio in bytes. */
     fileSize: number;
-
-
-    audio: string;
+    /** A unique ID associated with this TTS generation that can be used as context for generating consistent speech style and prosody across multiple requests. */
+    generationId: string;
     /** A list of snippet groups where each group corresponds to an utterance in the request. Each group contains segmented snippets that represent the original utterance divided into more natural-sounding units optimized for speech delivery. */
     snippets: Hume.tts.Snippet[][];
 }
package/api/resources/tts/types/ReturnTts.d.ts
CHANGED

@@ -3,7 +3,7 @@
  */
 import * as Hume from "../../../index";
 export interface ReturnTts {
+    generations: Hume.tts.ReturnGeneration[];
     /** A unique ID associated with this request for tracking and troubleshooting. Use this ID when contacting [support](/support) for troubleshooting assistance. */
     requestId?: string;
-    generations: Hume.tts.ReturnGeneration[];
 }
package/api/resources/tts/types/Snippet.d.ts
CHANGED

@@ -2,16 +2,16 @@
  * This file was auto-generated by Fern from our API Definition.
  */
 export interface Snippet {
+    /** The segmented audio output in the requested format, encoded as a base64 string. */
+    audio: string;
+    /** The generation ID this snippet corresponds to. */
+    generationId: string;
     /** A unique ID associated with this **Snippet**. */
     id: string;
     /** The text for this **Snippet**. */
     text: string;
-    /** The generation ID this snippet corresponds to. */
-    generationId: string;
-    /** The index of the utterance in the request this snippet corresponds to. */
-    utteranceIndex?: number;
     /** The transcribed text of the generated audio. It is only present if `instant_mode` is set to `false`. */
     transcribedText?: string;
-    /** The
-
+    /** The index of the utterance in the request this snippet corresponds to. */
+    utteranceIndex?: number;
 }
package/api/resources/tts/types/SnippetAudioChunk.d.ts
CHANGED

@@ -6,25 +6,26 @@ import * as Hume from "../../../index";
  * Metadata for a chunk of generated audio.
  */
 export interface SnippetAudioChunk {
-    /**
-
+    /** The generated audio output chunk in the requested format. */
+    audio: string;
+    /** The generated audio output format. */
+    audioFormat: Hume.tts.AudioFormatType;
+    /** The index of the audio chunk in the snippet. */
+    chunkIndex: number;
     /** The generation ID of the parent snippet that this chunk corresponds to. */
     generationId: string;
+    /** Whether or not this is the last chunk streamed back from the decoder for one input snippet. */
+    isLastChunk: boolean;
+    /** ID of the initiating request. */
+    requestId: string;
+    snippet?: Hume.tts.Snippet;
     /** The ID of the parent snippet that this chunk corresponds to. */
     snippetId: string;
     /** The text of the parent snippet that this chunk corresponds to. */
     text: string;
     /** The transcribed text of the generated audio of the parent snippet that this chunk corresponds to. It is only present if `instant_mode` is set to `false`. */
     transcribedText?: string;
-
-    chunkIndex: number;
-    /** The generated audio output chunk in the requested format. */
-    audio: string;
-    /** The generated audio output format. */
-    audioFormat: Hume.tts.AudioFormatType;
-    /** Whether or not this is the last chunk streamed back from the decoder for one input snippet. */
-    isLastChunk: boolean;
+    type?: "audio";
     /** The index of the utterance in the request that the parent snippet of this chunk corresponds to. */
     utteranceIndex?: number;
-    snippet?: Hume.tts.Snippet;
 }
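Beyond the alphabetical reordering, the chunk gains an optional literal discriminant, `type?: "audio"`. A small narrowing sketch for consumers that want to stay forward-compatible with other event shapes (the "treat a missing `type` as audio" policy is an assumption, not documented behavior):

```ts
// Sketch: accept chunks from both older servers (no `type`) and newer ones.
function isAudioChunk(chunk: Hume.tts.SnippetAudioChunk): boolean {
    return chunk.type === undefined || chunk.type === "audio";
}
```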
package/api/resources/tts/types/index.js
CHANGED

@@ -31,6 +31,7 @@ __exportStar(require("./PostedContext"), exports);
 __exportStar(require("./Format"), exports);
 __exportStar(require("./PostedTts"), exports);
 __exportStar(require("./ReturnTts"), exports);
+__exportStar(require("./OctaveVersion"), exports);
 __exportStar(require("./ReturnVoice"), exports);
 __exportStar(require("./FormatPcm"), exports);
 __exportStar(require("./Snippet"), exports);
package/dist/api/resources/empathicVoice/types/AssistantEnd.d.ts
CHANGED

@@ -5,12 +5,12 @@
  * When provided, the output is an assistant end message.
  */
 export interface AssistantEnd {
+    /** Used to manage conversational state, correlate frontend and backend data, and persist conversations across EVI sessions. */
+    customSessionId?: string;
     /**
      * The type of message sent through the socket; for an Assistant End message, this must be `assistant_end`.
      *
      * This message indicates the conclusion of the assistant's response, signaling that the assistant has finished speaking for the current conversational turn.
      */
     type: "assistant_end";
-    /** Used to manage conversational state, correlate frontend and backend data, and persist conversations across EVI sessions. */
-    customSessionId?: string;
 }
package/dist/api/resources/empathicVoice/types/AssistantInput.d.ts
CHANGED

@@ -5,8 +5,6 @@
  * When provided, the input is spoken by EVI.
  */
 export interface AssistantInput {
-    /** The type of message sent through the socket; must be `assistant_input` for our server to correctly identify and process it as an Assistant Input message. */
-    type: "assistant_input";
     /** Used to manage conversational state, correlate frontend and backend data, and persist conversations across EVI sessions. */
     customSessionId?: string;
     /**
@@ -15,4 +13,6 @@ export interface AssistantInput {
      * EVI uses this text to generate spoken audio using our proprietary expressive text-to-speech model. Our model adds appropriate emotional inflections and tones to the text based on the user's expressions and the context of the conversation. The synthesized audio is streamed back to the user as an [Assistant Message](/reference/speech-to-speech-evi/chat#receive.AssistantMessage).
      */
     text: string;
+    /** The type of message sent through the socket; must be `assistant_input` for our server to correctly identify and process it as an Assistant Input message. */
+    type: "assistant_input";
 }
package/dist/api/resources/empathicVoice/types/AssistantMessage.d.ts
CHANGED

@@ -6,20 +6,20 @@ import * as Hume from "../../../index";
 * When provided, the output is an assistant message.
 */
 export interface AssistantMessage {
-    /**
-     * The type of message sent through the socket; for an Assistant Message, this must be `assistant_message`.
-     *
-     * This message contains both a transcript of the assistant's response and the expression measurement predictions of the assistant's audio output.
-     */
-    type: "assistant_message";
     /** Used to manage conversational state, correlate frontend and backend data, and persist conversations across EVI sessions. */
     customSessionId?: string;
+    /** Indicates if this message was inserted into the conversation as text from an [Assistant Input message](/reference/speech-to-speech-evi/chat#send.AssistantInput.text). */
+    fromText: boolean;
     /** ID of the assistant message. Allows the Assistant Message to be tracked and referenced. */
     id?: string;
     /** Transcript of the message. */
     message: Hume.empathicVoice.ChatMessage;
     /** Inference model results. */
     models: Hume.empathicVoice.Inference;
-    /**
-
+    /**
+     * The type of message sent through the socket; for an Assistant Message, this must be `assistant_message`.
+     *
+     * This message contains both a transcript of the assistant's response and the expression measurement predictions of the assistant's audio output.
+     */
+    type: "assistant_message";
 }
package/dist/api/resources/empathicVoice/types/AssistantProsody.d.ts
CHANGED

@@ -6,16 +6,16 @@ import * as Hume from "../../../index";
 * When provided, the output is an Assistant Prosody message.
 */
 export interface AssistantProsody {
+    /** Used to manage conversational state, correlate frontend and backend data, and persist conversations across EVI sessions. */
+    customSessionId?: string;
+    /** Unique identifier for the segment. */
+    id?: string;
+    /** Inference model results. */
+    models: Hume.empathicVoice.Inference;
     /**
      * The type of message sent through the socket; for an Assistant Prosody message, this must be `assistant_PROSODY`.
      *
      * This message the expression measurement predictions of the assistant's audio output.
      */
     type: "assistant_prosody";
-    /** Used to manage conversational state, correlate frontend and backend data, and persist conversations across EVI sessions. */
-    customSessionId?: string;
-    /** Inference model results. */
-    models: Hume.empathicVoice.Inference;
-    /** Unique identifier for the segment. */
-    id?: string;
 }
package/dist/api/resources/empathicVoice/types/AudioConfiguration.d.ts
CHANGED

@@ -3,10 +3,10 @@
 */
 import * as Hume from "../../../index";
 export interface AudioConfiguration {
-    /** Encoding format of the audio input, such as `linear16`. */
-    encoding: Hume.empathicVoice.Encoding;
     /** Number of audio channels. */
     channels: number;
+    /** Encoding format of the audio input, such as `linear16`. */
+    encoding: Hume.empathicVoice.Encoding;
     /** Audio sample rate. Number of samples per second in the audio input, measured in Hertz. */
     sampleRate: number;
 }
package/dist/api/resources/empathicVoice/types/AudioInput.d.ts
CHANGED

@@ -5,12 +5,6 @@
 * When provided, the input is audio.
 */
 export interface AudioInput {
-    /**
-     * The type of message sent through the socket; must be `audio_input` for our server to correctly identify and process it as an Audio Input message.
-     *
-     * This message is used for sending audio input data to EVI for processing and expression measurement. Audio data should be sent as a continuous stream, encoded in Base64.
-     */
-    type: "audio_input";
     /** Used to manage conversational state, correlate frontend and backend data, and persist conversations across EVI sessions. */
     customSessionId?: string;
     /**
@@ -23,4 +17,10 @@ export interface AudioInput {
      * Hume recommends streaming audio with a buffer window of 20 milliseconds (ms), or 100 milliseconds (ms) for web applications.
      */
     data: string;
+    /**
+     * The type of message sent through the socket; must be `audio_input` for our server to correctly identify and process it as an Audio Input message.
+     *
+     * This message is used for sending audio input data to EVI for processing and expression measurement. Audio data should be sent as a continuous stream, encoded in Base64.
+     */
+    type: "audio_input";
 }
package/dist/api/resources/empathicVoice/types/AudioOutput.d.ts
CHANGED

@@ -5,14 +5,14 @@
 * The type of message sent through the socket; for an Audio Output message, this must be `audio_output`.
 */
 export interface AudioOutput {
-    /** The type of message sent through the socket; for an Audio Output message, this must be `audio_output`. */
-    type: "audio_output";
     /** Used to manage conversational state, correlate frontend and backend data, and persist conversations across EVI sessions. */
     customSessionId?: string;
+    /** Base64 encoded audio output. This encoded audio is transmitted to the client, where it can be decoded and played back as part of the user interaction. */
+    data: string;
     /** ID of the audio output. Allows the Audio Output message to be tracked and referenced. */
     id: string;
     /** Index of the chunk of audio relative to the whole audio segment. */
     index: number;
-    /**
-
+    /** The type of message sent through the socket; for an Audio Output message, this must be `audio_output`. */
+    type: "audio_output";
 }
package/dist/api/resources/empathicVoice/types/BuiltinToolConfig.d.ts
CHANGED

@@ -3,7 +3,7 @@
 */
 import * as Hume from "../../../index";
 export interface BuiltinToolConfig {
-    name: Hume.empathicVoice.BuiltInTool;
     /** Optional text passed to the supplemental LLM if the tool call fails. The LLM then uses this text to generate a response back to the user, ensuring continuity in the conversation. */
     fallbackContent?: string;
+    name: Hume.empathicVoice.BuiltInTool;
 }
package/dist/api/resources/empathicVoice/types/ChatMessage.d.ts
CHANGED

@@ -3,10 +3,10 @@
 */
 import * as Hume from "../../../index";
 export interface ChatMessage {
-    /** Role of who is providing the message. */
-    role: Hume.empathicVoice.Role;
     /** Transcript of the message. */
     content?: string;
+    /** Role of who is providing the message. */
+    role: Hume.empathicVoice.Role;
     /** Function call name and arguments. */
     toolCall?: Hume.empathicVoice.ToolCallMessage;
     /** Function call response from client. */
package/dist/api/resources/empathicVoice/types/ChatMetadata.d.ts
CHANGED

@@ -5,14 +5,6 @@
 * When provided, the output is a chat metadata message.
 */
 export interface ChatMetadata {
-    /**
-     * The type of message sent through the socket; for a Chat Metadata message, this must be `chat_metadata`.
-     *
-     * The Chat Metadata message is the first message you receive after establishing a connection with EVI and contains important identifiers for the current Chat session.
-     */
-    type: "chat_metadata";
-    /** Used to manage conversational state, correlate frontend and backend data, and persist conversations across EVI sessions. */
-    customSessionId?: string;
     /**
      * ID of the Chat Group.
      *
@@ -23,6 +15,14 @@ export interface ChatMetadata {
     chatGroupId: string;
     /** ID of the Chat session. Allows the Chat session to be tracked and referenced. */
     chatId: string;
+    /** Used to manage conversational state, correlate frontend and backend data, and persist conversations across EVI sessions. */
+    customSessionId?: string;
     /** ID of the initiating request. */
     requestId?: string;
+    /**
+     * The type of message sent through the socket; for a Chat Metadata message, this must be `chat_metadata`.
+     *
+     * The Chat Metadata message is the first message you receive after establishing a connection with EVI and contains important identifiers for the current Chat session.
+     */
+    type: "chat_metadata";
 }
package/dist/api/resources/empathicVoice/types/Context.d.ts
CHANGED

@@ -3,6 +3,12 @@
 */
 import * as Hume from "../../../index";
 export interface Context {
+    /**
+     * The context to be injected into the conversation. Helps inform the LLM's response by providing relevant information about the ongoing conversation.
+     *
+     * This text will be appended to the end of [user_messages](/reference/speech-to-speech-evi/chat#receive.UserMessage.message.content) based on the chosen persistence level. For example, if you want to remind EVI of its role as a helpful weather assistant, the context you insert will be appended to the end of user messages as `{Context: You are a helpful weather assistant}`.
+     */
+    text: string;
     /**
      * The persistence level of the injected context. Specifies how long the injected context will remain active in the session.
      *
@@ -11,10 +17,4 @@ export interface Context {
      * - **Persistent**: Context that is applied to all subsequent assistant responses for the remainder of the Chat.
      */
     type?: Hume.empathicVoice.ContextType;
-    /**
-     * The context to be injected into the conversation. Helps inform the LLM's response by providing relevant information about the ongoing conversation.
-     *
-     * This text will be appended to the end of [user_messages](/reference/speech-to-speech-evi/chat#receive.UserMessage.message.content) based on the chosen persistence level. For example, if you want to remind EVI of its role as a helpful weather assistant, the context you insert will be appended to the end of user messages as `{Context: You are a helpful weather assistant}`.
-     */
-    text: string;
 }
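The doc comment above describes the injection mechanism: the `text` is appended to user messages for as long as the chosen persistence level keeps it active. A construction sketch using only the fields shown (the `"persistent"` literal is assumed to be a member of `ContextType` based on the "**Persistent**" bullet; verify against ContextType.d.ts):

```ts
// Sketch: a context injection applied to all subsequent assistant responses.
const context: Hume.empathicVoice.Context = {
    text: "You are a helpful weather assistant",
    type: "persistent" as Hume.empathicVoice.ContextType,
};
```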
package/dist/api/resources/empathicVoice/types/LanguageModelType.d.ts
CHANGED

@@ -1,7 +1,7 @@
 /**
 * This file was auto-generated by Fern from our API Definition.
 */
-export type LanguageModelType = "claude-3-7-sonnet-latest" | "claude-3-5-sonnet-latest" | "claude-3-5-haiku-latest" | "claude-3-5-sonnet-20240620" | "claude-3-opus-20240229" | "claude-3-sonnet-20240229" | "claude-3-haiku-20240307" | "claude-sonnet-4-20250514" | "us.anthropic.claude-3-5-haiku-20241022-v1:0" | "us.anthropic.claude-3-5-sonnet-20240620-v1:0" | "us.anthropic.claude-3-haiku-20240307-v1:0" | "gpt-oss-120b" | "qwen-3-235b-a22b" | "qwen-3-235b-a22b-instruct-2507" | "qwen-3-235b-a22b-thinking-2507" | "gemini-1.5-pro" | "gemini-1.5-flash" | "gemini-1.5-pro-002" | "gemini-1.5-flash-002" | "gemini-2.0-flash" | "gemini-2.5-flash" | "gemini-2.5-flash-preview-04-17" | "gpt-4-turbo" | "gpt-4-turbo-preview" | "gpt-3.5-turbo-0125" | "gpt-3.5-turbo" | "gpt-4o" | "gpt-4o-mini" | "gpt-4.1" | "gpt-5" | "gpt-5-mini" | "gpt-5-nano" | "gemma-7b-it" | "llama3-8b-8192" | "llama3-70b-8192" | "llama-3.1-70b-versatile" | "llama-3.3-70b-versatile" | "llama-3.1-8b-instant" | "moonshotai/kimi-k2-instruct" | "accounts/fireworks/models/mixtral-8x7b-instruct" | "accounts/fireworks/models/llama-v3p1-405b-instruct" | "accounts/fireworks/models/llama-v3p1-70b-instruct" | "accounts/fireworks/models/llama-v3p1-8b-instruct" | "sonar" | "sonar-pro" | "sambanova" | "DeepSeek-R1-Distill-Llama-70B" | "Llama-4-Maverick-17B-128E-Instruct" | "Qwen3-32B" | "ellm" | "custom-language-model" | "hume-evi-3-web-search";
+export type LanguageModelType = "claude-3-7-sonnet-latest" | "claude-3-5-sonnet-latest" | "claude-3-5-haiku-latest" | "claude-3-5-sonnet-20240620" | "claude-3-opus-20240229" | "claude-3-sonnet-20240229" | "claude-3-haiku-20240307" | "claude-sonnet-4-20250514" | "us.anthropic.claude-3-5-haiku-20241022-v1:0" | "us.anthropic.claude-3-5-sonnet-20240620-v1:0" | "us.anthropic.claude-3-haiku-20240307-v1:0" | "gpt-oss-120b" | "qwen-3-235b-a22b" | "qwen-3-235b-a22b-instruct-2507" | "qwen-3-235b-a22b-thinking-2507" | "gemini-1.5-pro" | "gemini-1.5-flash" | "gemini-1.5-pro-002" | "gemini-1.5-flash-002" | "gemini-2.0-flash" | "gemini-2.5-flash" | "gemini-2.5-flash-preview-04-17" | "gpt-4-turbo" | "gpt-4-turbo-preview" | "gpt-3.5-turbo-0125" | "gpt-3.5-turbo" | "gpt-4o" | "gpt-4o-mini" | "gpt-4.1" | "gpt-5" | "gpt-5-mini" | "gpt-5-nano" | "gpt-4o-priority" | "gpt-4o-mini-priority" | "gpt-4.1-priority" | "gpt-5-priority" | "gpt-5-mini-priority" | "gpt-5-nano-priority" | "gemma-7b-it" | "llama3-8b-8192" | "llama3-70b-8192" | "llama-3.1-70b-versatile" | "llama-3.3-70b-versatile" | "llama-3.1-8b-instant" | "moonshotai/kimi-k2-instruct" | "accounts/fireworks/models/mixtral-8x7b-instruct" | "accounts/fireworks/models/llama-v3p1-405b-instruct" | "accounts/fireworks/models/llama-v3p1-70b-instruct" | "accounts/fireworks/models/llama-v3p1-8b-instruct" | "sonar" | "sonar-pro" | "sambanova" | "DeepSeek-R1-Distill-Llama-70B" | "Llama-4-Maverick-17B-128E-Instruct" | "Qwen3-32B" | "ellm" | "custom-language-model" | "hume-evi-3-web-search";
 export declare const LanguageModelType: {
     readonly Claude37SonnetLatest: "claude-3-7-sonnet-latest";
     readonly Claude35SonnetLatest: "claude-3-5-sonnet-latest";
@@ -35,6 +35,12 @@ export declare const LanguageModelType: {
     readonly Gpt5: "gpt-5";
     readonly Gpt5Mini: "gpt-5-mini";
     readonly Gpt5Nano: "gpt-5-nano";
+    readonly Gpt4OPriority: "gpt-4o-priority";
+    readonly Gpt4OMiniPriority: "gpt-4o-mini-priority";
+    readonly Gpt41Priority: "gpt-4.1-priority";
+    readonly Gpt5Priority: "gpt-5-priority";
+    readonly Gpt5MiniPriority: "gpt-5-mini-priority";
+    readonly Gpt5NanoPriority: "gpt-5-nano-priority";
     readonly Gemma7BIt: "gemma-7b-it";
     readonly Llama38B8192: "llama3-8b-8192";
     readonly Llama370B8192: "llama3-70b-8192";