@huggingface/inference 2.6.6 → 2.7.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (129)
  1. package/README.md +126 -27
  2. package/dist/index.cjs +81 -17
  3. package/dist/index.js +79 -17
  4. package/dist/src/HfInference.d.ts +28 -0
  5. package/dist/src/HfInference.d.ts.map +1 -0
  6. package/dist/src/index.d.ts +5 -0
  7. package/dist/src/index.d.ts.map +1 -0
  8. package/dist/src/lib/InferenceOutputError.d.ts +4 -0
  9. package/dist/src/lib/InferenceOutputError.d.ts.map +1 -0
  10. package/dist/src/lib/getDefaultTask.d.ts +12 -0
  11. package/dist/src/lib/getDefaultTask.d.ts.map +1 -0
  12. package/dist/src/lib/isUrl.d.ts +2 -0
  13. package/dist/src/lib/isUrl.d.ts.map +1 -0
  14. package/dist/src/lib/makeRequestOptions.d.ts +18 -0
  15. package/dist/src/lib/makeRequestOptions.d.ts.map +1 -0
  16. package/dist/src/tasks/audio/audioClassification.d.ts +24 -0
  17. package/dist/src/tasks/audio/audioClassification.d.ts.map +1 -0
  18. package/dist/src/tasks/audio/audioToAudio.d.ts +28 -0
  19. package/dist/src/tasks/audio/audioToAudio.d.ts.map +1 -0
  20. package/dist/src/tasks/audio/automaticSpeechRecognition.d.ts +19 -0
  21. package/dist/src/tasks/audio/automaticSpeechRecognition.d.ts.map +1 -0
  22. package/dist/src/tasks/audio/textToSpeech.d.ts +14 -0
  23. package/dist/src/tasks/audio/textToSpeech.d.ts.map +1 -0
  24. package/dist/src/tasks/custom/request.d.ts +13 -0
  25. package/dist/src/tasks/custom/request.d.ts.map +1 -0
  26. package/dist/src/tasks/custom/streamingRequest.d.ts +13 -0
  27. package/dist/src/tasks/custom/streamingRequest.d.ts.map +1 -0
  28. package/dist/src/tasks/cv/imageClassification.d.ts +24 -0
  29. package/dist/src/tasks/cv/imageClassification.d.ts.map +1 -0
  30. package/dist/src/tasks/cv/imageSegmentation.d.ts +28 -0
  31. package/dist/src/tasks/cv/imageSegmentation.d.ts.map +1 -0
  32. package/dist/src/tasks/cv/imageToImage.d.ts +55 -0
  33. package/dist/src/tasks/cv/imageToImage.d.ts.map +1 -0
  34. package/dist/src/tasks/cv/imageToText.d.ts +18 -0
  35. package/dist/src/tasks/cv/imageToText.d.ts.map +1 -0
  36. package/dist/src/tasks/cv/objectDetection.d.ts +33 -0
  37. package/dist/src/tasks/cv/objectDetection.d.ts.map +1 -0
  38. package/dist/src/tasks/cv/textToImage.d.ts +36 -0
  39. package/dist/src/tasks/cv/textToImage.d.ts.map +1 -0
  40. package/dist/src/tasks/cv/zeroShotImageClassification.d.ts +26 -0
  41. package/dist/src/tasks/cv/zeroShotImageClassification.d.ts.map +1 -0
  42. package/dist/src/tasks/index.d.ts +32 -0
  43. package/dist/src/tasks/index.d.ts.map +1 -0
  44. package/dist/src/tasks/multimodal/documentQuestionAnswering.d.ts +35 -0
  45. package/dist/src/tasks/multimodal/documentQuestionAnswering.d.ts.map +1 -0
  46. package/dist/src/tasks/multimodal/visualQuestionAnswering.d.ts +27 -0
  47. package/dist/src/tasks/multimodal/visualQuestionAnswering.d.ts.map +1 -0
  48. package/dist/src/tasks/nlp/chatCompletion.d.ts +7 -0
  49. package/dist/src/tasks/nlp/chatCompletion.d.ts.map +1 -0
  50. package/dist/src/tasks/nlp/chatCompletionStream.d.ts +7 -0
  51. package/dist/src/tasks/nlp/chatCompletionStream.d.ts.map +1 -0
  52. package/dist/src/tasks/nlp/featureExtraction.d.ts +19 -0
  53. package/dist/src/tasks/nlp/featureExtraction.d.ts.map +1 -0
  54. package/dist/src/tasks/nlp/fillMask.d.ts +27 -0
  55. package/dist/src/tasks/nlp/fillMask.d.ts.map +1 -0
  56. package/dist/src/tasks/nlp/questionAnswering.d.ts +30 -0
  57. package/dist/src/tasks/nlp/questionAnswering.d.ts.map +1 -0
  58. package/dist/src/tasks/nlp/sentenceSimilarity.d.ts +19 -0
  59. package/dist/src/tasks/nlp/sentenceSimilarity.d.ts.map +1 -0
  60. package/dist/src/tasks/nlp/summarization.d.ts +48 -0
  61. package/dist/src/tasks/nlp/summarization.d.ts.map +1 -0
  62. package/dist/src/tasks/nlp/tableQuestionAnswering.d.ts +36 -0
  63. package/dist/src/tasks/nlp/tableQuestionAnswering.d.ts.map +1 -0
  64. package/dist/src/tasks/nlp/textClassification.d.ts +22 -0
  65. package/dist/src/tasks/nlp/textClassification.d.ts.map +1 -0
  66. package/dist/src/tasks/nlp/textGeneration.d.ts +8 -0
  67. package/dist/src/tasks/nlp/textGeneration.d.ts.map +1 -0
  68. package/dist/src/tasks/nlp/textGenerationStream.d.ts +81 -0
  69. package/dist/src/tasks/nlp/textGenerationStream.d.ts.map +1 -0
  70. package/dist/src/tasks/nlp/tokenClassification.d.ts +51 -0
  71. package/dist/src/tasks/nlp/tokenClassification.d.ts.map +1 -0
  72. package/dist/src/tasks/nlp/translation.d.ts +19 -0
  73. package/dist/src/tasks/nlp/translation.d.ts.map +1 -0
  74. package/dist/src/tasks/nlp/zeroShotClassification.d.ts +28 -0
  75. package/dist/src/tasks/nlp/zeroShotClassification.d.ts.map +1 -0
  76. package/dist/src/tasks/tabular/tabularClassification.d.ts +20 -0
  77. package/dist/src/tasks/tabular/tabularClassification.d.ts.map +1 -0
  78. package/dist/src/tasks/tabular/tabularRegression.d.ts +20 -0
  79. package/dist/src/tasks/tabular/tabularRegression.d.ts.map +1 -0
  80. package/dist/src/types.d.ts +69 -0
  81. package/dist/src/types.d.ts.map +1 -0
  82. package/dist/src/utils/base64FromBytes.d.ts +2 -0
  83. package/dist/src/utils/base64FromBytes.d.ts.map +1 -0
  84. package/dist/src/utils/distributive-omit.d.ts +9 -0
  85. package/dist/src/utils/distributive-omit.d.ts.map +1 -0
  86. package/dist/src/utils/isBackend.d.ts +2 -0
  87. package/dist/src/utils/isBackend.d.ts.map +1 -0
  88. package/dist/src/utils/isFrontend.d.ts +2 -0
  89. package/dist/src/utils/isFrontend.d.ts.map +1 -0
  90. package/dist/src/utils/omit.d.ts +5 -0
  91. package/dist/src/utils/omit.d.ts.map +1 -0
  92. package/dist/src/utils/pick.d.ts +5 -0
  93. package/dist/src/utils/pick.d.ts.map +1 -0
  94. package/dist/src/utils/toArray.d.ts +2 -0
  95. package/dist/src/utils/toArray.d.ts.map +1 -0
  96. package/dist/src/utils/typedInclude.d.ts +2 -0
  97. package/dist/src/utils/typedInclude.d.ts.map +1 -0
  98. package/dist/src/vendor/fetch-event-source/parse.d.ts +69 -0
  99. package/dist/src/vendor/fetch-event-source/parse.d.ts.map +1 -0
  100. package/dist/src/vendor/fetch-event-source/parse.spec.d.ts +2 -0
  101. package/dist/src/vendor/fetch-event-source/parse.spec.d.ts.map +1 -0
  102. package/dist/test/HfInference.spec.d.ts +2 -0
  103. package/dist/test/HfInference.spec.d.ts.map +1 -0
  104. package/dist/test/expect-closeto.d.ts +2 -0
  105. package/dist/test/expect-closeto.d.ts.map +1 -0
  106. package/dist/test/test-files.d.ts +2 -0
  107. package/dist/test/test-files.d.ts.map +1 -0
  108. package/dist/test/vcr.d.ts +2 -0
  109. package/dist/test/vcr.d.ts.map +1 -0
  110. package/package.json +9 -7
  111. package/src/HfInference.ts +7 -6
  112. package/src/lib/makeRequestOptions.ts +23 -18
  113. package/src/tasks/custom/request.ts +5 -0
  114. package/src/tasks/custom/streamingRequest.ts +8 -0
  115. package/src/tasks/cv/imageToImage.ts +1 -1
  116. package/src/tasks/cv/zeroShotImageClassification.ts +1 -1
  117. package/src/tasks/index.ts +2 -0
  118. package/src/tasks/multimodal/documentQuestionAnswering.ts +1 -1
  119. package/src/tasks/multimodal/visualQuestionAnswering.ts +1 -1
  120. package/src/tasks/nlp/chatCompletion.ts +32 -0
  121. package/src/tasks/nlp/chatCompletionStream.ts +17 -0
  122. package/src/tasks/nlp/textGeneration.ts +3 -1
  123. package/src/tasks/nlp/textGenerationStream.ts +2 -2
  124. package/src/types.ts +13 -2
  125. package/src/utils/base64FromBytes.ts +11 -0
  126. package/src/utils/{distributive-omit.d.ts → distributive-omit.ts} +0 -2
  127. package/src/utils/isBackend.ts +6 -0
  128. package/src/utils/isFrontend.ts +3 -0
  129. package/dist/index.d.ts +0 -1341
@@ -0,0 +1,69 @@
1
+ /**
2
+ This file is a part of fetch-event-source package (as of v2.0.1)
3
+ https://github.com/Azure/fetch-event-source/blob/v2.0.1/src/parse.ts
4
+
5
+ Full package can be used after it is made compatible with nodejs:
6
+ https://github.com/Azure/fetch-event-source/issues/20
7
+
8
+ Below is the fetch-event-source package license:
9
+
10
+ MIT License
11
+
12
+ Copyright (c) Microsoft Corporation.
13
+
14
+ Permission is hereby granted, free of charge, to any person obtaining a copy
15
+ of this software and associated documentation files (the "Software"), to deal
16
+ in the Software without restriction, including without limitation the rights
17
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
18
+ copies of the Software, and to permit persons to whom the Software is
19
+ furnished to do so, subject to the following conditions:
20
+
21
+ The above copyright notice and this permission notice shall be included in all
22
+ copies or substantial portions of the Software.
23
+
24
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
25
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
26
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
27
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
28
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
29
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
30
+ SOFTWARE
31
+
32
+ */
33
+ /**
34
+ * Represents a message sent in an event stream
35
+ * https://developer.mozilla.org/en-US/docs/Web/API/Server-sent_events/Using_server-sent_events#Event_stream_format
36
+ */
37
+ export interface EventSourceMessage {
38
+ /** The event ID to set the EventSource object's last event ID value. */
39
+ id: string;
40
+ /** A string identifying the type of event described. */
41
+ event: string;
42
+ /** The event data */
43
+ data: string;
44
+ /** The reconnection interval (in milliseconds) to wait before retrying the connection */
45
+ retry?: number;
46
+ }
47
+ /**
48
+ * Converts a ReadableStream into a callback pattern.
49
+ * @param stream The input ReadableStream.
50
+ * @param onChunk A function that will be called on each new byte chunk in the stream.
51
+ * @returns {Promise<void>} A promise that will be resolved when the stream closes.
52
+ */
53
+ export declare function getBytes(stream: ReadableStream<Uint8Array>, onChunk: (arr: Uint8Array) => void): Promise<void>;
54
+ /**
55
+ * Parses arbitary byte chunks into EventSource line buffers.
56
+ * Each line should be of the format "field: value" and ends with \r, \n, or \r\n.
57
+ * @param onLine A function that will be called on each new EventSource line.
58
+ * @returns A function that should be called for each incoming byte chunk.
59
+ */
60
+ export declare function getLines(onLine: (line: Uint8Array, fieldLength: number) => void): (arr: Uint8Array) => void;
61
+ /**
62
+ * Parses line buffers into EventSourceMessages.
63
+ * @param onId A function that will be called on each `id` field.
64
+ * @param onRetry A function that will be called on each `retry` field.
65
+ * @param onMessage A function that will be called on each message.
66
+ * @returns A function that should be called for each incoming line buffer.
67
+ */
68
+ export declare function getMessages(onId: (id: string) => void, onRetry: (retry: number) => void, onMessage?: (msg: EventSourceMessage) => void): (line: Uint8Array, fieldLength: number) => void;
69
+ //# sourceMappingURL=parse.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"parse.d.ts","sourceRoot":"","sources":["../../../../src/vendor/fetch-event-source/parse.ts"],"names":[],"mappings":"AAAA;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GA+BG;AAEH;;;GAGG;AACH,MAAM,WAAW,kBAAkB;IAC/B,wEAAwE;IACxE,EAAE,EAAE,MAAM,CAAC;IACX,wDAAwD;IACxD,KAAK,EAAE,MAAM,CAAC;IACd,qBAAqB;IACrB,IAAI,EAAE,MAAM,CAAC;IACb,yFAAyF;IACzF,KAAK,CAAC,EAAE,MAAM,CAAC;CAClB;AAED;;;;;GAKG;AACH,wBAAsB,QAAQ,CAAC,MAAM,EAAE,cAAc,CAAC,UAAU,CAAC,EAAE,OAAO,EAAE,CAAC,GAAG,EAAE,UAAU,KAAK,IAAI,iBAMpG;AASD;;;;;GAKG;AACH,wBAAgB,QAAQ,CAAC,MAAM,EAAE,CAAC,IAAI,EAAE,UAAU,EAAE,WAAW,EAAE,MAAM,KAAK,IAAI,SAO/C,UAAU,UA4D1C;AAED;;;;;;GAMG;AACH,wBAAgB,WAAW,CACvB,IAAI,EAAE,CAAC,EAAE,EAAE,MAAM,KAAK,IAAI,EAC1B,OAAO,EAAE,CAAC,KAAK,EAAE,MAAM,KAAK,IAAI,EAChC,SAAS,CAAC,EAAE,CAAC,GAAG,EAAE,kBAAkB,KAAK,IAAI,UAMhB,UAAU,eAAe,MAAM,UAmC/D"}
@@ -0,0 +1,2 @@
1
+ export {};
2
+ //# sourceMappingURL=parse.spec.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"parse.spec.d.ts","sourceRoot":"","sources":["../../../../src/vendor/fetch-event-source/parse.spec.ts"],"names":[],"mappings":""}
@@ -0,0 +1,2 @@
1
+ import "./vcr";
2
+ //# sourceMappingURL=HfInference.spec.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"HfInference.spec.d.ts","sourceRoot":"","sources":["../../test/HfInference.spec.ts"],"names":[],"mappings":"AAKA,OAAO,OAAO,CAAC"}
@@ -0,0 +1,2 @@
1
+ export {};
2
+ //# sourceMappingURL=expect-closeto.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"expect-closeto.d.ts","sourceRoot":"","sources":["../../test/expect-closeto.ts"],"names":[],"mappings":""}
@@ -0,0 +1,2 @@
1
+ export declare const readTestFile: (filename: string) => Uint8Array;
2
+ //# sourceMappingURL=test-files.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"test-files.d.ts","sourceRoot":"","sources":["../../test/test-files.ts"],"names":[],"mappings":"AAGA,eAAO,MAAM,YAAY,aAAc,MAAM,KAAG,UAK/C,CAAC"}
@@ -0,0 +1,2 @@
1
+ export {};
2
+ //# sourceMappingURL=vcr.d.ts.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"vcr.d.ts","sourceRoot":"","sources":["../../test/vcr.ts"],"names":[],"mappings":""}
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@huggingface/inference",
3
- "version": "2.6.6",
3
+ "version": "2.7.0",
4
4
  "packageManager": "pnpm@8.10.5",
5
5
  "license": "MIT",
6
6
  "author": "Tim Mikeladze <tim.mikeladze@gmail.com>",
@@ -29,23 +29,25 @@
29
29
  "src"
30
30
  ],
31
31
  "source": "src/index.ts",
32
- "types": "./dist/index.d.ts",
32
+ "types": "./dist/src/index.d.ts",
33
33
  "main": "./dist/index.cjs",
34
34
  "module": "./dist/index.js",
35
35
  "exports": {
36
- "types": "./dist/index.d.ts",
36
+ "types": "./dist/src/index.d.ts",
37
37
  "require": "./dist/index.cjs",
38
38
  "import": "./dist/index.js"
39
39
  },
40
40
  "type": "module",
41
+ "dependencies": {
42
+ "@huggingface/tasks": "^0.10.0"
43
+ },
41
44
  "devDependencies": {
42
- "@types/node": "18.13.0",
43
- "@huggingface/tasks": "^0.6.0"
45
+ "@types/node": "18.13.0"
44
46
  },
45
47
  "resolutions": {},
46
48
  "scripts": {
47
- "build": "tsup src/index.ts --format cjs,esm --clean && pnpm run dts",
48
- "dts": "tsx scripts/generate-dts.ts",
49
+ "build": "tsup src/index.ts --format cjs,esm --clean && tsc --emitDeclarationOnly --declaration",
50
+ "dts": "tsx scripts/generate-dts.ts && tsc --noEmit dist/index.d.ts",
49
51
  "lint": "eslint --quiet --fix --ext .cjs,.ts .",
50
52
  "lint:check": "eslint --ext .cjs,.ts .",
51
53
  "format": "prettier --write .",
@@ -2,6 +2,9 @@ import * as tasks from "./tasks";
2
2
  import type { Options, RequestArgs } from "./types";
3
3
  import type { DistributiveOmit } from "./utils/distributive-omit";
4
4
 
5
+ /* eslint-disable @typescript-eslint/no-empty-interface */
6
+ /* eslint-disable @typescript-eslint/no-unsafe-declaration-merging */
7
+
5
8
  type Task = typeof tasks;
6
9
 
7
10
  type TaskWithNoAccessToken = {
@@ -11,9 +14,9 @@ type TaskWithNoAccessToken = {
11
14
  ) => ReturnType<Task[key]>;
12
15
  };
13
16
 
14
- type TaskWithNoAccessTokenNoModel = {
17
+ type TaskWithNoAccessTokenNoEndpointUrl = {
15
18
  [key in keyof Task]: (
16
- args: DistributiveOmit<Parameters<Task[key]>[0], "accessToken" | "model">,
19
+ args: DistributiveOmit<Parameters<Task[key]>[0], "accessToken" | "endpointUrl">,
17
20
  options?: Parameters<Task[key]>[1]
18
21
  ) => ReturnType<Task[key]>;
19
22
  };
@@ -54,14 +57,12 @@ export class HfInferenceEndpoint {
54
57
  enumerable: false,
55
58
  value: (params: RequestArgs, options: Options) =>
56
59
  // eslint-disable-next-line @typescript-eslint/no-explicit-any
57
- fn({ ...params, accessToken, model: endpointUrl } as any, { ...defaultOptions, ...options }),
60
+ fn({ ...params, accessToken, endpointUrl } as any, { ...defaultOptions, ...options }),
58
61
  });
59
62
  }
60
63
  }
61
64
  }
62
65
 
63
- // eslint-disable-next-line @typescript-eslint/no-empty-interface
64
66
  export interface HfInference extends TaskWithNoAccessToken {}
65
67
 
66
- // eslint-disable-next-line @typescript-eslint/no-empty-interface
67
- export interface HfInferenceEndpoint extends TaskWithNoAccessTokenNoModel {}
68
+ export interface HfInferenceEndpoint extends TaskWithNoAccessTokenNoEndpointUrl {}
@@ -1,4 +1,5 @@
1
1
  import type { InferenceTask, Options, RequestArgs } from "../types";
2
+ import { omit } from "../utils/omit";
2
3
  import { HF_HUB_URL } from "./getDefaultTask";
3
4
  import { isUrl } from "./isUrl";
4
5
 
@@ -22,10 +23,10 @@ export async function makeRequestOptions(
22
23
  forceTask?: string | InferenceTask;
23
24
  /** To load default model if needed */
24
25
  taskHint?: InferenceTask;
26
+ chatCompletion?: boolean;
25
27
  }
26
28
  ): Promise<{ url: string; info: RequestInit }> {
27
- // eslint-disable-next-line @typescript-eslint/no-unused-vars
28
- const { accessToken, model: _model, ...otherArgs } = args;
29
+ const { accessToken, endpointUrl, ...otherArgs } = args;
29
30
  let { model } = args;
30
31
  const {
31
32
  forceTask: task,
@@ -34,7 +35,7 @@ export async function makeRequestOptions(
34
35
  wait_for_model,
35
36
  use_cache,
36
37
  dont_load_model,
37
- ...otherOptions
38
+ chatCompletion,
38
39
  } = options ?? {};
39
40
 
40
41
  const headers: Record<string, string> = {};
@@ -77,11 +78,17 @@ export async function makeRequestOptions(
77
78
  headers["X-Load-Model"] = "0";
78
79
  }
79
80
 
80
- const url = (() => {
81
+ let url = (() => {
82
+ if (endpointUrl && isUrl(model)) {
83
+ throw new TypeError("Both model and endpointUrl cannot be URLs");
84
+ }
81
85
  if (isUrl(model)) {
86
+ console.warn("Using a model URL is deprecated, please use the `endpointUrl` parameter instead");
82
87
  return model;
83
88
  }
84
-
89
+ if (endpointUrl) {
90
+ return endpointUrl;
91
+ }
85
92
  if (task) {
86
93
  return `${HF_INFERENCE_API_BASE_URL}/pipeline/${task}/${model}`;
87
94
  }
@@ -89,19 +96,18 @@ export async function makeRequestOptions(
89
96
  return `${HF_INFERENCE_API_BASE_URL}/models/${model}`;
90
97
  })();
91
98
 
92
- // Let users configure credentials, or disable them all together (or keep default behavior).
93
- // ---
94
- // This used to be an internal property only and never exposed to users. This means that most usages will never define this value
95
- // So in order to make this backwards compatible, if it's undefined we go to "same-origin" (default behaviour before).
96
- // If it's a boolean and set to true then set to "include". If false, don't define credentials at all (useful for edge runtimes)
97
- // Then finally, if it's a string, use it as-is.
99
+ if (chatCompletion && !url.endsWith("/chat/completions")) {
100
+ url += "/v1/chat/completions";
101
+ }
102
+
103
+ /**
104
+ * For edge runtimes, leave 'credentials' undefined, otherwise cloudflare workers will error
105
+ */
98
106
  let credentials: RequestCredentials | undefined;
99
107
  if (typeof includeCredentials === "string") {
100
108
  credentials = includeCredentials as RequestCredentials;
101
- } else if (typeof includeCredentials === "boolean") {
102
- credentials = includeCredentials ? "include" : undefined;
103
- } else if (includeCredentials === undefined) {
104
- credentials = "same-origin";
109
+ } else if (includeCredentials === true) {
110
+ credentials = "include";
105
111
  }
106
112
 
107
113
  const info: RequestInit = {
@@ -110,10 +116,9 @@ export async function makeRequestOptions(
110
116
  body: binary
111
117
  ? args.data
112
118
  : JSON.stringify({
113
- ...otherArgs,
114
- options: options && otherOptions,
119
+ ...(otherArgs.model && isUrl(otherArgs.model) ? omit(otherArgs, "model") : otherArgs),
115
120
  }),
116
- credentials,
121
+ ...(credentials && { credentials }),
117
122
  signal: options?.signal,
118
123
  };
119
124
 
@@ -11,6 +11,8 @@ export async function request<T>(
11
11
  task?: string | InferenceTask;
12
12
  /** To load default model if needed */
13
13
  taskHint?: InferenceTask;
14
+ /** Is chat completion compatible */
15
+ chatCompletion?: boolean;
14
16
  }
15
17
  ): Promise<T> {
16
18
  const { url, info } = await makeRequestOptions(args, options);
@@ -26,6 +28,9 @@ export async function request<T>(
26
28
  if (!response.ok) {
27
29
  if (response.headers.get("Content-Type")?.startsWith("application/json")) {
28
30
  const output = await response.json();
31
+ if ([400, 422, 404, 500].includes(response.status) && options?.chatCompletion) {
32
+ throw new Error(`Server ${args.model} does not seem to support chat completion. Error: ${output.error}`);
33
+ }
29
34
  if (output.error) {
30
35
  throw new Error(output.error);
31
36
  }
@@ -13,6 +13,8 @@ export async function* streamingRequest<T>(
13
13
  task?: string | InferenceTask;
14
14
  /** To load default model if needed */
15
15
  taskHint?: InferenceTask;
16
+ /** Is chat completion compatible */
17
+ chatCompletion?: boolean;
16
18
  }
17
19
  ): AsyncGenerator<T> {
18
20
  const { url, info } = await makeRequestOptions({ ...args, stream: true }, options);
@@ -27,6 +29,9 @@ export async function* streamingRequest<T>(
27
29
  if (!response.ok) {
28
30
  if (response.headers.get("Content-Type")?.startsWith("application/json")) {
29
31
  const output = await response.json();
32
+ if ([400, 422, 404, 500].includes(response.status) && options?.chatCompletion) {
33
+ throw new Error(`Server ${args.model} does not seem to support chat completion. Error: ${output.error}`);
34
+ }
30
35
  if (output.error) {
31
36
  throw new Error(output.error);
32
37
  }
@@ -67,6 +72,9 @@ export async function* streamingRequest<T>(
67
72
  onChunk(value);
68
73
  for (const event of events) {
69
74
  if (event.data.length > 0) {
75
+ if (event.data === "[DONE]") {
76
+ return;
77
+ }
70
78
  const data = JSON.parse(event.data);
71
79
  if (typeof data === "object" && data !== null && "error" in data) {
72
80
  throw new Error(data.error);
@@ -1,7 +1,7 @@
1
1
  import { InferenceOutputError } from "../../lib/InferenceOutputError";
2
2
  import type { BaseArgs, Options, RequestArgs } from "../../types";
3
+ import { base64FromBytes } from "../../utils/base64FromBytes";
3
4
  import { request } from "../custom/request";
4
- import { base64FromBytes } from "../../../../shared";
5
5
 
6
6
  export type ImageToImageArgs = BaseArgs & {
7
7
  /**
@@ -2,7 +2,7 @@ import { InferenceOutputError } from "../../lib/InferenceOutputError";
2
2
  import type { BaseArgs, Options } from "../../types";
3
3
  import { request } from "../custom/request";
4
4
  import type { RequestArgs } from "../../types";
5
- import { base64FromBytes } from "../../../../shared";
5
+ import { base64FromBytes } from "../../utils/base64FromBytes";
6
6
 
7
7
  export type ZeroShotImageClassificationArgs = BaseArgs & {
8
8
  inputs: {
@@ -30,6 +30,8 @@ export * from "./nlp/textGenerationStream";
30
30
  export * from "./nlp/tokenClassification";
31
31
  export * from "./nlp/translation";
32
32
  export * from "./nlp/zeroShotClassification";
33
+ export * from "./nlp/chatCompletion";
34
+ export * from "./nlp/chatCompletionStream";
33
35
 
34
36
  // Multimodal tasks
35
37
  export * from "./multimodal/documentQuestionAnswering";
@@ -2,8 +2,8 @@ import { InferenceOutputError } from "../../lib/InferenceOutputError";
2
2
  import type { BaseArgs, Options } from "../../types";
3
3
  import { request } from "../custom/request";
4
4
  import type { RequestArgs } from "../../types";
5
- import { base64FromBytes } from "../../../../shared";
6
5
  import { toArray } from "../../utils/toArray";
6
+ import { base64FromBytes } from "../../utils/base64FromBytes";
7
7
 
8
8
  export type DocumentQuestionAnsweringArgs = BaseArgs & {
9
9
  inputs: {
@@ -1,7 +1,7 @@
1
1
  import { InferenceOutputError } from "../../lib/InferenceOutputError";
2
2
  import type { BaseArgs, Options, RequestArgs } from "../../types";
3
+ import { base64FromBytes } from "../../utils/base64FromBytes";
3
4
  import { request } from "../custom/request";
4
- import { base64FromBytes } from "../../../../shared";
5
5
 
6
6
  export type VisualQuestionAnsweringArgs = BaseArgs & {
7
7
  inputs: {
@@ -0,0 +1,32 @@
1
+ import { InferenceOutputError } from "../../lib/InferenceOutputError";
2
+ import type { BaseArgs, Options } from "../../types";
3
+ import { request } from "../custom/request";
4
+ import type { ChatCompletionInput, ChatCompletionOutput } from "@huggingface/tasks";
5
+
6
+ /**
7
+ * Use the chat completion endpoint to generate a response to a prompt, using OpenAI message completion API no stream
8
+ */
9
+
10
+ export async function chatCompletion(
11
+ args: BaseArgs & ChatCompletionInput,
12
+ options?: Options
13
+ ): Promise<ChatCompletionOutput> {
14
+ const res = await request<ChatCompletionOutput>(args, {
15
+ ...options,
16
+ taskHint: "text-generation",
17
+ chatCompletion: true,
18
+ });
19
+ const isValidOutput =
20
+ typeof res === "object" &&
21
+ Array.isArray(res?.choices) &&
22
+ typeof res?.created === "number" &&
23
+ typeof res?.id === "string" &&
24
+ typeof res?.model === "string" &&
25
+ typeof res?.system_fingerprint === "string" &&
26
+ typeof res?.usage === "object";
27
+
28
+ if (!isValidOutput) {
29
+ throw new InferenceOutputError("Expected ChatCompletionOutput");
30
+ }
31
+ return res;
32
+ }
@@ -0,0 +1,17 @@
1
+ import type { BaseArgs, Options } from "../../types";
2
+ import { streamingRequest } from "../custom/streamingRequest";
3
+ import type { ChatCompletionInput, ChatCompletionStreamOutput } from "@huggingface/tasks";
4
+
5
+ /**
6
+ * Use to continue text from a prompt. Same as `textGeneration` but returns generator that can be read one token at a time
7
+ */
8
+ export async function* chatCompletionStream(
9
+ args: BaseArgs & ChatCompletionInput,
10
+ options?: Options
11
+ ): AsyncGenerator<ChatCompletionStreamOutput> {
12
+ yield* streamingRequest<ChatCompletionStreamOutput>(args, {
13
+ ...options,
14
+ taskHint: "text-generation",
15
+ chatCompletion: true,
16
+ });
17
+ }
@@ -1,8 +1,10 @@
1
- import type { TextGenerationInput, TextGenerationOutput } from "@huggingface/tasks/src/tasks/text-generation/inference";
1
+ import type { TextGenerationInput, TextGenerationOutput } from "@huggingface/tasks";
2
2
  import { InferenceOutputError } from "../../lib/InferenceOutputError";
3
3
  import type { BaseArgs, Options } from "../../types";
4
4
  import { request } from "../custom/request";
5
5
 
6
+ export type { TextGenerationInput, TextGenerationOutput };
7
+
6
8
  /**
7
9
  * Use to continue text from a prompt. This is a very generic task. Recommended model: gpt2 (it’s a simple model, but fun to play with).
8
10
  */
@@ -1,8 +1,7 @@
1
+ import type { TextGenerationInput } from "@huggingface/tasks";
1
2
  import type { BaseArgs, Options } from "../../types";
2
3
  import { streamingRequest } from "../custom/streamingRequest";
3
4
 
4
- import type { TextGenerationInput } from "@huggingface/tasks/src/tasks/text-generation/inference";
5
-
6
5
  export interface TextGenerationStreamToken {
7
6
  /** Token ID from the model tokenizer */
8
7
  id: number;
@@ -68,6 +67,7 @@ export interface TextGenerationStreamDetails {
68
67
  }
69
68
 
70
69
  export interface TextGenerationStreamOutput {
70
+ index?: number;
71
71
  /** Generated token, one at a time */
72
72
  token: TextGenerationStreamToken;
73
73
  /**
package/src/types.ts CHANGED
@@ -1,4 +1,5 @@
1
1
  import type { PipelineType } from "@huggingface/tasks";
2
+ import type { ChatCompletionInput } from "@huggingface/tasks";
2
3
 
3
4
  export interface Options {
4
5
  /**
@@ -47,15 +48,25 @@ export interface BaseArgs {
47
48
  */
48
49
  accessToken?: string;
49
50
  /**
50
- * The model to use. Can be a full URL for a dedicated inference endpoint.
51
+ * The model to use.
51
52
  *
52
53
  * If not specified, will call huggingface.co/api/tasks to get the default model for the task.
54
+ *
55
+ * /!\ Legacy behavior allows this to be an URL, but this is deprecated and will be removed in the future.
56
+ * Use the `endpointUrl` parameter instead.
53
57
  */
54
58
  model?: string;
59
+
60
+ /**
61
+ * The URL of the endpoint to use. If not specified, will call huggingface.co/api/tasks to get the default endpoint for the task.
62
+ *
63
+ * If specified, will use this URL instead of the default one.
64
+ */
65
+ endpointUrl?: string;
55
66
  }
56
67
 
57
68
  export type RequestArgs = BaseArgs &
58
- ({ data: Blob | ArrayBuffer } | { inputs: unknown }) & {
69
+ ({ data: Blob | ArrayBuffer } | { inputs: unknown } | ChatCompletionInput) & {
59
70
  parameters?: Record<string, unknown>;
60
71
  accessToken?: string;
61
72
  };
@@ -0,0 +1,11 @@
1
+ export function base64FromBytes(arr: Uint8Array): string {
2
+ if (globalThis.Buffer) {
3
+ return globalThis.Buffer.from(arr).toString("base64");
4
+ } else {
5
+ const bin: string[] = [];
6
+ arr.forEach((byte) => {
7
+ bin.push(String.fromCharCode(byte));
8
+ });
9
+ return globalThis.btoa(bin.join(""));
10
+ }
11
+ }
@@ -4,8 +4,6 @@
4
4
  * This allows omitting keys from objects inside unions, without merging the individual components of the union.
5
5
  */
6
6
 
7
- type Keys<T> = keyof T;
8
- type DistributiveKeys<T> = T extends unknown ? Keys<T> : never;
9
7
  type Omit_<T, K> = Omit<T, Extract<keyof T, K>>;
10
8
 
11
9
  export type DistributiveOmit<T, K> = T extends unknown
@@ -0,0 +1,6 @@
1
+ const isBrowser = typeof window !== "undefined" && typeof window.document !== "undefined";
2
+
3
+ const isWebWorker =
4
+ typeof self === "object" && self.constructor && self.constructor.name === "DedicatedWorkerGlobalScope";
5
+
6
+ export const isBackend = !isBrowser && !isWebWorker;
@@ -0,0 +1,3 @@
1
+ import { isBackend } from "./isBackend";
2
+
3
+ export const isFrontend = !isBackend;