npm - @huggingface/inference - Versions diffs - 3.5.2 → 3.6.0 - Mend

@huggingface/inference 3.5.2 → 3.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (82) hide show

package/src/snippets/getInferenceSnippets.ts ADDED Viewed

@@ -0,0 +1,398 @@
+import type { PipelineType, WidgetType } from "@huggingface/tasks/src/pipelines.js";
+import type { ChatCompletionInputMessage, GenerationParameters } from "@huggingface/tasks/src/tasks/index.js";
+import {
+	type InferenceSnippet,
+	type InferenceSnippetLanguage,
+	type ModelDataMinimal,
+	inferenceSnippetLanguages,
+	getModelInputSnippet,
+} from "@huggingface/tasks";
+import type { InferenceProvider, InferenceTask, RequestArgs } from "../types";
+import { Template } from "@huggingface/jinja";
+import { makeRequestOptionsFromResolvedModel } from "../lib/makeRequestOptions";
+import fs from "fs";
+import path from "path";
+import { existsSync as pathExists } from "node:fs";
+// Client names for which snippets can be generated, grouped by snippet language.
+const PYTHON_CLIENTS = ["huggingface_hub", "fal_client", "requests", "openai"] as const;
+const JS_CLIENTS = ["fetch", "huggingface.js", "openai"] as const;
+const SH_CLIENTS = ["curl"] as const;
+// Union of every client name declared in the three lists above.
+type Client = (typeof SH_CLIENTS)[number] | (typeof PYTHON_CLIENTS)[number] | (typeof JS_CLIENTS)[number];
+// Clients tried for each snippet language; snippets are generated in this array order.
+const CLIENTS: Record<InferenceSnippetLanguage, Client[]> = {
+	js: [...JS_CLIENTS],
+	python: [...PYTHON_CLIENTS],
+	sh: [...SH_CLIENTS],
+};
+// Turns a model (plus the caller's optional `opts`) into the inputs object used for the request and the templates.
+type InputPreparationFn = (model: ModelDataMinimal, opts?: Record<string, unknown>) => object;
+// Values handed to a template when it is rendered; every field is optional.
+interface TemplateParams {
+	accessToken?: string;
+	authorizationHeader?: string;
+	baseUrl?: string;
+	fullUrl?: string;
+	inputs?: object;
+	providerInputs?: object;
+	model?: ModelDataMinimal;
+	provider?: InferenceProvider;
+	providerModelId?: string;
+	methodName?: string; // specific to snippetBasic
+	importBase64?: boolean; // specific to snippetImportRequests
+	importJson?: boolean; // specific to snippetImportRequests
+}
+// Helpers to find + load templates
+/**
+ * Walks up from this module's location and returns the first ancestor directory
+ * that contains a `package.json`. Returns "/" when no ancestor has one.
+ *
+ * The walk also stops when `path.dirname` returns its own argument, which is how the
+ * filesystem root shows up on every platform. Comparing against "/" alone never
+ * terminates for roots such as `C:\` or `\`.
+ *
+ * NOTE(review): the ESM branch derives a path from `URL.pathname`; `fileURLToPath`
+ * from `node:url` looks like the safer conversion, but it is not imported here — confirm.
+ */
+const rootDirFinder = (): string => {
+	let currentPath =
+		typeof import.meta !== "undefined" && import.meta.url
+			? path.normalize(new URL(import.meta.url).pathname) /// for ESM
+			: __dirname; /// for CJS
+	while (currentPath !== "/") {
+		if (pathExists(path.join(currentPath, "package.json"))) {
+			return currentPath;
+		}
+		const parentPath = path.dirname(currentPath);
+		if (parentPath === currentPath) {
+			/// Reached a root that is not spelled "/": stop instead of looping forever.
+			break;
+		}
+		currentPath = parentPath;
+	}
+	return "/";
+};
+/** Path of the `.jinja` template for a language / client / template name, under `src/snippets/templates` of the directory returned by `rootDirFinder`. */
+const templatePath = (language: InferenceSnippetLanguage, client: Client, templateName: string): string => {
+	const segments = ["src", "snippets", "templates", language, client, `${templateName}.jinja`];
+	return path.join(rootDirFinder(), ...segments);
+};
+/** Tells whether a template file exists on disk for the given language, client and template name. */
+const hasTemplate = (language: InferenceSnippetLanguage, client: Client, templateName: string): boolean => {
+	const candidate = templatePath(language, client, templateName);
+	return pathExists(candidate);
+};
+/**
+ * Synchronously reads a template file and returns a function that renders it.
+ * The file is read once, when this function is called; a fresh `Template` is
+ * built from that source on every render.
+ */
+const loadTemplate = (
+	language: InferenceSnippetLanguage,
+	client: Client,
+	templateName: string
+): ((data: TemplateParams) => string) => {
+	const source = fs.readFileSync(templatePath(language, client, templateName), "utf8");
+	const render = (data: TemplateParams): string => {
+		const compiled = new Template(source);
+		return compiled.render({ ...data });
+	};
+	return render;
+};
+// Renderers for the Python import sections; both template files are read when this module is loaded.
+const snippetImportPythonInferenceClient = loadTemplate("python", "huggingface_hub", "importInferenceClient");
+const snippetImportRequests = loadTemplate("python", "requests", "importRequests");
+// Needed for huggingface_hub basic snippets:
+// maps a pipeline tag to the value injected as `methodName` into the "basic*" templates.
+// A pipeline tag missing from this map gets no huggingface_hub "basic*" snippet.
+const HF_PYTHON_METHODS: Partial<Record<WidgetType, string>> = {
+	"audio-classification": "audio_classification",
+	"audio-to-audio": "audio_to_audio",
+	"automatic-speech-recognition": "automatic_speech_recognition",
+	"document-question-answering": "document_question_answering",
+	"feature-extraction": "feature_extraction",
+	"fill-mask": "fill_mask",
+	"image-classification": "image_classification",
+	"image-segmentation": "image_segmentation",
+	"image-to-image": "image_to_image",
+	"image-to-text": "image_to_text",
+	"object-detection": "object_detection",
+	"question-answering": "question_answering",
+	"sentence-similarity": "sentence_similarity",
+	summarization: "summarization",
+	"table-question-answering": "table_question_answering",
+	"tabular-classification": "tabular_classification",
+	"tabular-regression": "tabular_regression",
+	"text-classification": "text_classification",
+	"text-generation": "text_generation",
+	"text-to-image": "text_to_image",
+	"text-to-speech": "text_to_speech",
+	"text-to-video": "text_to_video",
+	"token-classification": "token_classification",
+	translation: "translation",
+	"visual-question-answering": "visual_question_answering",
+	"zero-shot-classification": "zero_shot_classification",
+	"zero-shot-image-classification": "zero_shot_image_classification",
+};
+// Needed for huggingface.js basic snippets:
+// maps a pipeline tag to the value injected as `methodName` into the "basic*" templates.
+// A pipeline tag missing from this map gets no huggingface.js "basic*" snippet.
+const HF_JS_METHODS: Partial<Record<WidgetType, string>> = {
+	"automatic-speech-recognition": "automaticSpeechRecognition",
+	"feature-extraction": "featureExtraction",
+	"fill-mask": "fillMask",
+	"image-classification": "imageClassification",
+	"question-answering": "questionAnswering",
+	"sentence-similarity": "sentenceSimilarity",
+	summarization: "summarization",
+	"table-question-answering": "tableQuestionAnswering",
+	"text-classification": "textClassification",
+	"text-generation": "textGeneration",
+	"text2text-generation": "textGeneration",
+	"token-classification": "tokenClassification",
+	translation: "translation",
+};
+// Snippet generators
+/**
+ * Builds the snippet function for one template name.
+ *
+ * The returned function prepares the model inputs, builds the provider request with
+ * `makeRequestOptionsFromResolvedModel`, then renders one snippet for every
+ * (language, client) pair that has a template file with the resolved name.
+ *
+ * @param templateName Template to render when the model is not conversational.
+ * @param inputPreparationFn Optional input builder; when omitted, inputs are
+ *   `{ inputs: getModelInputSnippet(model) }`.
+ * @returns A function producing the snippets for a model, token, provider and options.
+ */
+const snippetGenerator = (templateName: string, inputPreparationFn?: InputPreparationFn) => {
+	return (
+		model: ModelDataMinimal,
+		accessToken: string,
+		provider: InferenceProvider,
+		providerModelId?: string,
+		opts?: Record<string, unknown>
+	): InferenceSnippet[] => {
+		/// Resolve template + input preparation per call, in locals. The returned function is
+		/// created once and reused for every model, so reassigning the outer parameters would
+		/// make a single conversational model switch all later calls to the conversational template.
+		let resolvedTemplateName = templateName;
+		let resolvedInputPreparationFn = inputPreparationFn;
+		/// Hacky: hard-code conversational templates here
+		if (
+			model.pipeline_tag &&
+			["text-generation", "image-text-to-text"].includes(model.pipeline_tag) &&
+			model.tags.includes("conversational")
+		) {
+			resolvedTemplateName = opts?.streaming ? "conversationalStream" : "conversational";
+			resolvedInputPreparationFn = prepareConversationalInput;
+		}
+		/// Prepare inputs + make request
+		const inputs = resolvedInputPreparationFn
+			? resolvedInputPreparationFn(model, opts)
+			: { inputs: getModelInputSnippet(model) };
+		const request = makeRequestOptionsFromResolvedModel(
+			providerModelId ?? model.id,
+			{ accessToken: accessToken, provider: provider, ...inputs } as RequestArgs,
+			{ chatCompletion: resolvedTemplateName.includes("conversational"), task: model.pipeline_tag as InferenceTask }
+		);
+		/// Parse request.info.body if not a binary.
+		/// This is the body sent to the provider. Important for snippets with raw payload (e.g curl, requests, etc.)
+		let providerInputs = inputs;
+		const bodyAsObj = request.info.body;
+		if (typeof bodyAsObj === "string") {
+			try {
+				providerInputs = JSON.parse(bodyAsObj);
+			} catch (e) {
+				/// Best effort: keep the unparsed inputs when the body is not valid JSON.
+				console.error("Failed to parse body as JSON", e);
+			}
+		}
+		/// Prepare template injection data
+		const params: TemplateParams = {
+			accessToken,
+			authorizationHeader: (request.info.headers as Record<string, string>)?.Authorization,
+			baseUrl: removeSuffix(request.url, "/chat/completions"),
+			fullUrl: request.url,
+			inputs: {
+				asObj: inputs,
+				asCurlString: formatBody(inputs, "curl"),
+				asJsonString: formatBody(inputs, "json"),
+				asPythonString: formatBody(inputs, "python"),
+				asTsString: formatBody(inputs, "ts"),
+			},
+			providerInputs: {
+				asObj: providerInputs,
+				asCurlString: formatBody(providerInputs, "curl"),
+				asJsonString: formatBody(providerInputs, "json"),
+				asPythonString: formatBody(providerInputs, "python"),
+				asTsString: formatBody(providerInputs, "ts"),
+			},
+			model,
+			provider,
+			providerModelId: providerModelId ?? model.id,
+		};
+		/// Iterate over clients => check if a snippet exists => generate
+		return inferenceSnippetLanguages
+			.map((language) => {
+				return CLIENTS[language]
+					.map((client) => {
+						if (!hasTemplate(language, client, resolvedTemplateName)) {
+							return;
+						}
+						const template = loadTemplate(language, client, resolvedTemplateName);
+						if (client === "huggingface_hub" && resolvedTemplateName.includes("basic")) {
+							if (!(model.pipeline_tag && model.pipeline_tag in HF_PYTHON_METHODS)) {
+								return;
+							}
+							params["methodName"] = HF_PYTHON_METHODS[model.pipeline_tag];
+						}
+						if (client === "huggingface.js" && resolvedTemplateName.includes("basic")) {
+							if (!(model.pipeline_tag && model.pipeline_tag in HF_JS_METHODS)) {
+								return;
+							}
+							params["methodName"] = HF_JS_METHODS[model.pipeline_tag];
+						}
+						/// Generate snippet
+						let snippet = template(params).trim();
+						if (!snippet) {
+							return;
+						}
+						/// Add import section separately
+						if (client === "huggingface_hub") {
+							const importSection = snippetImportPythonInferenceClient({ ...params });
+							snippet = `${importSection}\n\n${snippet}`;
+						} else if (client === "requests") {
+							const importSection = snippetImportRequests({
+								...params,
+								importBase64: snippet.includes("base64"),
+								importJson: snippet.includes("json."),
+							});
+							snippet = `${importSection}\n\n${snippet}`;
+						}
+						/// Snippet is ready!
+						return { language, client: client as string, content: snippet };
+					})
+					.filter((snippet): snippet is InferenceSnippet => snippet !== undefined);
+			})
+			.flat();
+	};
+};
+/** Uses the model's default input snippet, parsed as JSON, as the request inputs. */
+const prepareDocumentQuestionAnsweringInput = (model: ModelDataMinimal): object => {
+	const rawSnippet = getModelInputSnippet(model) as string;
+	return JSON.parse(rawSnippet);
+};
+/** Parses the model's default input snippet as JSON and maps its `image` to `inputs` and its `prompt` to `parameters.prompt`. */
+const prepareImageToImageInput = (model: ModelDataMinimal): object => {
+	const { image, prompt } = JSON.parse(getModelInputSnippet(model) as string);
+	return { inputs: image, parameters: { prompt } };
+};
+/**
+ * Builds the chat-completion inputs for conversational snippets.
+ *
+ * `messages` falls back to the model's default input snippet and `max_tokens` to 500.
+ * `temperature` and `top_p` are included whenever the caller provided a value,
+ * including an explicit 0, which a truthiness check would silently drop.
+ * Key order (messages, temperature, max_tokens, top_p) is kept because the
+ * formatted snippets list the keys in insertion order.
+ */
+const prepareConversationalInput = (
+	model: ModelDataMinimal,
+	opts?: {
+		streaming?: boolean;
+		messages?: ChatCompletionInputMessage[];
+		temperature?: GenerationParameters["temperature"];
+		max_tokens?: GenerationParameters["max_new_tokens"];
+		top_p?: GenerationParameters["top_p"];
+	}
+): object => {
+	const temperature = opts?.temperature;
+	const topP = opts?.top_p;
+	return {
+		messages: opts?.messages ?? getModelInputSnippet(model),
+		...(temperature !== undefined && temperature !== null ? { temperature } : undefined),
+		max_tokens: opts?.max_tokens ?? 500,
+		...(topP !== undefined && topP !== null ? { top_p: topP } : undefined),
+	};
+};
+// Snippet function for each supported pipeline tag; each entry is created by snippetGenerator when this module loads.
+// Pipeline tags absent from this table yield an empty snippet list in getInferenceSnippets.
+const snippets: Partial<
+	Record<
+		PipelineType,
+		(
+			model: ModelDataMinimal,
+			accessToken: string,
+			provider: InferenceProvider,
+			providerModelId?: string,
+			opts?: Record<string, unknown>
+		) => InferenceSnippet[]
+	>
+> = {
+	"audio-classification": snippetGenerator("basicAudio"),
+	"audio-to-audio": snippetGenerator("basicAudio"),
+	"automatic-speech-recognition": snippetGenerator("basicAudio"),
+	"document-question-answering": snippetGenerator("documentQuestionAnswering", prepareDocumentQuestionAnsweringInput),
+	"feature-extraction": snippetGenerator("basic"),
+	"fill-mask": snippetGenerator("basic"),
+	"image-classification": snippetGenerator("basicImage"),
+	"image-segmentation": snippetGenerator("basicImage"),
+	"image-text-to-text": snippetGenerator("conversational"),
+	"image-to-image": snippetGenerator("imageToImage", prepareImageToImageInput),
+	"image-to-text": snippetGenerator("basicImage"),
+	"object-detection": snippetGenerator("basicImage"),
+	"question-answering": snippetGenerator("basic"),
+	"sentence-similarity": snippetGenerator("basic"),
+	summarization: snippetGenerator("basic"),
+	"tabular-classification": snippetGenerator("tabular"),
+	"tabular-regression": snippetGenerator("tabular"),
+	"table-question-answering": snippetGenerator("basic"),
+	"text-classification": snippetGenerator("basic"),
+	"text-generation": snippetGenerator("basic"),
+	"text-to-audio": snippetGenerator("textToAudio"),
+	"text-to-image": snippetGenerator("textToImage"),
+	"text-to-speech": snippetGenerator("textToAudio"),
+	"text-to-video": snippetGenerator("textToVideo"),
+	"text2text-generation": snippetGenerator("basic"),
+	"token-classification": snippetGenerator("basic"),
+	translation: snippetGenerator("basic"),
+	"zero-shot-classification": snippetGenerator("zeroShotClassification"),
+	"zero-shot-image-classification": snippetGenerator("zeroShotImageClassification"),
+};
+/**
+ * Returns the inference snippets for a model, or an empty array when the model
+ * has no pipeline tag or its pipeline tag has no entry in `snippets`.
+ *
+ * @param model Model to generate snippets for.
+ * @param accessToken Token injected into the snippets.
+ * @param provider Inference provider the snippets target.
+ * @param providerModelId Provider-side model id; the generator falls back to `model.id`.
+ * @param opts Extra options forwarded unchanged to the generator.
+ */
+export function getInferenceSnippets(
+	model: ModelDataMinimal,
+	accessToken: string,
+	provider: InferenceProvider,
+	providerModelId?: string,
+	opts?: Record<string, unknown>
+): InferenceSnippet[] {
+	const pipelineTag = model.pipeline_tag;
+	if (!pipelineTag || !(pipelineTag in snippets)) {
+		return [];
+	}
+	const generate = snippets[pipelineTag];
+	return generate?.(model, accessToken, provider, providerModelId, opts) ?? [];
+}
+// String manipulation helpers
+/**
+ * Serializes a request body for injection into a template.
+ *
+ * - "json": pretty-printed JSON (4 spaces) without the outer braces.
+ * - "curl": the "json" output indented by 4 more spaces.
+ * - "python": one `key=value,` line per top-level entry, indented by 4 spaces.
+ * - "ts": `formatTsObject` output without the outer braces.
+ *
+ * @throws Error when `format` is not one of the four supported values.
+ */
+function formatBody(obj: object, format: "curl" | "json" | "python" | "ts"): string {
+	switch (format) {
+		case "curl":
+			return indentString(formatBody(obj, "json"));
+		case "json":
+			/// Hacky: remove outer brackets to make it extendable in templates
+			return JSON.stringify(obj, null, 4).split("\n").slice(1, -1).join("\n");
+		case "python":
+			/// NOTE(review): values are serialized with JSON.stringify, so booleans and null come out
+			/// as true/false/null rather than Python literals — confirm no caller passes such values.
+			return indentString(
+				Object.entries(obj)
+					.map(([key, value]) => `${key}=${JSON.stringify(value, null, 4)},`)
+					.join("\n")
+			);
+		case "ts":
+			/// Hacky: remove outer brackets to make it extendable in templates
+			return formatTsObject(obj).split("\n").slice(1, -1).join("\n");
+		default:
+			throw new Error(`Unsupported format: ${format}`);
+	}
+}
+/**
+ * Formats a value as a TypeScript-style literal with 4-space indentation.
+ * Primitives and null go through JSON.stringify; arrays and objects get one item
+ * per line with a trailing comma; keys are quoted unless they match the identifier pattern below.
+ *
+ * @param depth Current nesting level (defaults to 0); controls the indentation.
+ */
+function formatTsObject(obj: unknown, depth?: number): string {
+	const level = depth ?? 0;
+	/// Primitives (and null) have no nested structure to indent.
+	if (typeof obj !== "object" || obj === null) {
+		return JSON.stringify(obj);
+	}
+	const innerPad = " ".repeat(4 * (level + 1));
+	const closingPad = " ".repeat(4 * level);
+	/// Arrays
+	if (Array.isArray(obj)) {
+		const renderedItems = obj.map((item) => `${innerPad}${formatTsObject(item, level + 1)},`);
+		return `[\n${renderedItems.join("\n")}\n${closingPad}]`;
+	}
+	/// Plain mappings
+	const renderedEntries = Object.entries(obj).map(([key, value]) => {
+		const rendered = formatTsObject(value, level + 1);
+		const keyStr = /^[a-zA-Z_$][a-zA-Z0-9_$]*$/.test(key) ? key : `"${key}"`;
+		return `${innerPad}${keyStr}: ${rendered},`;
+	});
+	return `{\n${renderedEntries.join("\n")}\n${closingPad}}`;
+}
+/** Prefixes every line of `str` (split on "\n") with four spaces. */
+function indentString(str: string): string {
+	const pad = " ".repeat(4);
+	const indented: string[] = [];
+	for (const line of str.split("\n")) {
+		indented.push(pad + line);
+	}
+	return indented.join("\n");
+}
+/**
+ * Returns `str` without a trailing `suffix`, or `str` unchanged when it does not end with it.
+ * An empty suffix leaves `str` untouched: `slice(0, -0)` is `slice(0, 0)` and would return "".
+ */
+function removeSuffix(str: string, suffix: string) {
+	if (suffix.length === 0 || !str.endsWith(suffix)) {
+		return str;
+	}
+	return str.slice(0, str.length - suffix.length);
+}

package/src/snippets/index.ts CHANGED Viewed

@@ -1,5 +1 @@
-import * as curl from "./curl.js";
-import * as python from "./python.js";
-import * as js from "./js.js";
-export { curl, python, js };
+export { getInferenceSnippets } from "./getInferenceSnippets.js";

package/src/snippets/templates/js/fetch/basic.jinja ADDED Viewed

@@ -0,0 +1,19 @@
+async function query(data) {
+	const response = await fetch(
+		"{{ fullUrl }}",
+		{
+			headers: {
+				Authorization: "{{ authorizationHeader }}",
+				"Content-Type": "application/json",
+			},
+			method: "POST",
+			body: JSON.stringify(data),
+		}
+	);
+	const result = await response.json();
+	return result;
+}
+query({ inputs: {{ providerInputs.asObj.inputs }} }).then((response) => {
+    console.log(JSON.stringify(response));
+});

package/src/snippets/templates/js/fetch/basicAudio.jinja ADDED Viewed

@@ -0,0 +1,19 @@
+async function query(data) {
+	const response = await fetch(
+		"{{ fullUrl }}",
+		{
+			headers: {
+				Authorization: "{{ authorizationHeader }}",
+				"Content-Type": "audio/flac"
+			},
+			method: "POST",
+			body: JSON.stringify(data),
+		}
+	);
+	const result = await response.json();
+	return result;
+}
+query({ inputs: {{ providerInputs.asObj.inputs }} }).then((response) => {
+    console.log(JSON.stringify(response));
+});

package/src/snippets/templates/js/fetch/basicImage.jinja ADDED Viewed

@@ -0,0 +1,19 @@
+async function query(data) {
+	const response = await fetch(
+		"{{ fullUrl }}",
+		{
+			headers: {
+				Authorization: "{{ authorizationHeader }}",
+				"Content-Type": "image/jpeg"
+			},
+			method: "POST",
+			body: JSON.stringify(data),
+		}
+	);
+	const result = await response.json();
+	return result;
+}
+query({ inputs: {{ providerInputs.asObj.inputs }} }).then((response) => {
+    console.log(JSON.stringify(response));
+});

package/src/snippets/templates/js/fetch/textToAudio.jinja ADDED Viewed

@@ -0,0 +1,41 @@
+{% if model.library_name == "transformers" %}
+async function query(data) {
+	const response = await fetch(
+		"{{ fullUrl }}",
+		{
+			headers: {
+				Authorization: "{{ authorizationHeader }}",
+				"Content-Type": "application/json",
+			},
+			method: "POST",
+			body: JSON.stringify(data),
+		}
+	);
+	const result = await response.blob();
+    return result;
+}
+query({ inputs: {{ providerInputs.asObj.inputs }} }).then((response) => {
+    // Returns a byte object of the Audio wavform. Use it directly!
+});
+{% else %}
+async function query(data) {
+	const response = await fetch(
+		"{{ fullUrl }}",
+		{
+			headers: {
+				Authorization: "{{ authorizationHeader }}",
+				"Content-Type": "application/json",
+			},
+			method: "POST",
+			body: JSON.stringify(data),
+		}
+	);
+    const result = await response.json();
+    return result;
+}
+query({ inputs: {{ providerInputs.asObj.inputs }} }).then((response) => {
+    console.log(JSON.stringify(response));
+});
+{% endif %}

package/src/snippets/templates/js/fetch/textToImage.jinja ADDED Viewed

@@ -0,0 +1,19 @@
+async function query(data) {
+	const response = await fetch(
+		"{{ fullUrl }}",
+		{
+			headers: {
+				Authorization: "{{ authorizationHeader }}",
+				"Content-Type": "application/json",
+			},
+			method: "POST",
+			body: JSON.stringify(data),
+		}
+	);
+	const result = await response.blob();
+	return result;
+}
+query({ inputs: {{ providerInputs.asObj.inputs }} }).then((response) => {
+    // Use image
+});

package/src/snippets/templates/js/fetch/zeroShotClassification.jinja ADDED Viewed

@@ -0,0 +1,22 @@
+async function query(data) {
+    const response = await fetch(
+		"{{ fullUrl }}",
+        {
+            headers: {
+				Authorization: "{{ authorizationHeader }}",
+                "Content-Type": "application/json",
+            },
+            method: "POST",
+            body: JSON.stringify(data),
+        }
+    );
+    const result = await response.json();
+    return result;
+}
+query({
+    inputs: {{ providerInputs.asObj.inputs }},
+    parameters: { candidate_labels: ["refund", "legal", "faq"] }
+}).then((response) => {
+    console.log(JSON.stringify(response));
+});

package/src/snippets/templates/js/huggingface.js/basic.jinja ADDED Viewed

@@ -0,0 +1,11 @@
+import { InferenceClient } from "@huggingface/inference";
+const client = new InferenceClient("{{ accessToken }}");
+const output = await client.{{ methodName }}({
+	model: "{{ model.id }}",
+	inputs: {{ inputs.asObj.inputs }},
+	provider: "{{ provider }}",
+});
+console.log(output);

package/src/snippets/templates/js/huggingface.js/basicAudio.jinja ADDED Viewed

@@ -0,0 +1,13 @@
+import { InferenceClient } from "@huggingface/inference";
+const client = new InferenceClient("{{ accessToken }}");
+const data = fs.readFileSync({{inputs.asObj.inputs}});
+const output = await client.{{ methodName }}({
+	data,
+	model: "{{ model.id }}",
+	provider: "{{ provider }}",
+});
+console.log(output);

package/src/snippets/templates/js/huggingface.js/basicImage.jinja ADDED Viewed

@@ -0,0 +1,13 @@
+import { InferenceClient } from "@huggingface/inference";
+const client = new InferenceClient("{{ accessToken }}");
+const data = fs.readFileSync({{inputs.asObj.inputs}});
+const output = await client.{{ methodName }}({
+	data,
+	model: "{{ model.id }}",
+	provider: "{{ provider }}",
+});
+console.log(output);

package/src/snippets/templates/js/huggingface.js/conversational.jinja ADDED Viewed

@@ -0,0 +1,11 @@
+import { InferenceClient } from "@huggingface/inference";
+const client = new InferenceClient("{{ accessToken }}");
+const chatCompletion = await client.chatCompletion({
+    provider: "{{ provider }}",
+    model: "{{ model.id }}",
+{{ inputs.asTsString }}
+});
+console.log(chatCompletion.choices[0].message);

package/src/snippets/templates/js/huggingface.js/conversationalStream.jinja ADDED Viewed

@@ -0,0 +1,19 @@
+import { InferenceClient } from "@huggingface/inference";
+const client = new InferenceClient("{{ accessToken }}");
+let out = "";
+const stream = await client.chatCompletionStream({
+    provider: "{{ provider }}",
+    model: "{{ model.id }}",
+{{ inputs.asTsString }}
+});
+for await (const chunk of stream) {
+	if (chunk.choices && chunk.choices.length > 0) {
+		const newContent = chunk.choices[0].delta.content;
+		out += newContent;
+		console.log(newContent);
+	}
+}

package/src/snippets/templates/js/huggingface.js/textToImage.jinja ADDED Viewed

@@ -0,0 +1,11 @@
+import { InferenceClient } from "@huggingface/inference";
+const client = new InferenceClient("{{ accessToken }}");
+const image = await client.textToImage({
+    provider: "{{ provider }}",
+    model: "{{ model.id }}",
+	inputs: {{ inputs.asObj.inputs }},
+	parameters: { num_inference_steps: 5 },
+});
+/// Use the generated image (it's a Blob)

package/src/snippets/templates/js/huggingface.js/textToVideo.jinja ADDED Viewed

@@ -0,0 +1,10 @@
+import { InferenceClient } from "@huggingface/inference";
+const client = new InferenceClient("{{ accessToken }}");
+const image = await client.textToVideo({
+    provider: "{{ provider }}",
+    model: "{{ model.id }}",
+	inputs: {{ inputs.asObj.inputs }},
+});
+// Use the generated video (it's a Blob)

package/src/snippets/templates/js/openai/conversational.jinja ADDED Viewed

@@ -0,0 +1,13 @@
+import { OpenAI } from "openai";
+const client = new OpenAI({
+	baseURL: "{{ baseUrl }}",
+	apiKey: "{{ accessToken }}",
+});
+const chatCompletion = await client.chat.completions.create({
+	model: "{{ providerModelId }}",
+{{ inputs.asTsString }}
+});
+console.log(chatCompletion.choices[0].message);