npm - @huggingface/inference - Versions diffs - 2.5.2 → 2.6.0 - Mend

@huggingface/inference 2.5.2 → 2.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (37)

package/dist/index.d.ts +48 -2
package/dist/index.js +168 -78
package/dist/index.mjs +168 -78
package/package.json +1 -1
package/src/lib/getDefaultTask.ts +1 -1
package/src/lib/makeRequestOptions.ts +34 -5
package/src/tasks/audio/audioClassification.ts +4 -1
package/src/tasks/audio/audioToAudio.ts +4 -1
package/src/tasks/audio/automaticSpeechRecognition.ts +4 -1
package/src/tasks/audio/textToSpeech.ts +4 -1
package/src/tasks/custom/request.ts +3 -1
package/src/tasks/custom/streamingRequest.ts +3 -1
package/src/tasks/cv/imageClassification.ts +4 -1
package/src/tasks/cv/imageSegmentation.ts +4 -1
package/src/tasks/cv/imageToImage.ts +4 -1
package/src/tasks/cv/imageToText.ts +6 -1
package/src/tasks/cv/objectDetection.ts +4 -1
package/src/tasks/cv/textToImage.ts +4 -1
package/src/tasks/cv/zeroShotImageClassification.ts +4 -1
package/src/tasks/multimodal/documentQuestionAnswering.ts +4 -1
package/src/tasks/multimodal/visualQuestionAnswering.ts +6 -1
package/src/tasks/nlp/conversational.ts +1 -1
package/src/tasks/nlp/featureExtraction.ts +7 -10
package/src/tasks/nlp/fillMask.ts +4 -1
package/src/tasks/nlp/questionAnswering.ts +4 -1
package/src/tasks/nlp/sentenceSimilarity.ts +6 -10
package/src/tasks/nlp/summarization.ts +4 -1
package/src/tasks/nlp/tableQuestionAnswering.ts +4 -1
package/src/tasks/nlp/textClassification.ts +6 -1
package/src/tasks/nlp/textGeneration.ts +4 -1
package/src/tasks/nlp/textGenerationStream.ts +4 -1
package/src/tasks/nlp/tokenClassification.ts +6 -1
package/src/tasks/nlp/translation.ts +4 -1
package/src/tasks/nlp/zeroShotClassification.ts +4 -1
package/src/tasks/tabular/tabularClassification.ts +4 -1
package/src/tasks/tabular/tabularRegression.ts +4 -1
package/src/types.ts +36 -2

package/dist/index.mjs CHANGED Viewed

@@ -45,15 +45,63 @@ function isUrl(modelOrUrl) {
   return /^http(s?):/.test(modelOrUrl) || modelOrUrl.startsWith("/");
 }
+// src/lib/getDefaultTask.ts
+var taskCache = /* @__PURE__ */ new Map();
+var CACHE_DURATION = 10 * 60 * 1e3;
+var MAX_CACHE_ITEMS = 1e3;
+var HF_HUB_URL = "https://huggingface.co";
+async function getDefaultTask(model, accessToken) {
+  if (isUrl(model)) {
+    return null;
+  }
+  const key = `${model}:${accessToken}`;
+  let cachedTask = taskCache.get(key);
+  if (cachedTask && cachedTask.date < new Date(Date.now() - CACHE_DURATION)) {
+    taskCache.delete(key);
+    cachedTask = void 0;
+  }
+  if (cachedTask === void 0) {
+    const modelTask = await fetch(`${HF_HUB_URL}/api/models/${model}?expand[]=pipeline_tag`, {
+      headers: accessToken ? { Authorization: `Bearer ${accessToken}` } : {}
+    }).then((resp) => resp.json()).then((json) => json.pipeline_tag).catch(() => null);
+    if (!modelTask) {
+      return null;
+    }
+    cachedTask = { task: modelTask, date: /* @__PURE__ */ new Date() };
+    taskCache.set(key, { task: modelTask, date: /* @__PURE__ */ new Date() });
+    if (taskCache.size > MAX_CACHE_ITEMS) {
+      taskCache.delete(taskCache.keys().next().value);
+    }
+  }
+  return cachedTask.task;
+}
 // src/lib/makeRequestOptions.ts
 var HF_INFERENCE_API_BASE_URL = "https://api-inference.huggingface.co";
-function makeRequestOptions(args, options) {
-  const { model, accessToken, ...otherArgs } = args;
-  const { task, includeCredentials, ...otherOptions } = options ?? {};
+var tasks = null;
+async function makeRequestOptions(args, options) {
+  const { accessToken, model: _model, ...otherArgs } = args;
+  let { model } = args;
+  const { forceTask: task, includeCredentials, taskHint, ...otherOptions } = options ?? {};
   const headers = {};
   if (accessToken) {
     headers["Authorization"] = `Bearer ${accessToken}`;
   }
+  if (!model && !tasks && taskHint) {
+    const res = await fetch(`${HF_HUB_URL}/api/tasks`);
+    if (res.ok) {
+      tasks = await res.json();
+    }
+  }
+  if (!model && tasks && taskHint) {
+    const taskInfo = tasks[taskHint];
+    if (taskInfo) {
+      model = taskInfo.models[0].id;
+    }
+  }
+  if (!model) {
+    throw new Error("No model provided, and no default model found for this task");
+  }
   const binary = "data" in args && !!args.data;
   if (!binary) {
     headers["Content-Type"] = "application/json";
@@ -91,7 +139,7 @@ function makeRequestOptions(args, options) {
 // src/tasks/custom/request.ts
 async function request(args, options) {
-  const { url, info } = makeRequestOptions(args, options);
+  const { url, info } = await makeRequestOptions(args, options);
   const response = await (options?.fetch ?? fetch)(url, info);
   if (options?.retry_on_error !== false && response.status === 503 && !options?.wait_for_model) {
     return request(args, {
@@ -215,7 +263,7 @@ function newMessage() {
 // src/tasks/custom/streamingRequest.ts
 async function* streamingRequest(args, options) {
-  const { url, info } = makeRequestOptions({ ...args, stream: true }, options);
+  const { url, info } = await makeRequestOptions({ ...args, stream: true }, options);
   const response = await (options?.fetch ?? fetch)(url, info);
   if (options?.retry_on_error !== false && response.status === 503 && !options?.wait_for_model) {
     return streamingRequest(args, {
@@ -288,7 +336,10 @@ var InferenceOutputError = class extends TypeError {
 // src/tasks/audio/audioClassification.ts
 async function audioClassification(args, options) {
-  const res = await request(args, options);
+  const res = await request(args, {
+    ...options,
+    taskHint: "audio-classification"
+  });
   const isValidOutput = Array.isArray(res) && res.every((x) => typeof x.label === "string" && typeof x.score === "number");
   if (!isValidOutput) {
     throw new InferenceOutputError("Expected Array<{label: string, score: number}>");
@@ -298,7 +349,10 @@ async function audioClassification(args, options) {
 // src/tasks/audio/automaticSpeechRecognition.ts
 async function automaticSpeechRecognition(args, options) {
-  const res = await request(args, options);
+  const res = await request(args, {
+    ...options,
+    taskHint: "automatic-speech-recognition"
+  });
   const isValidOutput = typeof res?.text === "string";
   if (!isValidOutput) {
     throw new InferenceOutputError("Expected {text: string}");
@@ -308,7 +362,10 @@ async function automaticSpeechRecognition(args, options) {
 // src/tasks/audio/textToSpeech.ts
 async function textToSpeech(args, options) {
-  const res = await request(args, options);
+  const res = await request(args, {
+    ...options,
+    taskHint: "text-to-speech"
+  });
   const isValidOutput = res && res instanceof Blob;
   if (!isValidOutput) {
     throw new InferenceOutputError("Expected Blob");
@@ -318,7 +375,10 @@ async function textToSpeech(args, options) {
 // src/tasks/audio/audioToAudio.ts
 async function audioToAudio(args, options) {
-  const res = await request(args, options);
+  const res = await request(args, {
+    ...options,
+    taskHint: "audio-to-audio"
+  });
   const isValidOutput = Array.isArray(res) && res.every(
     (x) => typeof x.label === "string" && typeof x.blob === "string" && typeof x["content-type"] === "string"
   );
@@ -330,7 +390,10 @@ async function audioToAudio(args, options) {
 // src/tasks/cv/imageClassification.ts
 async function imageClassification(args, options) {
-  const res = await request(args, options);
+  const res = await request(args, {
+    ...options,
+    taskHint: "image-classification"
+  });
   const isValidOutput = Array.isArray(res) && res.every((x) => typeof x.label === "string" && typeof x.score === "number");
   if (!isValidOutput) {
     throw new InferenceOutputError("Expected Array<{label: string, score: number}>");
@@ -340,7 +403,10 @@ async function imageClassification(args, options) {
 // src/tasks/cv/imageSegmentation.ts
 async function imageSegmentation(args, options) {
-  const res = await request(args, options);
+  const res = await request(args, {
+    ...options,
+    taskHint: "image-segmentation"
+  });
   const isValidOutput = Array.isArray(res) && res.every((x) => typeof x.label === "string" && typeof x.mask === "string" && typeof x.score === "number");
   if (!isValidOutput) {
     throw new InferenceOutputError("Expected Array<{label: string, mask: string, score: number}>");
@@ -350,7 +416,10 @@ async function imageSegmentation(args, options) {
 // src/tasks/cv/imageToText.ts
 async function imageToText(args, options) {
-  const res = (await request(args, options))?.[0];
+  const res = (await request(args, {
+    ...options,
+    taskHint: "image-to-text"
+  }))?.[0];
   if (typeof res?.generated_text !== "string") {
     throw new InferenceOutputError("Expected {generated_text: string}");
   }
@@ -359,7 +428,10 @@ async function imageToText(args, options) {
 // src/tasks/cv/objectDetection.ts
 async function objectDetection(args, options) {
-  const res = await request(args, options);
+  const res = await request(args, {
+    ...options,
+    taskHint: "object-detection"
+  });
   const isValidOutput = Array.isArray(res) && res.every(
     (x) => typeof x.label === "string" && typeof x.score === "number" && typeof x.box.xmin === "number" && typeof x.box.ymin === "number" && typeof x.box.xmax === "number" && typeof x.box.ymax === "number"
   );
@@ -373,7 +445,10 @@ async function objectDetection(args, options) {
 // src/tasks/cv/textToImage.ts
 async function textToImage(args, options) {
-  const res = await request(args, options);
+  const res = await request(args, {
+    ...options,
+    taskHint: "text-to-image"
+  });
   const isValidOutput = res && res instanceof Blob;
   if (!isValidOutput) {
     throw new InferenceOutputError("Expected Blob");
@@ -415,7 +490,10 @@ async function imageToImage(args, options) {
       )
     };
   }
-  const res = await request(reqArgs, options);
+  const res = await request(reqArgs, {
+    ...options,
+    taskHint: "image-to-image"
+  });
   const isValidOutput = res && res instanceof Blob;
   if (!isValidOutput) {
     throw new InferenceOutputError("Expected Blob");
@@ -435,7 +513,10 @@ async function zeroShotImageClassification(args, options) {
       )
     }
   };
-  const res = await request(reqArgs, options);
+  const res = await request(reqArgs, {
+    ...options,
+    taskHint: "zero-shot-image-classification"
+  });
   const isValidOutput = Array.isArray(res) && res.every((x) => typeof x.label === "string" && typeof x.score === "number");
   if (!isValidOutput) {
     throw new InferenceOutputError("Expected Array<{label: string, score: number}>");
@@ -445,7 +526,7 @@ async function zeroShotImageClassification(args, options) {
 // src/tasks/nlp/conversational.ts
 async function conversational(args, options) {
-  const res = await request(args, options);
+  const res = await request(args, { ...options, taskHint: "conversational" });
   const isValidOutput = Array.isArray(res.conversation.generated_responses) && res.conversation.generated_responses.every((x) => typeof x === "string") && Array.isArray(res.conversation.past_user_inputs) && res.conversation.past_user_inputs.every((x) => typeof x === "string") && typeof res.generated_text === "string" && Array.isArray(res.warnings) && res.warnings.every((x) => typeof x === "string");
   if (!isValidOutput) {
     throw new InferenceOutputError(
@@ -455,47 +536,14 @@ async function conversational(args, options) {
   return res;
 }
-// src/lib/getDefaultTask.ts
-var taskCache = /* @__PURE__ */ new Map();
-var CACHE_DURATION = 10 * 60 * 1e3;
-var MAX_CACHE_ITEMS = 1e3;
-var HF_HUB_URL = "https://huggingface.co";
-async function getDefaultTask(model, accessToken) {
-  if (isUrl(model)) {
-    return null;
-  }
-  const key = `${model}:${accessToken}`;
-  let cachedTask = taskCache.get(key);
-  if (cachedTask && cachedTask.date < new Date(Date.now() - CACHE_DURATION)) {
-    taskCache.delete(key);
-    cachedTask = void 0;
-  }
-  if (cachedTask === void 0) {
-    const modelTask = await fetch(`${HF_HUB_URL}/api/models/${model}?expand[]=pipeline_tag`, {
-      headers: accessToken ? { Authorization: `Bearer ${accessToken}` } : {}
-    }).then((resp) => resp.json()).then((json) => json.pipeline_tag).catch(() => null);
-    if (!modelTask) {
-      return null;
-    }
-    cachedTask = { task: modelTask, date: /* @__PURE__ */ new Date() };
-    taskCache.set(key, { task: modelTask, date: /* @__PURE__ */ new Date() });
-    if (taskCache.size > MAX_CACHE_ITEMS) {
-      taskCache.delete(taskCache.keys().next().value);
-    }
-  }
-  return cachedTask.task;
-}
 // src/tasks/nlp/featureExtraction.ts
 async function featureExtraction(args, options) {
-  const defaultTask = await getDefaultTask(args.model, args.accessToken);
-  const res = await request(
-    args,
-    defaultTask === "sentence-similarity" ? {
-      ...options,
-      task: "feature-extraction"
-    } : options
-  );
+  const defaultTask = args.model ? await getDefaultTask(args.model, args.accessToken) : void 0;
+  const res = await request(args, {
+    ...options,
+    taskHint: "feature-extraction",
+    ...defaultTask === "sentence-similarity" && { forceTask: "feature-extraction" }
+  });
   let isValidOutput = true;
   const isNumArrayRec = (arr, maxDepth, curDepth = 0) => {
     if (curDepth > maxDepth)
@@ -515,7 +563,10 @@ async function featureExtraction(args, options) {
 // src/tasks/nlp/fillMask.ts
 async function fillMask(args, options) {
-  const res = await request(args, options);
+  const res = await request(args, {
+    ...options,
+    taskHint: "fill-mask"
+  });
   const isValidOutput = Array.isArray(res) && res.every(
     (x) => typeof x.score === "number" && typeof x.sequence === "string" && typeof x.token === "number" && typeof x.token_str === "string"
   );
@@ -529,7 +580,10 @@ async function fillMask(args, options) {
 // src/tasks/nlp/questionAnswering.ts
 async function questionAnswering(args, options) {
-  const res = await request(args, options);
+  const res = await request(args, {
+    ...options,
+    taskHint: "question-answering"
+  });
   const isValidOutput = typeof res === "object" && !!res && typeof res.answer === "string" && typeof res.end === "number" && typeof res.score === "number" && typeof res.start === "number";
   if (!isValidOutput) {
     throw new InferenceOutputError("Expected {answer: string, end: number, score: number, start: number}");
@@ -539,14 +593,12 @@ async function questionAnswering(args, options) {
 // src/tasks/nlp/sentenceSimilarity.ts
 async function sentenceSimilarity(args, options) {
-  const defaultTask = await getDefaultTask(args.model, args.accessToken);
-  const res = await request(
-    args,
-    defaultTask === "feature-extraction" ? {
-      ...options,
-      task: "sentence-similarity"
-    } : options
-  );
+  const defaultTask = args.model ? await getDefaultTask(args.model, args.accessToken) : void 0;
+  const res = await request(args, {
+    ...options,
+    taskHint: "sentence-similarity",
+    ...defaultTask === "feature-extraction" && { forceTask: "sentence-similarity" }
+  });
   const isValidOutput = Array.isArray(res) && res.every((x) => typeof x === "number");
   if (!isValidOutput) {
     throw new InferenceOutputError("Expected number[]");
@@ -556,7 +608,10 @@ async function sentenceSimilarity(args, options) {
 // src/tasks/nlp/summarization.ts
 async function summarization(args, options) {
-  const res = await request(args, options);
+  const res = await request(args, {
+    ...options,
+    taskHint: "summarization"
+  });
   const isValidOutput = Array.isArray(res) && res.every((x) => typeof x?.summary_text === "string");
   if (!isValidOutput) {
     throw new InferenceOutputError("Expected Array<{summary_text: string}>");
@@ -566,7 +621,10 @@ async function summarization(args, options) {
 // src/tasks/nlp/tableQuestionAnswering.ts
 async function tableQuestionAnswering(args, options) {
-  const res = await request(args, options);
+  const res = await request(args, {
+    ...options,
+    taskHint: "table-question-answering"
+  });
   const isValidOutput = typeof res?.aggregator === "string" && typeof res.answer === "string" && Array.isArray(res.cells) && res.cells.every((x) => typeof x === "string") && Array.isArray(res.coordinates) && res.coordinates.every((coord) => Array.isArray(coord) && coord.every((x) => typeof x === "number"));
   if (!isValidOutput) {
     throw new InferenceOutputError(
@@ -578,7 +636,10 @@ async function tableQuestionAnswering(args, options) {
 // src/tasks/nlp/textClassification.ts
 async function textClassification(args, options) {
-  const res = (await request(args, options))?.[0];
+  const res = (await request(args, {
+    ...options,
+    taskHint: "text-classification"
+  }))?.[0];
   const isValidOutput = Array.isArray(res) && res.every((x) => typeof x?.label === "string" && typeof x.score === "number");
   if (!isValidOutput) {
     throw new InferenceOutputError("Expected Array<{label: string, score: number}>");
@@ -588,7 +649,10 @@ async function textClassification(args, options) {
 // src/tasks/nlp/textGeneration.ts
 async function textGeneration(args, options) {
-  const res = await request(args, options);
+  const res = await request(args, {
+    ...options,
+    taskHint: "text-generation"
+  });
   const isValidOutput = Array.isArray(res) && res.every((x) => typeof x?.generated_text === "string");
   if (!isValidOutput) {
     throw new InferenceOutputError("Expected Array<{generated_text: string}>");
@@ -598,7 +662,10 @@ async function textGeneration(args, options) {
 // src/tasks/nlp/textGenerationStream.ts
 async function* textGenerationStream(args, options) {
-  yield* streamingRequest(args, options);
+  yield* streamingRequest(args, {
+    ...options,
+    taskHint: "text-generation"
+  });
 }
 // src/utils/toArray.ts
@@ -611,7 +678,12 @@ function toArray(obj) {
 // src/tasks/nlp/tokenClassification.ts
 async function tokenClassification(args, options) {
-  const res = toArray(await request(args, options));
+  const res = toArray(
+    await request(args, {
+      ...options,
+      taskHint: "token-classification"
+    })
+  );
   const isValidOutput = Array.isArray(res) && res.every(
     (x) => typeof x.end === "number" && typeof x.entity_group === "string" && typeof x.score === "number" && typeof x.start === "number" && typeof x.word === "string"
   );
@@ -625,7 +697,10 @@ async function tokenClassification(args, options) {
 // src/tasks/nlp/translation.ts
 async function translation(args, options) {
-  const res = await request(args, options);
+  const res = await request(args, {
+    ...options,
+    taskHint: "translation"
+  });
   const isValidOutput = Array.isArray(res) && res.every((x) => typeof x?.translation_text === "string");
   if (!isValidOutput) {
     throw new InferenceOutputError("Expected type Array<{translation_text: string}>");
@@ -636,7 +711,10 @@ async function translation(args, options) {
 // src/tasks/nlp/zeroShotClassification.ts
 async function zeroShotClassification(args, options) {
   const res = toArray(
-    await request(args, options)
+    await request(args, {
+      ...options,
+      taskHint: "zero-shot-classification"
+    })
   );
   const isValidOutput = Array.isArray(res) && res.every(
     (x) => Array.isArray(x.labels) && x.labels.every((_label) => typeof _label === "string") && Array.isArray(x.scores) && x.scores.every((_score) => typeof _score === "number") && typeof x.sequence === "string"
@@ -662,7 +740,10 @@ async function documentQuestionAnswering(args, options) {
     }
   };
   const res = toArray(
-    await request(reqArgs, options)
+    await request(reqArgs, {
+      ...options,
+      taskHint: "document-question-answering"
+    })
   )?.[0];
   const isValidOutput = typeof res?.answer === "string" && (typeof res.end === "number" || typeof res.end === "undefined") && (typeof res.score === "number" || typeof res.score === "undefined") && (typeof res.start === "number" || typeof res.start === "undefined");
   if (!isValidOutput) {
@@ -685,7 +766,10 @@ async function visualQuestionAnswering(args, options) {
       )
     }
   };
-  const res = (await request(reqArgs, options))?.[0];
+  const res = (await request(reqArgs, {
+    ...options,
+    taskHint: "visual-question-answering"
+  }))?.[0];
   const isValidOutput = typeof res?.answer === "string" && typeof res.score === "number";
   if (!isValidOutput) {
     throw new InferenceOutputError("Expected Array<{answer: string, score: number}>");
@@ -695,7 +779,10 @@ async function visualQuestionAnswering(args, options) {
 // src/tasks/tabular/tabularRegression.ts
 async function tabularRegression(args, options) {
-  const res = await request(args, options);
+  const res = await request(args, {
+    ...options,
+    taskHint: "tabular-regression"
+  });
   const isValidOutput = Array.isArray(res) && res.every((x) => typeof x === "number");
   if (!isValidOutput) {
     throw new InferenceOutputError("Expected number[]");
@@ -705,7 +792,10 @@ async function tabularRegression(args, options) {
 // src/tasks/tabular/tabularClassification.ts
 async function tabularClassification(args, options) {
-  const res = await request(args, options);
+  const res = await request(args, {
+    ...options,
+    taskHint: "tabular-classification"
+  });
   const isValidOutput = Array.isArray(res) && res.every((x) => typeof x === "number");
   if (!isValidOutput) {
     throw new InferenceOutputError("Expected number[]");

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@huggingface/inference",
-  "version": "2.5.2",
+  "version": "2.6.0",
   "packageManager": "pnpm@8.3.1",
   "license": "MIT",
   "author": "Tim Mikeladze <tim.mikeladze@gmail.com>",

package/src/lib/getDefaultTask.ts CHANGED Viewed

@@ -8,7 +8,7 @@ import { isUrl } from "./isUrl";
 const taskCache = new Map<string, { task: string; date: Date }>();
 const CACHE_DURATION = 10 * 60 * 1000;
 const MAX_CACHE_ITEMS = 1000;
-const HF_HUB_URL = "https://huggingface.co";
+export const HF_HUB_URL = "https://huggingface.co";
 /**
  * Get the default task. Use a LRU cache of 1000 items with 10 minutes expiration

package/src/lib/makeRequestOptions.ts CHANGED Viewed

@@ -1,12 +1,18 @@
 import type { InferenceTask, Options, RequestArgs } from "../types";
+import { HF_HUB_URL } from "./getDefaultTask";
 import { isUrl } from "./isUrl";
 const HF_INFERENCE_API_BASE_URL = "https://api-inference.huggingface.co";
+/**
+ * Loaded from huggingface.co/api/tasks if needed
+ */
+let tasks: Record<string, { models: { id: string }[] }> | null = null;
 /**
  * Helper that prepares request arguments
  */
-export function makeRequestOptions(
+export async function makeRequestOptions(
 	args: RequestArgs & {
 		data?: Blob | ArrayBuffer;
 		stream?: boolean;
@@ -15,17 +21,40 @@ export function makeRequestOptions(
 		/** For internal HF use, which is why it's not exposed in {@link Options} */
 		includeCredentials?: boolean;
 		/** When a model can be used for multiple tasks, and we want to run a non-default task */
-		task?: string | InferenceTask;
+		forceTask?: string | InferenceTask;
+		/** To load default model if needed */
+		taskHint?: InferenceTask;
 	}
-): { url: string; info: RequestInit } {
-	const { model, accessToken, ...otherArgs } = args;
-	const { task, includeCredentials, ...otherOptions } = options ?? {};
+): Promise<{ url: string; info: RequestInit }> {
+	// eslint-disable-next-line @typescript-eslint/no-unused-vars
+	const { accessToken, model: _model, ...otherArgs } = args;
+	let { model } = args;
+	const { forceTask: task, includeCredentials, taskHint, ...otherOptions } = options ?? {};
 	const headers: Record<string, string> = {};
 	if (accessToken) {
 		headers["Authorization"] = `Bearer ${accessToken}`;
 	}
+	if (!model && !tasks && taskHint) {
+		const res = await fetch(`${HF_HUB_URL}/api/tasks`);
+		if (res.ok) {
+			tasks = await res.json();
+		}
+	}
+	if (!model && tasks && taskHint) {
+		const taskInfo = tasks[taskHint];
+		if (taskInfo) {
+			model = taskInfo.models[0].id;
+		}
+	}
+	if (!model) {
+		throw new Error("No model provided, and no default model found for this task");
+	}
 	const binary = "data" in args && !!args.data;
 	if (!binary) {

package/src/tasks/audio/audioClassification.ts CHANGED Viewed

@@ -31,7 +31,10 @@ export async function audioClassification(
 	args: AudioClassificationArgs,
 	options?: Options
 ): Promise<AudioClassificationReturn> {
-	const res = await request<AudioClassificationReturn>(args, options);
+	const res = await request<AudioClassificationReturn>(args, {
+		...options,
+		taskHint: "audio-classification",
+	});
 	const isValidOutput =
 		Array.isArray(res) && res.every((x) => typeof x.label === "string" && typeof x.score === "number");
 	if (!isValidOutput) {

package/src/tasks/audio/audioToAudio.ts CHANGED Viewed

@@ -33,7 +33,10 @@ export type AudioToAudioReturn = AudioToAudioOutputValue[];
  * Example model: speechbrain/sepformer-wham does audio source separation.
  */
 export async function audioToAudio(args: AudioToAudioArgs, options?: Options): Promise<AudioToAudioReturn> {
-	const res = await request<AudioToAudioReturn>(args, options);
+	const res = await request<AudioToAudioReturn>(args, {
+		...options,
+		taskHint: "audio-to-audio",
+	});
 	const isValidOutput =
 		Array.isArray(res) &&
 		res.every(

package/src/tasks/audio/automaticSpeechRecognition.ts CHANGED Viewed

@@ -24,7 +24,10 @@ export async function automaticSpeechRecognition(
 	args: AutomaticSpeechRecognitionArgs,
 	options?: Options
 ): Promise<AutomaticSpeechRecognitionOutput> {
-	const res = await request<AutomaticSpeechRecognitionOutput>(args, options);
+	const res = await request<AutomaticSpeechRecognitionOutput>(args, {
+		...options,
+		taskHint: "automatic-speech-recognition",
+	});
 	const isValidOutput = typeof res?.text === "string";
 	if (!isValidOutput) {
 		throw new InferenceOutputError("Expected {text: string}");

package/src/tasks/audio/textToSpeech.ts CHANGED Viewed

@@ -16,7 +16,10 @@ export type TextToSpeechOutput = Blob;
  * Recommended model: espnet/kan-bayashi_ljspeech_vits
  */
 export async function textToSpeech(args: TextToSpeechArgs, options?: Options): Promise<TextToSpeechOutput> {
-	const res = await request<TextToSpeechOutput>(args, options);
+	const res = await request<TextToSpeechOutput>(args, {
+		...options,
+		taskHint: "text-to-speech",
+	});
 	const isValidOutput = res && res instanceof Blob;
 	if (!isValidOutput) {
 		throw new InferenceOutputError("Expected Blob");

package/src/tasks/custom/request.ts CHANGED Viewed

@@ -11,9 +11,11 @@ export async function request<T>(
 		includeCredentials?: boolean;
 		/** When a model can be used for multiple tasks, and we want to run a non-default task */
 		task?: string | InferenceTask;
+		/** To load default model if needed */
+		taskHint?: InferenceTask;
 	}
 ): Promise<T> {
-	const { url, info } = makeRequestOptions(args, options);
+	const { url, info } = await makeRequestOptions(args, options);
 	const response = await (options?.fetch ?? fetch)(url, info);
 	if (options?.retry_on_error !== false && response.status === 503 && !options?.wait_for_model) {

package/src/tasks/custom/streamingRequest.ts CHANGED Viewed

@@ -13,9 +13,11 @@ export async function* streamingRequest<T>(
 		includeCredentials?: boolean;
 		/** When a model can be used for multiple tasks, and we want to run a non-default task */
 		task?: string | InferenceTask;
+		/** To load default model if needed */
+		taskHint?: InferenceTask;
 	}
 ): AsyncGenerator<T> {
-	const { url, info } = makeRequestOptions({ ...args, stream: true }, options);
+	const { url, info } = await makeRequestOptions({ ...args, stream: true }, options);
 	const response = await (options?.fetch ?? fetch)(url, info);
 	if (options?.retry_on_error !== false && response.status === 503 && !options?.wait_for_model) {

package/src/tasks/cv/imageClassification.ts CHANGED Viewed

@@ -30,7 +30,10 @@ export async function imageClassification(
 	args: ImageClassificationArgs,
 	options?: Options
 ): Promise<ImageClassificationOutput> {
-	const res = await request<ImageClassificationOutput>(args, options);
+	const res = await request<ImageClassificationOutput>(args, {
+		...options,
+		taskHint: "image-classification",
+	});
 	const isValidOutput =
 		Array.isArray(res) && res.every((x) => typeof x.label === "string" && typeof x.score === "number");
 	if (!isValidOutput) {

package/src/tasks/cv/imageSegmentation.ts CHANGED Viewed

@@ -34,7 +34,10 @@ export async function imageSegmentation(
 	args: ImageSegmentationArgs,
 	options?: Options
 ): Promise<ImageSegmentationOutput> {
-	const res = await request<ImageSegmentationOutput>(args, options);
+	const res = await request<ImageSegmentationOutput>(args, {
+		...options,
+		taskHint: "image-segmentation",
+	});
 	const isValidOutput =
 		Array.isArray(res) &&
 		res.every((x) => typeof x.label === "string" && typeof x.mask === "string" && typeof x.score === "number");

package/src/tasks/cv/imageToImage.ts CHANGED Viewed

@@ -74,7 +74,10 @@ export async function imageToImage(args: ImageToImageArgs, options?: Options): P
 			),
 		};
 	}
-	const res = await request<ImageToImageOutput>(reqArgs, options);
+	const res = await request<ImageToImageOutput>(reqArgs, {
+		...options,
+		taskHint: "image-to-image",
+	});
 	const isValidOutput = res && res instanceof Blob;
 	if (!isValidOutput) {
 		throw new InferenceOutputError("Expected Blob");