@huggingface/tasks 0.3.2 → 0.3.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/dist/index.js CHANGED
@@ -1260,7 +1260,7 @@ var PIPELINE_DATA = {
     color: "green"
   },
   "image-text-to-text": {
-    name: "Image + Text to Text (VLLMs)",
+    name: "Image-Text-to-Text",
     modality: "multimodal",
     color: "red",
     hideInDatasets: true
@@ -4406,6 +4406,41 @@ var pythae = (model) => [
 
 model = AutoModel.load_from_hf_hub("${model.id}")`
 ];
+var musicgen = (model) => [
+  `from audiocraft.models import MusicGen
+
+model = MusicGen.get_pretrained("${model.id}")
+
+descriptions = ['happy rock', 'energetic EDM', 'sad jazz']
+wav = model.generate(descriptions) # generates 3 samples.`
+];
+var magnet = (model) => [
+  `from audiocraft.models import MAGNeT
+
+model = MAGNeT.get_pretrained("${model.id}")
+
+descriptions = ['disco beat', 'energetic EDM', 'funky groove']
+wav = model.generate(descriptions) # generates 3 samples.`
+];
+var audiogen = (model) => [
+  `from audiocraft.models import AudioGen
+
+model = AudioGen.get_pretrained("${model.id}")
+model.set_generation_params(duration=5) # generate 5 seconds.
+descriptions = ['dog barking', 'sirene of an emergency vehicle', 'footsteps in a corridor']
+wav = model.generate(descriptions) # generates 3 samples.`
+];
+var audiocraft = (model) => {
+  if (model.tags?.includes("musicgen")) {
+    return musicgen(model);
+  } else if (model.tags?.includes("audiogen")) {
+    return audiogen(model);
+  } else if (model.tags?.includes("magnet")) {
+    return magnet(model);
+  } else {
+    return [`# Type of model unknown.`];
+  }
+};
 
 // src/model-libraries.ts
 var MODEL_LIBRARIES_UI_ELEMENTS = {
@@ -4439,6 +4474,13 @@ var MODEL_LIBRARIES_UI_ELEMENTS = {
       term: { path: "pytorch_model.bin" }
     }
   },
+  audiocraft: {
+    prettyLabel: "Audiocraft",
+    repoName: "audiocraft",
+    repoUrl: "https://github.com/facebookresearch/audiocraft",
+    snippets: audiocraft,
+    filter: false
+  },
   bertopic: {
     prettyLabel: "BERTopic",
     repoName: "BERTopic",
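
The bundled `audiocraft` helper above dispatches on the model's tags to pick a Python snippet. A minimal TypeScript sketch of that dispatch in isolation (the `ModelDataLite` type, the `pickSnippet` name, and the `facebook/musicgen-small` id are illustrative, not part of the package):

// Sketch: the same tag-based dispatch as the bundle, reduced to the two
// fields it actually reads. Unknown tags fall through to a placeholder.
type ModelDataLite = { id: string; tags?: string[] };

const pickSnippet = (model: ModelDataLite): string[] => {
  if (model.tags?.includes("musicgen")) {
    return [`from audiocraft.models import MusicGen\n\nmodel = MusicGen.get_pretrained("${model.id}")`];
  }
  if (model.tags?.includes("audiogen")) {
    return [`from audiocraft.models import AudioGen\n\nmodel = AudioGen.get_pretrained("${model.id}")`];
  }
  return ["# Type of model unknown."];
};

console.log(pickSnippet({ id: "facebook/musicgen-small", tags: ["musicgen"] })[0]);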
package/package.json CHANGED
@@ -1,7 +1,7 @@
 {
   "name": "@huggingface/tasks",
   "packageManager": "pnpm@8.10.5",
-  "version": "0.3.2",
+  "version": "0.3.4",
   "description": "List of ML tasks for huggingface.co/tasks",
   "repository": "https://github.com/huggingface/huggingface.js.git",
   "publishConfig": {
package/src/model-data.ts CHANGED
@@ -54,7 +54,7 @@ export interface ModelData {
       base_model_name?: string;
       task_type?: string;
     };
-    tokenizer?: TokenizerConfig;
+    tokenizer_config?: TokenizerConfig;
   };
   /**
    * all the model tags
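
Renaming `tokenizer` to `tokenizer_config` aligns the field with the `tokenizer_config.json` key it is populated from, but it is a breaking change for anyone reading the old field off `ModelData`. A hedged migration sketch (assuming `TokenizerConfig` exposes `chat_template`, as recent versions of the package define it; `getChatTemplate` is a hypothetical consumer helper):

import type { ModelData } from "@huggingface/tasks";

// 0.3.2 read model.config?.tokenizer; 0.3.4 reads model.config?.tokenizer_config.
function getChatTemplate(model: ModelData): unknown {
  return model.config?.tokenizer_config?.chat_template;
}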
@@ -80,7 +80,7 @@ export interface ModelData {
    */
   widgetData?: WidgetExample[] | undefined;
   /**
-   * Parameters that will be used by the widget when calling Inference Endpoints (serverless)
+   * Parameters that will be used by the widget when calling Inference API (serverless)
    * https://huggingface.co/docs/api-inference/detailed_parameters
    *
    * can be set in the model card metadata (under `inference/parameters`)
package/src/model-libraries-snippets.ts CHANGED
@@ -548,4 +548,42 @@ export const pythae = (model: ModelData): string[] => [
 model = AutoModel.load_from_hf_hub("${model.id}")`,
 ];
 
+const musicgen = (model: ModelData): string[] => [
+  `from audiocraft.models import MusicGen
+
+model = MusicGen.get_pretrained("${model.id}")
+
+descriptions = ['happy rock', 'energetic EDM', 'sad jazz']
+wav = model.generate(descriptions) # generates 3 samples.`,
+];
+
+const magnet = (model: ModelData): string[] => [
+  `from audiocraft.models import MAGNeT
+
+model = MAGNeT.get_pretrained("${model.id}")
+
+descriptions = ['disco beat', 'energetic EDM', 'funky groove']
+wav = model.generate(descriptions) # generates 3 samples.`,
+];
+
+const audiogen = (model: ModelData): string[] => [
+  `from audiocraft.models import AudioGen
+
+model = AudioGen.get_pretrained("${model.id}")
+model.set_generation_params(duration=5) # generate 5 seconds.
+descriptions = ['dog barking', 'sirene of an emergency vehicle', 'footsteps in a corridor']
+wav = model.generate(descriptions) # generates 3 samples.`,
+];
+
+export const audiocraft = (model: ModelData): string[] => {
+  if (model.tags?.includes("musicgen")) {
+    return musicgen(model);
+  } else if (model.tags?.includes("audiogen")) {
+    return audiogen(model);
+  } else if (model.tags?.includes("magnet")) {
+    return magnet(model);
+  } else {
+    return [`# Type of model unknown.`];
+  }
+};
 //#endregion
package/src/model-libraries.ts CHANGED
@@ -88,6 +88,13 @@ export const MODEL_LIBRARIES_UI_ELEMENTS = {
       term: { path: "pytorch_model.bin" },
     },
   },
+  audiocraft: {
+    prettyLabel: "Audiocraft",
+    repoName: "audiocraft",
+    repoUrl: "https://github.com/facebookresearch/audiocraft",
+    snippets: snippets.audiocraft,
+    filter: false,
+  },
   bertopic: {
     prettyLabel: "BERTopic",
     repoName: "BERTopic",
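
This entry registers Audiocraft in the libraries UI map, giving Audiocraft models a labeled badge, a link to the GitHub repo, and the snippets from the dispatcher above; `filter: false` presumably keeps the library out of the filterable library list. A sketch of how a consumer might use the entry (assumes `MODEL_LIBRARIES_UI_ELEMENTS` and `ModelData` are re-exported from the package root; `renderAudiocraftSnippet` is a hypothetical helper):

import { MODEL_LIBRARIES_UI_ELEMENTS } from "@huggingface/tasks";
import type { ModelData } from "@huggingface/tasks";

function renderAudiocraftSnippet(model: ModelData): string {
  const entry = MODEL_LIBRARIES_UI_ELEMENTS.audiocraft;
  const header = `# ${entry.prettyLabel} (${entry.repoUrl})`;
  return [header, ...(entry.snippets?.(model) ?? [])].join("\n");
}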
package/src/pipelines.ts CHANGED
@@ -590,7 +590,7 @@ export const PIPELINE_DATA = {
     color: "green",
   },
   "image-text-to-text": {
-    name: "Image + Text to Text (VLLMs)",
+    name: "Image-Text-to-Text",
     modality: "multimodal",
     color: "red",
     hideInDatasets: true,
package/src/tasks/index.ts CHANGED
@@ -36,6 +36,64 @@ import zeroShotClassification from "./zero-shot-classification/data";
 import zeroShotImageClassification from "./zero-shot-image-classification/data";
 import zeroShotObjectDetection from "./zero-shot-object-detection/data";
 
+export type * from "./audio-classification/inference";
+export type * from "./automatic-speech-recognition/inference";
+export type * from "./document-question-answering/inference";
+export type * from "./feature-extraction/inference";
+export type * from "./fill-mask/inference";
+export type {
+  ImageClassificationInput,
+  ImageClassificationOutput,
+  ImageClassificationOutputElement,
+  ImageClassificationParameters,
+} from "./image-classification/inference";
+export type * from "./image-to-image/inference";
+export type { ImageToTextInput, ImageToTextOutput, ImageToTextParameters } from "./image-to-text/inference";
+export type * from "./image-segmentation/inference";
+export type * from "./object-detection/inference";
+export type * from "./depth-estimation/inference";
+export type * from "./question-answering/inference";
+export type * from "./sentence-similarity/inference";
+export type * from "./summarization/inference";
+export type * from "./table-question-answering/inference";
+export type { TextToImageInput, TextToImageOutput, TextToImageParameters } from "./text-to-image/inference";
+export type { TextToAudioParameters, TextToSpeechInput, TextToSpeechOutput } from "./text-to-speech/inference";
+export type * from "./token-classification/inference";
+export type {
+  Text2TextGenerationParameters,
+  Text2TextGenerationTruncationStrategy,
+  TranslationInput,
+  TranslationOutput,
+} from "./translation/inference";
+export type {
+  ClassificationOutputTransform,
+  TextClassificationInput,
+  TextClassificationOutput,
+  TextClassificationOutputElement,
+  TextClassificationParameters,
+} from "./text-classification/inference";
+export type {
+  FinishReason,
+  PrefillToken,
+  TextGenerationInput,
+  TextGenerationOutput,
+  TextGenerationOutputDetails,
+  TextGenerationParameters,
+  TextGenerationSequenceDetails,
+  Token,
+} from "./text-generation/inference";
+export type * from "./video-classification/inference";
+export type * from "./visual-question-answering/inference";
+export type * from "./zero-shot-classification/inference";
+export type * from "./zero-shot-image-classification/inference";
+export type {
+  BoundingBox,
+  ZeroShotObjectDetectionInput,
+  ZeroShotObjectDetectionInputData,
+  ZeroShotObjectDetectionOutput,
+  ZeroShotObjectDetectionOutputElement,
+} from "./zero-shot-object-detection/inference";
+
 import type { ModelLibraryKey } from "../model-libraries";
 
 /**
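
These re-exports let downstream code import the generated inference types from the package root rather than from deep module paths. A short sketch (assuming the root `index.ts` re-exports this module, which is what the bundled output suggests):

import type { TextGenerationInput, SummarizationOutput } from "@huggingface/tasks";

const req: TextGenerationInput = { inputs: "Once upon a time" };
const res: SummarizationOutput = { summary_text: "A tale begins." };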
package/src/tasks/summarization/inference.ts CHANGED
@@ -45,15 +45,12 @@ export interface Text2TextGenerationParameters {
 export type Text2TextGenerationTruncationStrategy = "do_not_truncate" | "longest_first" | "only_first" | "only_second";
 
 /**
- * Outputs for Summarization inference
- *
- * Outputs of inference for the Text2text Generation task
+ * Outputs of inference for the Summarization task
  */
 export interface SummarizationOutput {
-  generatedText: unknown;
   /**
-   * The generated text.
+   * The summarized text.
    */
-  generated_text?: string;
+  summary_text: string;
   [property: string]: unknown;
 }
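
`SummarizationOutput` no longer inherits the Text2Text Generation shape: the stray `generatedText: unknown` member is gone and the optional `generated_text` is replaced by a required `summary_text`. Migration is a field rename on the consumer side, sketched here:

import type { SummarizationOutput } from "@huggingface/tasks";

function getSummary(output: SummarizationOutput): string {
  // 0.3.2 consumers read output.generated_text (optional);
  // 0.3.4 guarantees summary_text.
  return output.summary_text;
}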
package/src/tasks/summarization/spec/output.json CHANGED
@@ -1,7 +1,14 @@
 {
-  "$ref": "/inference/schemas/text2text-generation/output.json",
   "$id": "/inference/schemas/summarization/output.json",
   "$schema": "http://json-schema.org/draft-06/schema#",
+  "description": "Outputs of inference for the Summarization task",
   "title": "SummarizationOutput",
-  "description": "Outputs for Summarization inference"
+  "type": "object",
+  "properties": {
+    "summary_text": {
+      "type": "string",
+      "description": "The summarized text."
+    }
+  },
+  "required": ["summary_text"]
 }
package/src/tasks/translation/inference.ts CHANGED
@@ -45,15 +45,12 @@ export interface Text2TextGenerationParameters {
 export type Text2TextGenerationTruncationStrategy = "do_not_truncate" | "longest_first" | "only_first" | "only_second";
 
 /**
- * Outputs for Translation inference
- *
- * Outputs of inference for the Text2text Generation task
+ * Outputs of inference for the Translation task
  */
 export interface TranslationOutput {
-  generatedText: unknown;
   /**
-   * The generated text.
+   * The translated text.
    */
-  generated_text?: string;
+  translation_text: string;
   [property: string]: unknown;
 }
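
The translation type gets the same fix, with a required `translation_text` replacing the inherited optional `generated_text`. Sketch:

import type { TranslationOutput } from "@huggingface/tasks";

const output: TranslationOutput = { translation_text: "Bonjour le monde" };
console.log(output.translation_text); // was output.generated_text in 0.3.2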
package/src/tasks/translation/spec/output.json CHANGED
@@ -1,7 +1,14 @@
 {
-  "$ref": "/inference/schemas/text2text-generation/output.json",
   "$id": "/inference/schemas/translation/output.json",
   "$schema": "http://json-schema.org/draft-06/schema#",
+  "description": "Outputs of inference for the Translation task",
   "title": "TranslationOutput",
-  "description": "Outputs for Translation inference"
+  "type": "object",
+  "properties": {
+    "translation_text": {
+      "type": "string",
+      "description": "The translated text."
+    }
+  },
+  "required": ["translation_text"]
 }