@huggingface/tasks 0.2.2 → 0.3.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +1 -1
- package/dist/index.cjs +3144 -3085
- package/dist/index.d.ts +441 -74
- package/dist/index.js +3143 -3084
- package/package.json +1 -1
- package/src/index.ts +2 -5
- package/src/library-to-tasks.ts +1 -1
- package/src/model-libraries-downloads.ts +20 -0
- package/src/{library-ui-elements.ts → model-libraries-snippets.ts} +46 -292
- package/src/model-libraries.ts +375 -44
- package/src/pipelines.ts +14 -8
- package/src/tasks/audio-classification/inference.ts +4 -4
- package/src/tasks/audio-classification/spec/input.json +4 -4
- package/src/tasks/audio-classification/spec/output.json +1 -12
- package/src/tasks/automatic-speech-recognition/inference.ts +35 -30
- package/src/tasks/automatic-speech-recognition/spec/input.json +3 -3
- package/src/tasks/automatic-speech-recognition/spec/output.json +30 -28
- package/src/tasks/common-definitions.json +25 -17
- package/src/tasks/depth-estimation/inference.ts +10 -10
- package/src/tasks/depth-estimation/spec/input.json +3 -8
- package/src/tasks/depth-estimation/spec/output.json +9 -3
- package/src/tasks/document-question-answering/inference.ts +16 -8
- package/src/tasks/document-question-answering/spec/input.json +9 -9
- package/src/tasks/document-question-answering/spec/output.json +2 -2
- package/src/tasks/feature-extraction/inference.ts +1 -1
- package/src/tasks/feature-extraction/spec/input.json +2 -2
- package/src/tasks/fill-mask/inference.ts +4 -3
- package/src/tasks/fill-mask/spec/input.json +3 -3
- package/src/tasks/fill-mask/spec/output.json +1 -1
- package/src/tasks/image-classification/inference.ts +3 -3
- package/src/tasks/image-classification/spec/input.json +4 -4
- package/src/tasks/image-segmentation/inference.ts +3 -3
- package/src/tasks/image-segmentation/spec/input.json +4 -4
- package/src/tasks/image-to-image/inference.ts +5 -5
- package/src/tasks/image-to-image/spec/input.json +9 -7
- package/src/tasks/image-to-text/inference.ts +25 -20
- package/src/tasks/image-to-text/spec/input.json +3 -3
- package/src/tasks/image-to-text/spec/output.json +8 -11
- package/src/tasks/index.ts +2 -0
- package/src/tasks/object-detection/inference.ts +1 -1
- package/src/tasks/object-detection/spec/input.json +2 -2
- package/src/tasks/placeholder/spec/input.json +4 -4
- package/src/tasks/placeholder/spec/output.json +1 -1
- package/src/tasks/question-answering/inference.ts +8 -8
- package/src/tasks/question-answering/spec/input.json +9 -9
- package/src/tasks/sentence-similarity/inference.ts +1 -1
- package/src/tasks/sentence-similarity/spec/input.json +2 -2
- package/src/tasks/summarization/inference.ts +5 -4
- package/src/tasks/table-question-answering/inference.ts +1 -1
- package/src/tasks/table-question-answering/spec/input.json +8 -3
- package/src/tasks/text-classification/inference.ts +3 -3
- package/src/tasks/text-classification/spec/input.json +4 -4
- package/src/tasks/text-generation/inference.ts +123 -14
- package/src/tasks/text-generation/spec/input.json +28 -12
- package/src/tasks/text-generation/spec/output.json +112 -9
- package/src/tasks/text-to-audio/inference.ts +24 -19
- package/src/tasks/text-to-audio/spec/input.json +2 -2
- package/src/tasks/text-to-audio/spec/output.json +10 -13
- package/src/tasks/text-to-image/inference.ts +6 -8
- package/src/tasks/text-to-image/spec/input.json +9 -7
- package/src/tasks/text-to-image/spec/output.json +7 -9
- package/src/tasks/text-to-speech/inference.ts +18 -17
- package/src/tasks/text2text-generation/inference.ts +10 -8
- package/src/tasks/text2text-generation/spec/input.json +4 -4
- package/src/tasks/text2text-generation/spec/output.json +8 -11
- package/src/tasks/token-classification/inference.ts +4 -4
- package/src/tasks/token-classification/spec/input.json +4 -4
- package/src/tasks/token-classification/spec/output.json +1 -1
- package/src/tasks/translation/inference.ts +5 -4
- package/src/tasks/video-classification/inference.ts +5 -5
- package/src/tasks/video-classification/spec/input.json +6 -6
- package/src/tasks/visual-question-answering/inference.ts +2 -2
- package/src/tasks/visual-question-answering/spec/input.json +3 -3
- package/src/tasks/zero-shot-classification/inference.ts +3 -3
- package/src/tasks/zero-shot-classification/spec/input.json +4 -4
- package/src/tasks/zero-shot-image-classification/inference.ts +2 -2
- package/src/tasks/zero-shot-image-classification/spec/input.json +3 -3
- package/src/tasks/zero-shot-object-detection/inference.ts +1 -1
- package/src/tasks/zero-shot-object-detection/spec/input.json +2 -2
package/src/tasks/text-to-audio/spec/output.json

@@ -3,18 +3,15 @@
   "$schema": "http://json-schema.org/draft-06/schema#",
   "description": "Outputs of inference for the Text To Audio task",
   "title": "TextToAudioOutput",
-  "type": "
-  "
-  "
-
-  "audio": {
-  "description": "The generated audio waveform."
-  },
-  "samplingRate": {
-  "type": "number",
-  "description": "The sampling rate of the generated audio waveform."
-  }
+  "type": "object",
+  "properties": {
+    "audio": {
+      "description": "The generated audio waveform."
     },
-  "
-
+    "sampling_rate": {
+      "type": "number",
+      "description": "The sampling rate of the generated audio waveform."
+    }
+  },
+  "required": ["audio", "samplingRate"]
 }
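The output property is renamed to snake_case `sampling_rate`. A minimal sketch of a conforming value; the interface is restated from the schema above rather than imported, since this diff view does not show the corresponding inference.ts for the task:

```ts
// Restated from the schema above (not imported from the package).
// The schema leaves `audio` untyped, so it stays `unknown` here.
interface TextToAudioOutput {
	audio: unknown;
	sampling_rate?: number; // renamed from samplingRate in this release
	[property: string]: unknown;
}

const example: TextToAudioOutput = {
	audio: new Uint8Array(), // e.g. raw waveform bytes
	sampling_rate: 16_000,
};
```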
package/src/tasks/text-to-image/inference.ts

@@ -11,7 +11,7 @@ export interface TextToImageInput {
 	/**
 	 * The input text data (sometimes called "prompt"
 	 */
-
+	inputs: string;
 	/**
 	 * Additional inference parameters
 	 */
@@ -29,16 +29,16 @@ export interface TextToImageParameters {
 	 * For diffusion models. A higher guidance scale value encourages the model to generate
 	 * images closely linked to the text prompt at the expense of lower image quality.
 	 */
-
+	guidance_scale?: number;
 	/**
 	 * One or several prompt to guide what NOT to include in image generation.
 	 */
-
+	negative_prompt?: string[];
 	/**
 	 * For diffusion models. The number of denoising steps. More denoising steps usually lead to
 	 * a higher quality image at the expense of slower inference.
 	 */
-
+	num_inference_steps?: number;
 	/**
 	 * For diffusion models. Override the scheduler with a compatible one
 	 */
@@ -46,7 +46,7 @@ export interface TextToImageParameters {
 	/**
 	 * The size in pixel of the output image
 	 */
-
+	target_size?: TargetSize;
 	[property: string]: unknown;
 }
 
@@ -62,9 +62,7 @@ export interface TargetSize {
 	/**
 	 * Outputs of inference for the Text To Image task
 	 */
-export
-
-export interface TextToImageOutputObject {
+export interface TextToImageOutput {
 	/**
 	 * The generated image
 	 */
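The practical effect is that request payloads are now typed with snake_case keys, and the output type collapses to a single `TextToImageOutput` interface. A minimal sketch, assuming the task types are re-exported from the package root (the file list shows src/tasks/index.ts gaining exports):

```ts
// Import path is an assumption; adjust to wherever your build resolves the types.
import type { TextToImageInput } from "@huggingface/tasks";

const request: TextToImageInput = {
	inputs: "a watercolor lighthouse at dusk", // the prompt
	parameters: {
		guidance_scale: 7.5, // camelCase before this release
		negative_prompt: ["blurry", "low resolution"],
		num_inference_steps: 30,
	},
};
```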
package/src/tasks/text-to-image/spec/input.json

@@ -5,7 +5,7 @@
   "title": "TextToImageInput",
   "type": "object",
   "properties": {
-    "
+    "inputs": {
       "description": "The input text data (sometimes called \"prompt\"",
       "type": "string"
     },
@@ -20,20 +20,22 @@
       "description": "Additional inference parameters for Text To Image",
       "type": "object",
       "properties": {
-        "
+        "guidance_scale": {
           "type": "number",
           "description": "For diffusion models. A higher guidance scale value encourages the model to generate images closely linked to the text prompt at the expense of lower image quality."
         },
-        "
+        "negative_prompt": {
           "type": "array",
-          "items": {
+          "items": {
+            "type": "string"
+          },
           "description": "One or several prompt to guide what NOT to include in image generation."
         },
-        "
+        "num_inference_steps": {
           "type": "integer",
           "description": "For diffusion models. The number of denoising steps. More denoising steps usually lead to a higher quality image at the expense of slower inference."
         },
-        "
+        "target_size": {
           "type": "object",
           "description": "The size in pixel of the output image",
           "properties": {
@@ -53,5 +55,5 @@
       }
     }
   },
-  "required": ["
+  "required": ["inputs"]
 }
package/src/tasks/text-to-image/spec/output.json

@@ -3,13 +3,11 @@
   "$schema": "http://json-schema.org/draft-06/schema#",
   "description": "Outputs of inference for the Text To Image task",
   "title": "TextToImageOutput",
-  "type": "
-  "
-  "
-  "
-
-
-
-  "required": ["image"]
-  }
+  "type": "object",
+  "properties": {
+    "image": {
+      "description": "The generated image"
+    }
+  },
+  "required": ["image"]
 }
package/src/tasks/text-to-speech/inference.ts

@@ -13,7 +13,7 @@ export interface TextToSpeechInput {
 	/**
 	 * The input text data
 	 */
-
+	inputs: string;
 	/**
 	 * Additional inference parameters
 	 */
@@ -43,18 +43,18 @@ export interface GenerationParameters {
 	/**
 	 * Whether to use sampling instead of greedy decoding when generating new tokens.
 	 */
-
+	do_sample?: boolean;
 	/**
 	 * Controls the stopping condition for beam-based methods.
 	 */
-
+	early_stopping?: EarlyStoppingUnion;
 	/**
 	 * If set to float strictly between 0 and 1, only tokens with a conditional probability
 	 * greater than epsilon_cutoff will be sampled. In the paper, suggested values range from
 	 * 3e-4 to 9e-4, depending on the size of the model. See [Truncation Sampling as Language
 	 * Model Desmoothing](https://hf.co/papers/2210.15191) for more details.
 	 */
-
+	epsilon_cutoff?: number;
 	/**
 	 * Eta sampling is a hybrid of locally typical sampling and epsilon sampling. If set to
 	 * float strictly between 0 and 1, a token is only considered if it is greater than either
@@ -64,37 +64,37 @@ export interface GenerationParameters {
 	 * See [Truncation Sampling as Language Model Desmoothing](https://hf.co/papers/2210.15191)
 	 * for more details.
 	 */
-
+	eta_cutoff?: number;
 	/**
 	 * The maximum length (in tokens) of the generated text, including the input.
 	 */
-
+	max_length?: number;
 	/**
 	 * The maximum number of tokens to generate. Takes precedence over maxLength.
 	 */
-
+	max_new_tokens?: number;
 	/**
 	 * The minimum length (in tokens) of the generated text, including the input.
 	 */
-
+	min_length?: number;
 	/**
 	 * The minimum number of tokens to generate. Takes precedence over maxLength.
 	 */
-
+	min_new_tokens?: number;
 	/**
 	 * Number of groups to divide num_beams into in order to ensure diversity among different
 	 * groups of beams. See [this paper](https://hf.co/papers/1610.02424) for more details.
 	 */
-
+	num_beam_groups?: number;
 	/**
 	 * Number of beams to use for beam search.
 	 */
-
+	num_beams?: number;
 	/**
 	 * The value balances the model confidence and the degeneration penalty in contrastive
 	 * search decoding.
 	 */
-
+	penalty_alpha?: number;
 	/**
 	 * The value used to modulate the next token probabilities.
 	 */
@@ -102,12 +102,12 @@ export interface GenerationParameters {
 	/**
 	 * The number of highest probability vocabulary tokens to keep for top-k-filtering.
 	 */
-
+	top_k?: number;
 	/**
 	 * If set to float < 1, only the smallest set of most probable tokens with probabilities
 	 * that add up to top_p or higher are kept for generation.
 	 */
-
+	top_p?: number;
 	/**
 	 * Local typicality measures how similar the conditional probability of predicting a target
 	 * token next is to the expected conditional probability of predicting a random token next,
@@ -115,11 +115,11 @@ export interface GenerationParameters {
 	 * most locally typical tokens with probabilities that add up to typical_p or higher are
 	 * kept for generation. See [this paper](https://hf.co/papers/2202.00666) for more details.
 	 */
-
+	typical_p?: number;
 	/**
 	 * Whether the model should use the past last key/values attentions to speed up decoding
 	 */
-
+	use_cache?: boolean;
 	[property: string]: unknown;
 }
 
@@ -138,9 +138,10 @@ export interface TextToSpeechOutput {
 	 * The generated audio waveform.
 	 */
 	audio: unknown;
+	samplingRate: unknown;
 	/**
 	 * The sampling rate of the generated audio waveform.
 	 */
-
+	sampling_rate?: number;
 	[property: string]: unknown;
 }
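Every field of the shared `GenerationParameters` moves to snake_case in one sweep. A sketch of a parameter object under the new names (same import-path assumption as above; `EarlyStoppingUnion` is referenced but not defined in this excerpt, so it is omitted):

```ts
// Import path is an assumption; the type itself is shown in the diff above.
import type { GenerationParameters } from "@huggingface/tasks";

const generation: GenerationParameters = {
	do_sample: true,
	max_new_tokens: 256, // takes precedence over max_length
	num_beams: 4,
	top_k: 50,
	top_p: 0.95,
};
```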
package/src/tasks/text2text-generation/inference.ts

@@ -3,6 +3,7 @@
  *
  * Using src/scripts/inference-codegen
  */
+
 /**
  * Inputs for Text2text Generation inference
  */
@@ -10,13 +11,14 @@ export interface Text2TextGenerationInput {
 	/**
 	 * The input text data
 	 */
-
+	inputs: string;
 	/**
 	 * Additional inference parameters
 	 */
 	parameters?: Text2TextGenerationParameters;
 	[property: string]: unknown;
 }
+
 /**
  * Additional inference parameters
  *
@@ -26,28 +28,28 @@ export interface Text2TextGenerationParameters {
 	/**
 	 * Whether to clean up the potential extra spaces in the text output.
 	 */
-
+	clean_up_tokenization_spaces?: boolean;
 	/**
 	 * Additional parametrization of the text generation algorithm
 	 */
-
-		[key: string]: unknown;
-	};
+	generate_parameters?: { [key: string]: unknown };
 	/**
 	 * The truncation strategy to use
 	 */
 	truncation?: Text2TextGenerationTruncationStrategy;
 	[property: string]: unknown;
 }
+
 export type Text2TextGenerationTruncationStrategy = "do_not_truncate" | "longest_first" | "only_first" | "only_second";
-
+
 /**
  * Outputs of inference for the Text2text Generation task
 */
-export interface
+export interface Text2TextGenerationOutput {
+	generatedText: unknown;
 	/**
	 * The generated text.
	 */
-
+	generated_text?: string;
 	[property: string]: unknown;
 }
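A sketch of a request against the regenerated input type (same import-path assumption as above):

```ts
import type { Text2TextGenerationInput } from "@huggingface/tasks";

const request: Text2TextGenerationInput = {
	inputs: "translate English to German: The house is wonderful.",
	parameters: {
		clean_up_tokenization_spaces: true,
		truncation: "longest_first", // one of the four strategies in the union above
		generate_parameters: { max_new_tokens: 64 }, // free-form passthrough object
	},
};
```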
package/src/tasks/text2text-generation/spec/input.json

@@ -5,7 +5,7 @@
   "title": "Text2TextGenerationInput",
   "type": "object",
   "properties": {
-    "
+    "inputs": {
       "description": "The input text data",
       "type": "string"
     },
@@ -20,7 +20,7 @@
       "description": "Additional inference parameters for Text2text Generation",
       "type": "object",
       "properties": {
-        "
+        "clean_up_tokenization_spaces": {
           "type": "boolean",
           "description": "Whether to clean up the potential extra spaces in the text output."
         },
@@ -43,7 +43,7 @@
           }
         ]
       },
-        "
+        "generate_parameters": {
          "title": "generateParameters",
          "type": "object",
          "description": "Additional parametrization of the text generation algorithm"
@@ -51,5 +51,5 @@
       }
     }
   },
-  "required": ["
+  "required": ["inputs"]
 }
package/src/tasks/text2text-generation/spec/output.json

@@ -3,15 +3,12 @@
   "$schema": "http://json-schema.org/draft-06/schema#",
   "description": "Outputs of inference for the Text2text Generation task",
   "title": "Text2TextGenerationOutput",
-  "type": "
-  "
-  "
-
-  "
-
-
-
-  },
-  "required": ["generatedText"]
-  }
+  "type": "object",
+  "properties": {
+    "generated_text": {
+      "type": "string",
+      "description": "The generated text."
+    }
+  },
+  "required": ["generatedText"]
 }
package/src/tasks/token-classification/inference.ts

@@ -10,7 +10,7 @@ export interface TokenClassificationInput {
 	/**
 	 * The input text data
 	 */
-
+	inputs: string;
 	/**
 	 * Additional inference parameters
 	 */
@@ -26,11 +26,11 @@ export interface TokenClassificationParameters {
 	/**
 	 * The strategy used to fuse tokens based on model predictions
 	 */
-
+	aggregation_strategy?: TokenClassificationAggregationStrategy;
 	/**
 	 * A list of labels to ignore
 	 */
-
+	ignore_labels?: string[];
 	/**
 	 * The number of overlapping tokens between chunks when splitting the input text.
 	 */
@@ -64,7 +64,7 @@ export interface TokenClassificationOutputElement {
 	/**
 	 * The predicted label for that group of tokens
 	 */
-
+	entity_group?: string;
 	label: unknown;
 	/**
 	 * The associated score / probability
package/src/tasks/token-classification/spec/input.json

@@ -5,7 +5,7 @@
   "title": "TokenClassificationInput",
   "type": "object",
   "properties": {
-    "
+    "inputs": {
       "description": "The input text data",
       "type": "string"
     },
@@ -20,7 +20,7 @@
       "description": "Additional inference parameters for Token Classification",
       "type": "object",
       "properties": {
-        "
+        "ignore_labels": {
           "type": "array",
           "items": {
             "type": "string"
@@ -31,7 +31,7 @@
           "type": "integer",
           "description": "The number of overlapping tokens between chunks when splitting the input text."
         },
-        "
+        "aggregation_strategy": {
           "title": "TokenClassificationAggregationStrategy",
           "type": "string",
           "description": "The strategy used to fuse tokens based on model predictions",
@@ -61,5 +61,5 @@
       }
     }
   },
-  "required": ["
+  "required": ["inputs"]
 }
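A sketch of a request under the new names. The enum values of `TokenClassificationAggregationStrategy` are outside this excerpt, so the `"simple"` value below is an assumption:

```ts
import type { TokenClassificationInput } from "@huggingface/tasks";

const request: TokenClassificationInput = {
	inputs: "My name is Clara and I live in Berkeley.",
	parameters: {
		aggregation_strategy: "simple", // assumed member of the enum referenced above
		ignore_labels: ["O"], // drop the "outside" label from NER output
	},
};
```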
package/src/tasks/translation/inference.ts

@@ -13,7 +13,7 @@ export interface TranslationInput {
 	/**
 	 * The input text data
 	 */
-
+	inputs: string;
 	/**
 	 * Additional inference parameters
 	 */
@@ -30,11 +30,11 @@ export interface Text2TextGenerationParameters {
 	/**
 	 * Whether to clean up the potential extra spaces in the text output.
 	 */
-
+	clean_up_tokenization_spaces?: boolean;
 	/**
 	 * Additional parametrization of the text generation algorithm
 	 */
-
+	generate_parameters?: { [key: string]: unknown };
 	/**
 	 * The truncation strategy to use
 	 */
@@ -50,9 +50,10 @@ export type Text2TextGenerationTruncationStrategy = "do_not_truncate" | "longest
 * Outputs of inference for the Text2text Generation task
 */
 export interface TranslationOutput {
+	generatedText: unknown;
 	/**
	 * The generated text.
	 */
-
+	generated_text?: string;
 	[property: string]: unknown;
 }
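On the output side, the typed field is now `generated_text`; camelCase `generatedText` survives only as an untyped leftover of the codegen. A small sketch of reading a result:

```ts
import type { TranslationOutput } from "@huggingface/tasks";

function readTranslation(output: TranslationOutput): string | undefined {
	// Prefer the typed snake_case field; `generatedText` is `unknown`.
	return output.generated_text;
}
```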
package/src/tasks/video-classification/inference.ts

@@ -10,7 +10,7 @@ export interface VideoClassificationInput {
 	/**
 	 * The input video data
 	 */
-
+	inputs: unknown;
 	/**
 	 * Additional inference parameters
 	 */
@@ -26,16 +26,16 @@ export interface VideoClassificationParameters {
 	/**
 	 * The sampling rate used to select frames from the video.
 	 */
-
-
+	frame_sampling_rate?: number;
+	function_to_apply?: ClassificationOutputTransform;
 	/**
 	 * The number of sampled frames to consider for classification.
 	 */
-
+	num_frames?: number;
 	/**
 	 * When specified, limits the output to the top K most probable classes.
 	 */
-
+	top_k?: number;
 	[property: string]: unknown;
 }
 /**
package/src/tasks/video-classification/spec/input.json

@@ -5,7 +5,7 @@
   "title": "VideoClassificationInput",
   "type": "object",
   "properties": {
-    "
+    "inputs": {
       "description": "The input video data"
     },
     "parameters": {
@@ -19,24 +19,24 @@
       "description": "Additional inference parameters for Video Classification",
       "type": "object",
       "properties": {
-        "
+        "function_to_apply": {
           "title": "TextClassificationOutputTransform",
           "$ref": "/inference/schemas/common-definitions.json#/definitions/ClassificationOutputTransform"
         },
-        "
+        "num_frames": {
           "type": "integer",
           "description": "The number of sampled frames to consider for classification."
         },
-        "
+        "frame_sampling_rate": {
           "type": "integer",
           "description": "The sampling rate used to select frames from the video."
         },
-        "
+        "top_k": {
           "type": "integer",
           "description": "When specified, limits the output to the top K most probable classes."
         }
       }
     }
   },
-  "required": ["
+  "required": ["inputs"]
 }
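A sketch of a request with the renamed parameters; the schema leaves the video payload untyped (`inputs: unknown`), so the placeholder string below stands in for whatever binary encoding a client actually sends:

```ts
import type { VideoClassificationInput } from "@huggingface/tasks";

const request: VideoClassificationInput = {
	inputs: "<binary video payload>", // untyped in the schema; placeholder here
	parameters: {
		num_frames: 16,
		frame_sampling_rate: 2,
		top_k: 5,
	},
};
```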
package/src/tasks/visual-question-answering/inference.ts

@@ -10,7 +10,7 @@ export interface VisualQuestionAnsweringInput {
 	/**
 	 * One (image, question) pair to answer
 	 */
-
+	inputs: VisualQuestionAnsweringInputData;
 	/**
 	 * Additional inference parameters
 	 */
@@ -42,7 +42,7 @@ export interface VisualQuestionAnsweringParameters {
 	 * return less than topk answers if there are not enough options available within the
 	 * context.
 	 */
-
+	top_k?: number;
 	[property: string]: unknown;
 }
 export type VisualQuestionAnsweringOutput = VisualQuestionAnsweringOutputElement[];
package/src/tasks/visual-question-answering/spec/input.json

@@ -5,7 +5,7 @@
   "title": "VisualQuestionAnsweringInput",
   "type": "object",
   "properties": {
-    "
+    "inputs": {
       "description": "One (image, question) pair to answer",
       "type": "object",
       "title": "VisualQuestionAnsweringInputData",
@@ -30,12 +30,12 @@
       "description": "Additional inference parameters for Visual Question Answering",
       "type": "object",
       "properties": {
-        "
+        "top_k": {
           "type": "integer",
           "description": "The number of answers to return (will be chosen by order of likelihood). Note that we return less than topk answers if there are not enough options available within the context."
         }
       }
     }
   },
-  "required": ["
+  "required": ["inputs"]
 }
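A sketch of a request; the property list of `VisualQuestionAnsweringInputData` is truncated in this diff view, so the `image`/`question` field names below are assumptions inferred from the "(image, question) pair" description:

```ts
import type { VisualQuestionAnsweringInput } from "@huggingface/tasks";

const request: VisualQuestionAnsweringInput = {
	inputs: {
		image: "cats.jpg", // field names assumed; not fully visible in this diff
		question: "How many cats are there?",
	},
	parameters: { top_k: 3 },
};
```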
package/src/tasks/zero-shot-classification/inference.ts

@@ -10,7 +10,7 @@ export interface ZeroShotClassificationInput {
 	/**
 	 * The input text data, with candidate labels
 	 */
-
+	inputs: ZeroShotClassificationInputData;
 	/**
 	 * Additional inference parameters
 	 */
@@ -41,13 +41,13 @@ export interface ZeroShotClassificationParameters {
 	 * The sentence used in conjunction with candidateLabels to attempt the text classification
 	 * by replacing the placeholder with the candidate labels.
 	 */
-
+	hypothesis_template?: string;
 	/**
 	 * Whether multiple candidate labels can be true. If false, the scores are normalized such
 	 * that the sum of the label likelihoods for each sequence is 1. If true, the labels are
 	 * considered independent and probabilities are normalized for each candidate.
 	 */
-
+	multi_label?: boolean;
 	[property: string]: unknown;
 }
 export type ZeroShotClassificationOutput = ZeroShotClassificationOutputElement[];
package/src/tasks/zero-shot-classification/spec/input.json

@@ -5,7 +5,7 @@
   "title": "ZeroShotClassificationInput",
   "type": "object",
   "properties": {
-    "
+    "inputs": {
       "description": "The input text data, with candidate labels",
       "type": "object",
       "title": "ZeroShotClassificationInputData",
@@ -35,16 +35,16 @@
       "description": "Additional inference parameters for Zero Shot Classification",
       "type": "object",
       "properties": {
-        "
+        "hypothesis_template": {
           "type": "string",
           "description": "The sentence used in conjunction with candidateLabels to attempt the text classification by replacing the placeholder with the candidate labels."
         },
-        "
+        "multi_label": {
           "type": "boolean",
           "description": "Whether multiple candidate labels can be true. If false, the scores are normalized such that the sum of the label likelihoods for each sequence is 1. If true, the labels are considered independent and probabilities are normalized for each candidate."
         }
       }
     }
   },
-  "required": ["
+  "required": ["inputs"]
 }
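A closing sketch of a zero-shot request; the `ZeroShotClassificationInputData` field names are not fully visible in this diff view, so `text`/`candidateLabels` below are assumptions (the latter inferred from the camelCase mention in the `hypothesis_template` description):

```ts
import type { ZeroShotClassificationInput } from "@huggingface/tasks";

const request: ZeroShotClassificationInput = {
	inputs: {
		text: "I have a problem with my iphone that needs to be resolved asap!",
		candidateLabels: ["urgent", "not urgent", "phone", "tablet"], // assumed field name
	},
	parameters: {
		hypothesis_template: "This example is {}.",
		multi_label: false, // scores across labels sum to 1
	},
};
```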