@huggingface/tasks 0.13.17 → 0.14.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (155)
  1. package/dist/commonjs/model-libraries-snippets.d.ts +2 -2
  2. package/dist/commonjs/model-libraries-snippets.d.ts.map +1 -1
  3. package/dist/commonjs/model-libraries-snippets.js +2 -2
  4. package/dist/commonjs/model-libraries.d.ts +2 -2
  5. package/dist/commonjs/tasks/audio-classification/inference.d.ts +1 -1
  6. package/dist/commonjs/tasks/audio-classification/inference.d.ts.map +1 -1
  7. package/dist/commonjs/tasks/automatic-speech-recognition/inference.d.ts +1 -1
  8. package/dist/commonjs/tasks/automatic-speech-recognition/inference.d.ts.map +1 -1
  9. package/dist/commonjs/tasks/automatic-speech-recognition/inference.js +0 -5
  10. package/dist/commonjs/tasks/chat-completion/inference.d.ts.map +1 -1
  11. package/dist/commonjs/tasks/chat-completion/inference.js +0 -5
  12. package/dist/commonjs/tasks/depth-estimation/inference.d.ts.map +1 -1
  13. package/dist/commonjs/tasks/depth-estimation/inference.js +0 -5
  14. package/dist/commonjs/tasks/feature-extraction/inference.d.ts.map +1 -1
  15. package/dist/commonjs/tasks/feature-extraction/inference.js +0 -5
  16. package/dist/commonjs/tasks/image-classification/inference.d.ts +1 -1
  17. package/dist/commonjs/tasks/image-classification/inference.d.ts.map +1 -1
  18. package/dist/commonjs/tasks/image-segmentation/inference.d.ts +1 -1
  19. package/dist/commonjs/tasks/image-segmentation/inference.d.ts.map +1 -1
  20. package/dist/commonjs/tasks/image-to-image/inference.d.ts +3 -3
  21. package/dist/commonjs/tasks/image-to-image/inference.d.ts.map +1 -1
  22. package/dist/commonjs/tasks/image-to-image/inference.js +0 -5
  23. package/dist/commonjs/tasks/image-to-text/inference.d.ts +1 -1
  24. package/dist/commonjs/tasks/image-to-text/inference.d.ts.map +1 -1
  25. package/dist/commonjs/tasks/image-to-text/inference.js +0 -5
  26. package/dist/commonjs/tasks/index.d.ts +1 -0
  27. package/dist/commonjs/tasks/index.d.ts.map +1 -1
  28. package/dist/commonjs/tasks/object-detection/inference.d.ts +1 -1
  29. package/dist/commonjs/tasks/object-detection/inference.d.ts.map +1 -1
  30. package/dist/commonjs/tasks/sentence-similarity/inference.d.ts.map +1 -1
  31. package/dist/commonjs/tasks/sentence-similarity/inference.js +0 -5
  32. package/dist/commonjs/tasks/summarization/inference.d.ts.map +1 -1
  33. package/dist/commonjs/tasks/summarization/inference.js +0 -5
  34. package/dist/commonjs/tasks/text-generation/inference.d.ts.map +1 -1
  35. package/dist/commonjs/tasks/text-generation/inference.js +0 -5
  36. package/dist/commonjs/tasks/text-to-audio/inference.d.ts +14 -15
  37. package/dist/commonjs/tasks/text-to-audio/inference.d.ts.map +1 -1
  38. package/dist/commonjs/tasks/text-to-audio/inference.js +0 -5
  39. package/dist/commonjs/tasks/text-to-image/inference.d.ts +2 -2
  40. package/dist/commonjs/tasks/text-to-image/inference.d.ts.map +1 -1
  41. package/dist/commonjs/tasks/text-to-image/inference.js +0 -5
  42. package/dist/commonjs/tasks/text-to-speech/inference.d.ts +14 -17
  43. package/dist/commonjs/tasks/text-to-speech/inference.d.ts.map +1 -1
  44. package/dist/commonjs/tasks/text-to-speech/inference.js +0 -5
  45. package/dist/commonjs/tasks/text-to-video/inference.d.ts +58 -0
  46. package/dist/commonjs/tasks/text-to-video/inference.d.ts.map +1 -0
  47. package/dist/commonjs/tasks/text-to-video/inference.js +2 -0
  48. package/dist/commonjs/tasks/text2text-generation/inference.d.ts.map +1 -1
  49. package/dist/commonjs/tasks/text2text-generation/inference.js +0 -5
  50. package/dist/commonjs/tasks/translation/inference.d.ts.map +1 -1
  51. package/dist/commonjs/tasks/translation/inference.js +0 -5
  52. package/dist/commonjs/tasks/visual-question-answering/inference.d.ts +1 -1
  53. package/dist/commonjs/tasks/visual-question-answering/inference.d.ts.map +1 -1
  54. package/dist/commonjs/tasks/zero-shot-image-classification/inference.d.ts +1 -1
  55. package/dist/commonjs/tasks/zero-shot-image-classification/inference.d.ts.map +1 -1
  56. package/dist/commonjs/tasks/zero-shot-object-detection/inference.d.ts +1 -1
  57. package/dist/commonjs/tasks/zero-shot-object-detection/inference.d.ts.map +1 -1
  58. package/dist/esm/model-libraries-snippets.d.ts +2 -2
  59. package/dist/esm/model-libraries-snippets.d.ts.map +1 -1
  60. package/dist/esm/model-libraries-snippets.js +2 -2
  61. package/dist/esm/model-libraries.d.ts +2 -2
  62. package/dist/esm/tasks/audio-classification/inference.d.ts +1 -1
  63. package/dist/esm/tasks/audio-classification/inference.d.ts.map +1 -1
  64. package/dist/esm/tasks/automatic-speech-recognition/inference.d.ts +1 -1
  65. package/dist/esm/tasks/automatic-speech-recognition/inference.d.ts.map +1 -1
  66. package/dist/esm/tasks/automatic-speech-recognition/inference.js +0 -5
  67. package/dist/esm/tasks/chat-completion/inference.d.ts.map +1 -1
  68. package/dist/esm/tasks/chat-completion/inference.js +0 -5
  69. package/dist/esm/tasks/depth-estimation/inference.d.ts.map +1 -1
  70. package/dist/esm/tasks/depth-estimation/inference.js +0 -5
  71. package/dist/esm/tasks/feature-extraction/inference.d.ts.map +1 -1
  72. package/dist/esm/tasks/feature-extraction/inference.js +0 -5
  73. package/dist/esm/tasks/image-classification/inference.d.ts +1 -1
  74. package/dist/esm/tasks/image-classification/inference.d.ts.map +1 -1
  75. package/dist/esm/tasks/image-segmentation/inference.d.ts +1 -1
  76. package/dist/esm/tasks/image-segmentation/inference.d.ts.map +1 -1
  77. package/dist/esm/tasks/image-to-image/inference.d.ts +3 -3
  78. package/dist/esm/tasks/image-to-image/inference.d.ts.map +1 -1
  79. package/dist/esm/tasks/image-to-image/inference.js +0 -5
  80. package/dist/esm/tasks/image-to-text/inference.d.ts +1 -1
  81. package/dist/esm/tasks/image-to-text/inference.d.ts.map +1 -1
  82. package/dist/esm/tasks/image-to-text/inference.js +0 -5
  83. package/dist/esm/tasks/index.d.ts +1 -0
  84. package/dist/esm/tasks/index.d.ts.map +1 -1
  85. package/dist/esm/tasks/object-detection/inference.d.ts +1 -1
  86. package/dist/esm/tasks/object-detection/inference.d.ts.map +1 -1
  87. package/dist/esm/tasks/sentence-similarity/inference.d.ts.map +1 -1
  88. package/dist/esm/tasks/sentence-similarity/inference.js +0 -5
  89. package/dist/esm/tasks/summarization/inference.d.ts.map +1 -1
  90. package/dist/esm/tasks/summarization/inference.js +0 -5
  91. package/dist/esm/tasks/text-generation/inference.d.ts.map +1 -1
  92. package/dist/esm/tasks/text-generation/inference.js +0 -5
  93. package/dist/esm/tasks/text-to-audio/inference.d.ts +14 -15
  94. package/dist/esm/tasks/text-to-audio/inference.d.ts.map +1 -1
  95. package/dist/esm/tasks/text-to-audio/inference.js +0 -5
  96. package/dist/esm/tasks/text-to-image/inference.d.ts +2 -2
  97. package/dist/esm/tasks/text-to-image/inference.d.ts.map +1 -1
  98. package/dist/esm/tasks/text-to-image/inference.js +0 -5
  99. package/dist/esm/tasks/text-to-speech/inference.d.ts +14 -17
  100. package/dist/esm/tasks/text-to-speech/inference.d.ts.map +1 -1
  101. package/dist/esm/tasks/text-to-speech/inference.js +0 -5
  102. package/dist/esm/tasks/text-to-video/inference.d.ts +58 -0
  103. package/dist/esm/tasks/text-to-video/inference.d.ts.map +1 -0
  104. package/dist/esm/tasks/text-to-video/inference.js +1 -0
  105. package/dist/esm/tasks/text2text-generation/inference.d.ts.map +1 -1
  106. package/dist/esm/tasks/text2text-generation/inference.js +0 -5
  107. package/dist/esm/tasks/translation/inference.d.ts.map +1 -1
  108. package/dist/esm/tasks/translation/inference.js +0 -5
  109. package/dist/esm/tasks/visual-question-answering/inference.d.ts +1 -1
  110. package/dist/esm/tasks/visual-question-answering/inference.d.ts.map +1 -1
  111. package/dist/esm/tasks/zero-shot-image-classification/inference.d.ts +1 -1
  112. package/dist/esm/tasks/zero-shot-image-classification/inference.d.ts.map +1 -1
  113. package/dist/esm/tasks/zero-shot-object-detection/inference.d.ts +1 -1
  114. package/dist/esm/tasks/zero-shot-object-detection/inference.d.ts.map +1 -1
  115. package/package.json +1 -1
  116. package/src/model-libraries-snippets.ts +3 -3
  117. package/src/tasks/audio-classification/inference.ts +1 -1
  118. package/src/tasks/audio-classification/spec/input.json +2 -1
  119. package/src/tasks/automatic-speech-recognition/inference.ts +1 -7
  120. package/src/tasks/automatic-speech-recognition/spec/input.json +2 -1
  121. package/src/tasks/chat-completion/inference.ts +0 -33
  122. package/src/tasks/depth-estimation/inference.ts +3 -3
  123. package/src/tasks/document-question-answering/spec/input.json +2 -1
  124. package/src/tasks/feature-extraction/inference.ts +0 -3
  125. package/src/tasks/image-classification/inference.ts +1 -1
  126. package/src/tasks/image-classification/spec/input.json +2 -1
  127. package/src/tasks/image-segmentation/inference.ts +1 -1
  128. package/src/tasks/image-segmentation/spec/input.json +2 -1
  129. package/src/tasks/image-to-image/inference.ts +3 -7
  130. package/src/tasks/image-to-image/spec/input.json +4 -6
  131. package/src/tasks/image-to-text/inference.ts +1 -6
  132. package/src/tasks/image-to-text/spec/input.json +2 -1
  133. package/src/tasks/index.ts +1 -0
  134. package/src/tasks/object-detection/inference.ts +1 -1
  135. package/src/tasks/object-detection/spec/input.json +2 -1
  136. package/src/tasks/sentence-similarity/inference.ts +3 -4
  137. package/src/tasks/summarization/inference.ts +3 -5
  138. package/src/tasks/text-generation/inference.ts +0 -13
  139. package/src/tasks/text-to-audio/inference.ts +14 -20
  140. package/src/tasks/text-to-audio/spec/output.json +3 -2
  141. package/src/tasks/text-to-image/inference.ts +2 -6
  142. package/src/tasks/text-to-image/spec/input.json +2 -5
  143. package/src/tasks/text-to-speech/inference.ts +14 -22
  144. package/src/tasks/text-to-speech/spec/output.json +13 -2
  145. package/src/tasks/text-to-video/inference.ts +57 -0
  146. package/src/tasks/text-to-video/spec/input.json +49 -0
  147. package/src/tasks/text-to-video/spec/output.json +13 -0
  148. package/src/tasks/text2text-generation/inference.ts +3 -5
  149. package/src/tasks/translation/inference.ts +3 -5
  150. package/src/tasks/visual-question-answering/inference.ts +1 -1
  151. package/src/tasks/visual-question-answering/spec/input.json +4 -2
  152. package/src/tasks/zero-shot-image-classification/inference.ts +1 -1
  153. package/src/tasks/zero-shot-image-classification/spec/input.json +2 -1
  154. package/src/tasks/zero-shot-object-detection/inference.ts +1 -1
  155. package/src/tasks/zero-shot-object-detection/spec/input.json +2 -1
@@ -3,7 +3,6 @@
3
3
  *
4
4
  * Using src/scripts/inference-codegen
5
5
  */
6
-
7
6
  /**
8
7
  * Inputs for Text2text Generation inference
9
8
  */
@@ -18,7 +17,6 @@ export interface Text2TextGenerationInput {
18
17
  parameters?: Text2TextGenerationParameters;
19
18
  [property: string]: unknown;
20
19
  }
21
-
22
20
  /**
23
21
  * Additional inference parameters for Text2text Generation
24
22
  */
@@ -30,16 +28,16 @@ export interface Text2TextGenerationParameters {
30
28
  /**
31
29
  * Additional parametrization of the text generation algorithm
32
30
  */
33
- generate_parameters?: { [key: string]: unknown };
31
+ generate_parameters?: {
32
+ [key: string]: unknown;
33
+ };
34
34
  /**
35
35
  * The truncation strategy to use
36
36
  */
37
37
  truncation?: Text2TextGenerationTruncationStrategy;
38
38
  [property: string]: unknown;
39
39
  }
40
-
41
40
  export type Text2TextGenerationTruncationStrategy = "do_not_truncate" | "longest_first" | "only_first" | "only_second";
42
-
43
41
  /**
44
42
  * Outputs of inference for the Text2text Generation task
45
43
  */
@@ -3,7 +3,6 @@
3
3
  *
4
4
  * Using src/scripts/inference-codegen
5
5
  */
6
-
7
6
  /**
8
7
  * Inputs for Translation inference
9
8
  */
@@ -18,7 +17,6 @@ export interface TranslationInput {
18
17
  parameters?: TranslationParameters;
19
18
  [property: string]: unknown;
20
19
  }
21
-
22
20
  /**
23
21
  * Additional inference parameters for Translation
24
22
  */
@@ -30,7 +28,9 @@ export interface TranslationParameters {
30
28
  /**
31
29
  * Additional parametrization of the text generation algorithm.
32
30
  */
33
- generate_parameters?: { [key: string]: unknown };
31
+ generate_parameters?: {
32
+ [key: string]: unknown;
33
+ };
34
34
  /**
35
35
  * The source language of the text. Required for models that can translate from multiple
36
36
  * languages.
@@ -47,12 +47,10 @@ export interface TranslationParameters {
47
47
  truncation?: TranslationTruncationStrategy;
48
48
  [property: string]: unknown;
49
49
  }
50
-
51
50
  /**
52
51
  * The truncation strategy to use.
53
52
  */
54
53
  export type TranslationTruncationStrategy = "do_not_truncate" | "longest_first" | "only_first" | "only_second";
55
-
56
54
  /**
57
55
  * Outputs of inference for the Translation task
58
56
  */
@@ -28,7 +28,7 @@ export interface VisualQuestionAnsweringInputData {
28
28
  /**
29
29
  * The question to answer based on the image.
30
30
  */
31
- question: unknown;
31
+ question: string;
32
32
  [property: string]: unknown;
33
33
  }
34
34
  /**
@@ -11,10 +11,12 @@
11
11
  "title": "VisualQuestionAnsweringInputData",
12
12
  "properties": {
13
13
  "image": {
14
- "description": "The image."
14
+ "description": "The image.",
15
+ "comment": "type=binary"
15
16
  },
16
17
  "question": {
17
- "description": "The question to answer based on the image."
18
+ "description": "The question to answer based on the image.",
19
+ "type": "string"
18
20
  }
19
21
  },
20
22
  "required": ["question", "image"]
@@ -10,7 +10,7 @@ export interface ZeroShotImageClassificationInput {
10
10
  /**
11
11
  * The input image data to classify as a base64-encoded string.
12
12
  */
13
- inputs: string;
13
+ inputs: Blob;
14
14
  /**
15
15
  * Additional inference parameters for Zero Shot Image Classification
16
16
  */
@@ -7,7 +7,8 @@
7
7
  "properties": {
8
8
  "inputs": {
9
9
  "type": "string",
10
- "description": "The input image data to classify as a base64-encoded string."
10
+ "description": "The input image data to classify as a base64-encoded string.",
11
+ "comment": "type=binary"
11
12
  },
12
13
  "parameters": {
13
14
  "description": "Additional inference parameters for Zero Shot Image Classification",
@@ -10,7 +10,7 @@ export interface ZeroShotObjectDetectionInput {
10
10
  /**
11
11
  * The input image data as a base64-encoded string.
12
12
  */
13
- inputs: string;
13
+ inputs: Blob;
14
14
  /**
15
15
  * Additional inference parameters for Zero Shot Object Detection
16
16
  */
@@ -7,7 +7,8 @@
7
7
  "properties": {
8
8
  "inputs": {
9
9
  "description": "The input image data as a base64-encoded string.",
10
- "type": "string"
10
+ "type": "string",
11
+ "comment": "type=binary"
11
12
  },
12
13
  "parameters": {
13
14
  "description": "Additional inference parameters for Zero Shot Object Detection",