@huggingface/tasks 0.19.35 → 0.19.37
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/commonjs/local-apps.d.ts +7 -0
- package/dist/commonjs/local-apps.d.ts.map +1 -1
- package/dist/commonjs/local-apps.js +31 -0
- package/dist/commonjs/model-libraries-snippets.d.ts +1 -0
- package/dist/commonjs/model-libraries-snippets.d.ts.map +1 -1
- package/dist/commonjs/model-libraries-snippets.js +12 -2
- package/dist/commonjs/model-libraries.d.ts +15 -1
- package/dist/commonjs/model-libraries.d.ts.map +1 -1
- package/dist/commonjs/model-libraries.js +14 -0
- package/dist/commonjs/tasks/any-to-any/data.js +3 -3
- package/dist/commonjs/tasks/image-segmentation/data.js +2 -2
- package/dist/commonjs/tasks/image-text-to-text/data.d.ts.map +1 -1
- package/dist/commonjs/tasks/image-text-to-text/data.js +10 -38
- package/dist/commonjs/tasks/image-to-3d/data.js +2 -2
- package/dist/commonjs/tasks/image-to-image/data.d.ts.map +1 -1
- package/dist/commonjs/tasks/image-to-image/data.js +13 -25
- package/dist/commonjs/tasks/image-to-text/data.d.ts.map +1 -1
- package/dist/commonjs/tasks/image-to-text/data.js +10 -30
- package/dist/commonjs/tasks/keypoint-detection/data.js +5 -5
- package/dist/commonjs/tasks/object-detection/data.js +2 -2
- package/dist/commonjs/tasks/text-generation/data.d.ts.map +1 -1
- package/dist/commonjs/tasks/text-generation/data.js +14 -10
- package/dist/commonjs/tasks/text-to-image/data.js +6 -6
- package/dist/commonjs/tasks/text-to-speech/data.d.ts.map +1 -1
- package/dist/commonjs/tasks/text-to-speech/data.js +10 -14
- package/dist/commonjs/tasks/text-to-video/data.js +3 -3
- package/dist/commonjs/tasks/visual-document-retrieval/data.d.ts.map +1 -1
- package/dist/commonjs/tasks/visual-document-retrieval/data.js +6 -2
- package/dist/commonjs/tasks/zero-shot-object-detection/data.js +4 -4
- package/dist/esm/local-apps.d.ts +7 -0
- package/dist/esm/local-apps.d.ts.map +1 -1
- package/dist/esm/local-apps.js +31 -0
- package/dist/esm/model-libraries-snippets.d.ts +1 -0
- package/dist/esm/model-libraries-snippets.d.ts.map +1 -1
- package/dist/esm/model-libraries-snippets.js +10 -1
- package/dist/esm/model-libraries.d.ts +15 -1
- package/dist/esm/model-libraries.d.ts.map +1 -1
- package/dist/esm/model-libraries.js +14 -0
- package/dist/esm/tasks/any-to-any/data.js +3 -3
- package/dist/esm/tasks/image-segmentation/data.js +2 -2
- package/dist/esm/tasks/image-text-to-text/data.d.ts.map +1 -1
- package/dist/esm/tasks/image-text-to-text/data.js +10 -38
- package/dist/esm/tasks/image-to-3d/data.js +2 -2
- package/dist/esm/tasks/image-to-image/data.d.ts.map +1 -1
- package/dist/esm/tasks/image-to-image/data.js +13 -25
- package/dist/esm/tasks/image-to-text/data.d.ts.map +1 -1
- package/dist/esm/tasks/image-to-text/data.js +10 -30
- package/dist/esm/tasks/keypoint-detection/data.js +5 -5
- package/dist/esm/tasks/object-detection/data.js +2 -2
- package/dist/esm/tasks/text-generation/data.d.ts.map +1 -1
- package/dist/esm/tasks/text-generation/data.js +14 -10
- package/dist/esm/tasks/text-to-image/data.js +6 -6
- package/dist/esm/tasks/text-to-speech/data.d.ts.map +1 -1
- package/dist/esm/tasks/text-to-speech/data.js +10 -14
- package/dist/esm/tasks/text-to-video/data.js +3 -3
- package/dist/esm/tasks/visual-document-retrieval/data.d.ts.map +1 -1
- package/dist/esm/tasks/visual-document-retrieval/data.js +6 -2
- package/dist/esm/tasks/zero-shot-object-detection/data.js +4 -4
- package/package.json +1 -1
- package/src/local-apps.ts +32 -0
- package/src/model-libraries-snippets.ts +11 -1
- package/src/model-libraries.ts +14 -0
- package/src/tasks/any-to-any/data.ts +3 -3
- package/src/tasks/image-segmentation/data.ts +2 -2
- package/src/tasks/image-text-to-text/data.ts +10 -38
- package/src/tasks/image-to-3d/data.ts +2 -2
- package/src/tasks/image-to-image/data.ts +13 -25
- package/src/tasks/image-to-text/data.ts +10 -30
- package/src/tasks/keypoint-detection/data.ts +5 -5
- package/src/tasks/object-detection/data.ts +2 -2
- package/src/tasks/text-generation/data.ts +14 -10
- package/src/tasks/text-to-image/data.ts +6 -6
- package/src/tasks/text-to-speech/data.ts +10 -14
- package/src/tasks/text-to-video/data.ts +3 -3
- package/src/tasks/visual-document-retrieval/data.ts +7 -2
- package/src/tasks/zero-shot-object-detection/data.ts +4 -4
|
@@ -63,20 +63,20 @@ const taskData: TaskDataCustom = {
|
|
|
63
63
|
models: [
|
|
64
64
|
{ description: "A text-generation model trained to follow instructions.", id: "google/gemma-2-2b-it" },
|
|
65
65
|
{
|
|
66
|
-
description: "
|
|
67
|
-
id: "
|
|
66
|
+
description: "Powerful text generation model for coding.",
|
|
67
|
+
id: "Qwen/Qwen3-Coder-480B-A35B-Instruct",
|
|
68
68
|
},
|
|
69
69
|
{
|
|
70
|
-
description: "
|
|
71
|
-
id: "
|
|
70
|
+
description: "Great text generation model with top-notch tool calling capabilities.",
|
|
71
|
+
id: "openai/gpt-oss-120b",
|
|
72
72
|
},
|
|
73
73
|
{
|
|
74
|
-
description: "Powerful text generation model
|
|
75
|
-
id: "
|
|
74
|
+
description: "Powerful text generation model.",
|
|
75
|
+
id: "zai-org/GLM-4.5",
|
|
76
76
|
},
|
|
77
77
|
{
|
|
78
|
-
description: "A
|
|
79
|
-
id: "
|
|
78
|
+
description: "A powerful small model with reasoning capabilities.",
|
|
79
|
+
id: "Qwen/Qwen3-4B-Thinking-2507",
|
|
80
80
|
},
|
|
81
81
|
{
|
|
82
82
|
description: "Strong conversational model that supports very long instructions.",
|
|
@@ -93,8 +93,12 @@ const taskData: TaskDataCustom = {
|
|
|
93
93
|
],
|
|
94
94
|
spaces: [
|
|
95
95
|
{
|
|
96
|
-
description: "
|
|
97
|
-
id: "
|
|
96
|
+
description: "An application that writes and executes code from text instructions and supports many models.",
|
|
97
|
+
id: "akhaliq/anycoder",
|
|
98
|
+
},
|
|
99
|
+
{
|
|
100
|
+
description: "An application that builds websites from natural language prompts.",
|
|
101
|
+
id: "enzostvs/deepsite",
|
|
98
102
|
},
|
|
99
103
|
{
|
|
100
104
|
description: "A leaderboard for comparing chain-of-thought performance of models.",
|
|
@@ -50,19 +50,19 @@ const taskData: TaskDataCustom = {
|
|
|
50
50
|
models: [
|
|
51
51
|
{
|
|
52
52
|
description: "One of the most powerful image generation models that can generate realistic outputs.",
|
|
53
|
-
id: "black-forest-labs/FLUX.1-dev",
|
|
53
|
+
id: "black-forest-labs/FLUX.1-Krea-dev",
|
|
54
54
|
},
|
|
55
55
|
{
|
|
56
|
-
description: "A powerful
|
|
57
|
-
id: "
|
|
56
|
+
description: "A powerful image generation model.",
|
|
57
|
+
id: "Qwen/Qwen-Image",
|
|
58
58
|
},
|
|
59
59
|
{
|
|
60
|
-
description: "
|
|
61
|
-
id: "
|
|
60
|
+
description: "Powerful and fast image generation model.",
|
|
61
|
+
id: "ByteDance/SDXL-Lightning",
|
|
62
62
|
},
|
|
63
63
|
{
|
|
64
64
|
description: "A powerful text-to-image model.",
|
|
65
|
-
id: "
|
|
65
|
+
id: "ByteDance/Hyper-SD",
|
|
66
66
|
},
|
|
67
67
|
],
|
|
68
68
|
spaces: [
|
|
@@ -39,24 +39,20 @@ const taskData: TaskDataCustom = {
|
|
|
39
39
|
],
|
|
40
40
|
models: [
|
|
41
41
|
{
|
|
42
|
-
description: "
|
|
43
|
-
id: "
|
|
42
|
+
description: "Small yet powerful TTS model.",
|
|
43
|
+
id: "KittenML/kitten-tts-nano-0.1",
|
|
44
44
|
},
|
|
45
45
|
{
|
|
46
|
-
description: "
|
|
47
|
-
id: "
|
|
46
|
+
description: "Bleeding edge TTS model.",
|
|
47
|
+
id: "ResembleAI/chatterbox",
|
|
48
48
|
},
|
|
49
49
|
{
|
|
50
50
|
description: "A massively multi-lingual TTS model.",
|
|
51
51
|
id: "fishaudio/fish-speech-1.5",
|
|
52
52
|
},
|
|
53
53
|
{
|
|
54
|
-
description: "A
|
|
55
|
-
id: "
|
|
56
|
-
},
|
|
57
|
-
{
|
|
58
|
-
description: "Small yet powerful TTS model.",
|
|
59
|
-
id: "hexgrad/Kokoro-82M",
|
|
54
|
+
description: "A text-to-dialogue model.",
|
|
55
|
+
id: "nari-labs/Dia-1.6B-0626",
|
|
60
56
|
},
|
|
61
57
|
],
|
|
62
58
|
spaces: [
|
|
@@ -69,12 +65,12 @@ const taskData: TaskDataCustom = {
|
|
|
69
65
|
id: "fishaudio/fish-speech-1",
|
|
70
66
|
},
|
|
71
67
|
{
|
|
72
|
-
description: "
|
|
73
|
-
id: "
|
|
68
|
+
description: "Performant TTS application.",
|
|
69
|
+
id: "ResembleAI/Chatterbox",
|
|
74
70
|
},
|
|
75
71
|
{
|
|
76
|
-
description: "An application
|
|
77
|
-
id: "
|
|
72
|
+
description: "An application to compare different TTS models.",
|
|
73
|
+
id: "TTS-AGI/TTS-Arena-V2",
|
|
78
74
|
},
|
|
79
75
|
{
|
|
80
76
|
description: "An application that generates podcast episodes.",
|
|
@@ -79,8 +79,8 @@ const taskData: TaskDataCustom = {
|
|
|
79
79
|
id: "nvidia/Cosmos-1.0-Diffusion-7B-Text2World",
|
|
80
80
|
},
|
|
81
81
|
{
|
|
82
|
-
description: "
|
|
83
|
-
id: "
|
|
82
|
+
description: "Very fast model for video generation.",
|
|
83
|
+
id: "Lightricks/LTX-Video-0.9.8-13B-distilled",
|
|
84
84
|
},
|
|
85
85
|
],
|
|
86
86
|
spaces: [
|
|
@@ -99,7 +99,7 @@ const taskData: TaskDataCustom = {
|
|
|
99
99
|
],
|
|
100
100
|
summary:
|
|
101
101
|
"Text-to-video models can be used in any application that requires generating consistent sequence of images from text. ",
|
|
102
|
-
widgetModels: ["Wan-AI/Wan2.
|
|
102
|
+
widgetModels: ["Wan-AI/Wan2.2-TI2V-5B"],
|
|
103
103
|
youtubeId: undefined,
|
|
104
104
|
};
|
|
105
105
|
|
|
@@ -52,8 +52,9 @@ const taskData: TaskDataCustom = {
|
|
|
52
52
|
id: "vidore/colqwen2-v1.0",
|
|
53
53
|
},
|
|
54
54
|
{
|
|
55
|
-
description:
|
|
56
|
-
|
|
55
|
+
description:
|
|
56
|
+
"Very fast and efficient visual document retrieval model that can also take in other modalities like audio.",
|
|
57
|
+
id: "Tevatron/OmniEmbed-v0.1",
|
|
57
58
|
},
|
|
58
59
|
],
|
|
59
60
|
spaces: [
|
|
@@ -61,6 +62,10 @@ const taskData: TaskDataCustom = {
|
|
|
61
62
|
description: "A leaderboard of visual document retrieval models.",
|
|
62
63
|
id: "vidore/vidore-leaderboard",
|
|
63
64
|
},
|
|
65
|
+
{
|
|
66
|
+
description: "Visual retrieval augmented generation demo based on ColQwen2 model.",
|
|
67
|
+
id: "vidore/visual-rag-tool",
|
|
68
|
+
},
|
|
64
69
|
],
|
|
65
70
|
summary:
|
|
66
71
|
"Visual document retrieval is the task of searching for relevant image-based documents, such as PDFs. These models take a text query and multiple documents as input and return the top-most relevant documents and relevancy scores as output.",
|
|
@@ -40,17 +40,17 @@ const taskData: TaskDataCustom = {
|
|
|
40
40
|
models: [
|
|
41
41
|
{
|
|
42
42
|
description: "Solid zero-shot object detection model.",
|
|
43
|
-
id: "
|
|
43
|
+
id: "openmmlab-community/mm_grounding_dino_large_all",
|
|
44
44
|
},
|
|
45
45
|
{
|
|
46
46
|
description: "Cutting-edge zero-shot object detection model.",
|
|
47
|
-
id: "
|
|
47
|
+
id: "fushh7/LLMDet",
|
|
48
48
|
},
|
|
49
49
|
],
|
|
50
50
|
spaces: [
|
|
51
51
|
{
|
|
52
|
-
description: "A demo to
|
|
53
|
-
id: "
|
|
52
|
+
description: "A demo to compare different zero-shot object detection models per output and latency.",
|
|
53
|
+
id: "ariG23498/zero-shot-od",
|
|
54
54
|
},
|
|
55
55
|
{
|
|
56
56
|
description:
|