@huggingface/tasks 0.12.3 → 0.12.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/index.cjs +95 -9
- package/dist/index.js +95 -9
- package/dist/src/hardware.d.ts +25 -0
- package/dist/src/hardware.d.ts.map +1 -1
- package/dist/src/model-data.d.ts +1 -0
- package/dist/src/model-data.d.ts.map +1 -1
- package/dist/src/model-libraries-snippets.d.ts +2 -0
- package/dist/src/model-libraries-snippets.d.ts.map +1 -1
- package/dist/src/model-libraries.d.ts +39 -3
- package/dist/src/model-libraries.d.ts.map +1 -1
- package/dist/src/tasks/keypoint-detection/data.d.ts.map +1 -1
- package/dist/src/tasks/video-text-to-text/data.d.ts +4 -0
- package/dist/src/tasks/video-text-to-text/data.d.ts.map +1 -0
- package/package.json +1 -1
- package/src/hardware.ts +25 -0
- package/src/model-data.ts +1 -0
- package/src/model-libraries-snippets.ts +37 -6
- package/src/model-libraries.ts +37 -1
- package/src/tasks/image-text-to-text/data.ts +1 -1
- package/src/tasks/keypoint-detection/about.md +6 -8
- package/src/tasks/keypoint-detection/data.ts +4 -0
- package/src/tasks/text-to-image/about.md +24 -3
- package/src/tasks/text-to-image/data.ts +1 -1
- package/src/tasks/video-text-to-text/about.md +98 -0
- package/src/tasks/video-text-to-text/data.ts +58 -0
package/dist/index.cjs
CHANGED
@@ -2237,7 +2237,7 @@ var taskData11 = {
       },
       {
         description: "Strong image-text-to-text model.",
-        id: "
+        id: "microsoft/Phi-3.5-vision-instruct"
       }
     ],
     spaces: [
@@ -3147,7 +3147,7 @@ var taskData24 = {
       id: "InstantX/InstantID"
     }
   ],
-  summary: "
+  summary: "Text-to-image is the task of generating images from input text. These pipelines can also be used to modify and edit images based on text prompts.",
   widgetModels: ["black-forest-labs/FLUX.1-dev"],
   youtubeId: ""
 };
@@ -4390,6 +4390,7 @@ function nameWithoutNamespace(modelId) {
   const splitted = modelId.split("/");
   return splitted.length === 1 ? splitted[0] : splitted[1];
 }
+var escapeStringForJson = (str) => JSON.stringify(str);
 var adapters = (model) => [
   `from adapters import AutoAdapterModel
 
@@ -4442,6 +4443,12 @@ result, message = detector.detect_watermark(watermarked_audio, sr)`;
 function get_base_diffusers_model(model) {
   return model.cardData?.base_model?.toString() ?? "fill-in-base-model";
 }
+function get_prompt_from_diffusers_model(model) {
+  const prompt = (model.widgetData?.[0]).text ?? model.cardData?.instance_prompt;
+  if (prompt) {
+    return escapeStringForJson(prompt);
+  }
+}
 var bertopic = (model) => [
   `from bertopic import BERTopic
 
@@ -4495,30 +4502,37 @@ depth = model.infer_image(raw_img) # HxW raw depth map in numpy
 `
 ];
 };
+var diffusersDefaultPrompt = "Astronaut in a jungle, cold color palette, muted colors, detailed, 8k";
 var diffusers_default = (model) => [
   `from diffusers import DiffusionPipeline
 
-
+pipe = DiffusionPipeline.from_pretrained("${model.id}")
+
+prompt = "${get_prompt_from_diffusers_model(model) ?? diffusersDefaultPrompt}"
+image = pipe(prompt).images[0]`
 ];
 var diffusers_controlnet = (model) => [
   `from diffusers import ControlNetModel, StableDiffusionControlNetPipeline
 
 controlnet = ControlNetModel.from_pretrained("${model.id}")
-
+pipe = StableDiffusionControlNetPipeline.from_pretrained(
   "${get_base_diffusers_model(model)}", controlnet=controlnet
 )`
 ];
 var diffusers_lora = (model) => [
   `from diffusers import DiffusionPipeline
 
-
-
+pipe = DiffusionPipeline.from_pretrained("${get_base_diffusers_model(model)}")
+pipe.load_lora_weights("${model.id}")
+
+prompt = "${get_prompt_from_diffusers_model(model) ?? diffusersDefaultPrompt}"
+image = pipe(prompt).images[0]`
 ];
 var diffusers_textual_inversion = (model) => [
   `from diffusers import DiffusionPipeline
 
-
-
+pipe = DiffusionPipeline.from_pretrained("${get_base_diffusers_model(model)}")
+pipe.load_textual_inversion("${model.id}")`
 ];
 var diffusers = (model) => {
   if (model.tags.includes("controlnet")) {
@@ -5158,6 +5172,11 @@ IWorker engine = WorkerFactory.CreateWorker(BackendType.GPUCompute, model);
 // Please see provided C# file for more details
 `
 ];
+var vfimamba = (model) => [
+  `from Trainer_finetune import Model
+
+model = Model.from_pretrained("${model.id}")`
+];
 var voicecraft = (model) => [
   `from voicecraft import VoiceCraft
 
@@ -5268,6 +5287,12 @@ whisperkit-cli transcribe --audio-path /path/to/audio.mp3
 # Or use your preferred model variant
 whisperkit-cli transcribe --model "large-v3" --model-prefix "distil" --audio-path /path/to/audio.mp3 --verbose`
 ];
+var threedtopia_xl = (model) => [
+  `from threedtopia_xl.models import threedtopia_xl
+
+model = threedtopia_xl.from_pretrained("${model.id}")
+model.generate(cond="path/to/image.png")`
+];
 
 // src/model-libraries.ts
 var MODEL_LIBRARIES_UI_ELEMENTS = {
@@ -5671,7 +5696,7 @@ var MODEL_LIBRARIES_UI_ELEMENTS = {
     repoName: "pythae",
     repoUrl: "https://github.com/clementchadebec/benchmark_VAE",
    snippets: pythae,
-    filter:
+    filter: false
   },
   recurrentgemma: {
     prettyLabel: "RecurrentGemma",
@@ -5719,6 +5744,13 @@ var MODEL_LIBRARIES_UI_ELEMENTS = {
     filter: true,
     countDownloads: `path:"cfg.json"`
   },
+  sapiens: {
+    prettyLabel: "sapiens",
+    repoName: "sapiens",
+    repoUrl: "https://github.com/facebookresearch/sapiens",
+    filter: false,
+    countDownloads: `path_extension:"pt2" OR path_extension:"pth" OR path_extension:"onnx"`
+  },
   "sentence-transformers": {
     prettyLabel: "sentence-transformers",
     repoName: "sentence-transformers",
@@ -5769,6 +5801,13 @@ var MODEL_LIBRARIES_UI_ELEMENTS = {
     filter: true,
     countDownloads: `path:"hyperparams.yaml"`
   },
+  "ssr-speech": {
+    prettyLabel: "SSR-Speech",
+    repoName: "SSR-Speech",
+    repoUrl: "https://github.com/WangHelin1997/SSR-Speech",
+    filter: false,
+    countDownloads: `path_extension:".pth"`
+  },
   "stable-audio-tools": {
     prettyLabel: "Stable Audio Tools",
     repoName: "stable-audio-tools",
@@ -5792,6 +5831,13 @@ var MODEL_LIBRARIES_UI_ELEMENTS = {
     countDownloads: `path:"cvlm_llama2_tokenizer/tokenizer.model"`,
     snippets: seed_story
   },
+  soloaudio: {
+    prettyLabel: "SoloAudio",
+    repoName: "SoloAudio",
+    repoUrl: "https://github.com/WangHelin1997/SoloAudio",
+    filter: false,
+    countDownloads: `path:"soloaudio_v2.pt"`
+  },
   "stable-baselines3": {
     prettyLabel: "stable-baselines3",
     repoName: "stable-baselines3",
@@ -5863,6 +5909,13 @@ var MODEL_LIBRARIES_UI_ELEMENTS = {
     filter: true,
     countDownloads: `path_extension:"sentis"`
   },
+  "vfi-mamba": {
+    prettyLabel: "VFIMamba",
+    repoName: "VFIMamba",
+    repoUrl: "https://github.com/MCG-NJU/VFIMamba",
+    countDownloads: `path_extension:"pkl"`,
+    snippets: vfimamba
+  },
   voicecraft: {
     prettyLabel: "VoiceCraft",
     repoName: "VoiceCraft",
@@ -5884,6 +5937,14 @@ var MODEL_LIBRARIES_UI_ELEMENTS = {
     docsUrl: "https://github.com/argmaxinc/WhisperKit?tab=readme-ov-file#homebrew",
     snippets: whisperkit,
     countDownloads: `path_filename:"model" AND path_extension:"mil" AND _exists_:"path_prefix"`
+  },
+  "3dtopia-xl": {
+    prettyLabel: "3DTopia-XL",
+    repoName: "3DTopia-XL",
+    repoUrl: "https://github.com/3DTopia/3DTopia-XL",
+    filter: false,
+    countDownloads: `path:"model_vae_fp16.pt"`,
+    snippets: threedtopia_xl
   }
 };
 var ALL_MODEL_LIBRARY_KEYS = Object.keys(MODEL_LIBRARIES_UI_ELEMENTS);
@@ -6568,6 +6629,14 @@ var SKUS = {
       tflops: 14.93,
       memory: [8]
     },
+    "RTX 2070 SUPER Mobile": {
+      tflops: 14.13,
+      memory: [8]
+    },
+    "RTX 2070 SUPER": {
+      tflops: 18.12,
+      memory: [8]
+    },
     "RTX 3050 Mobile": {
       tflops: 7.639,
       memory: [6]
@@ -6670,6 +6739,23 @@ var SKUS = {
       tflops: 26.11,
       memory: [16]
     }
+  },
+  QUALCOMM: {
+    "Snapdragon X Elite X1E-00-1DE": {
+      tflops: 4.6
+    },
+    "Snapdragon X Elite X1E-84-100": {
+      tflops: 4.6
+    },
+    "Snapdragon X Elite X1E-80-100": {
+      tflops: 3.8
+    },
+    "Snapdragon X Elite X1E-78-100": {
+      tflops: 3.8
+    },
+    "Snapdragon X Plus X1P-64-100": {
+      tflops: 3.8
+    }
   }
 },
 CPU: {
package/dist/index.js
CHANGED
@@ -2199,7 +2199,7 @@ var taskData11 = {
       },
       {
         description: "Strong image-text-to-text model.",
-        id: "
+        id: "microsoft/Phi-3.5-vision-instruct"
       }
     ],
     spaces: [
@@ -3109,7 +3109,7 @@ var taskData24 = {
      id: "InstantX/InstantID"
     }
   ],
-  summary: "
+  summary: "Text-to-image is the task of generating images from input text. These pipelines can also be used to modify and edit images based on text prompts.",
   widgetModels: ["black-forest-labs/FLUX.1-dev"],
   youtubeId: ""
 };
@@ -4352,6 +4352,7 @@ function nameWithoutNamespace(modelId) {
   const splitted = modelId.split("/");
   return splitted.length === 1 ? splitted[0] : splitted[1];
 }
+var escapeStringForJson = (str) => JSON.stringify(str);
 var adapters = (model) => [
   `from adapters import AutoAdapterModel
 
@@ -4404,6 +4405,12 @@ result, message = detector.detect_watermark(watermarked_audio, sr)`;
 function get_base_diffusers_model(model) {
   return model.cardData?.base_model?.toString() ?? "fill-in-base-model";
 }
+function get_prompt_from_diffusers_model(model) {
+  const prompt = (model.widgetData?.[0]).text ?? model.cardData?.instance_prompt;
+  if (prompt) {
+    return escapeStringForJson(prompt);
+  }
+}
 var bertopic = (model) => [
   `from bertopic import BERTopic
 
@@ -4457,30 +4464,37 @@ depth = model.infer_image(raw_img) # HxW raw depth map in numpy
 `
 ];
 };
+var diffusersDefaultPrompt = "Astronaut in a jungle, cold color palette, muted colors, detailed, 8k";
 var diffusers_default = (model) => [
   `from diffusers import DiffusionPipeline
 
-
+pipe = DiffusionPipeline.from_pretrained("${model.id}")
+
+prompt = "${get_prompt_from_diffusers_model(model) ?? diffusersDefaultPrompt}"
+image = pipe(prompt).images[0]`
 ];
 var diffusers_controlnet = (model) => [
   `from diffusers import ControlNetModel, StableDiffusionControlNetPipeline
 
 controlnet = ControlNetModel.from_pretrained("${model.id}")
-
+pipe = StableDiffusionControlNetPipeline.from_pretrained(
   "${get_base_diffusers_model(model)}", controlnet=controlnet
 )`
 ];
 var diffusers_lora = (model) => [
   `from diffusers import DiffusionPipeline
 
-
-
+pipe = DiffusionPipeline.from_pretrained("${get_base_diffusers_model(model)}")
+pipe.load_lora_weights("${model.id}")
+
+prompt = "${get_prompt_from_diffusers_model(model) ?? diffusersDefaultPrompt}"
+image = pipe(prompt).images[0]`
 ];
 var diffusers_textual_inversion = (model) => [
   `from diffusers import DiffusionPipeline
 
-
-
+pipe = DiffusionPipeline.from_pretrained("${get_base_diffusers_model(model)}")
+pipe.load_textual_inversion("${model.id}")`
 ];
 var diffusers = (model) => {
   if (model.tags.includes("controlnet")) {
@@ -5120,6 +5134,11 @@ IWorker engine = WorkerFactory.CreateWorker(BackendType.GPUCompute, model);
 // Please see provided C# file for more details
 `
 ];
+var vfimamba = (model) => [
+  `from Trainer_finetune import Model
+
+model = Model.from_pretrained("${model.id}")`
+];
 var voicecraft = (model) => [
   `from voicecraft import VoiceCraft
 
@@ -5230,6 +5249,12 @@ whisperkit-cli transcribe --audio-path /path/to/audio.mp3
 # Or use your preferred model variant
 whisperkit-cli transcribe --model "large-v3" --model-prefix "distil" --audio-path /path/to/audio.mp3 --verbose`
 ];
+var threedtopia_xl = (model) => [
+  `from threedtopia_xl.models import threedtopia_xl
+
+model = threedtopia_xl.from_pretrained("${model.id}")
+model.generate(cond="path/to/image.png")`
+];
 
 // src/model-libraries.ts
 var MODEL_LIBRARIES_UI_ELEMENTS = {
@@ -5633,7 +5658,7 @@ var MODEL_LIBRARIES_UI_ELEMENTS = {
     repoName: "pythae",
     repoUrl: "https://github.com/clementchadebec/benchmark_VAE",
     snippets: pythae,
-    filter:
+    filter: false
   },
   recurrentgemma: {
     prettyLabel: "RecurrentGemma",
@@ -5681,6 +5706,13 @@ var MODEL_LIBRARIES_UI_ELEMENTS = {
     filter: true,
     countDownloads: `path:"cfg.json"`
   },
+  sapiens: {
+    prettyLabel: "sapiens",
+    repoName: "sapiens",
+    repoUrl: "https://github.com/facebookresearch/sapiens",
+    filter: false,
+    countDownloads: `path_extension:"pt2" OR path_extension:"pth" OR path_extension:"onnx"`
+  },
   "sentence-transformers": {
     prettyLabel: "sentence-transformers",
     repoName: "sentence-transformers",
@@ -5731,6 +5763,13 @@ var MODEL_LIBRARIES_UI_ELEMENTS = {
     filter: true,
     countDownloads: `path:"hyperparams.yaml"`
   },
+  "ssr-speech": {
+    prettyLabel: "SSR-Speech",
+    repoName: "SSR-Speech",
+    repoUrl: "https://github.com/WangHelin1997/SSR-Speech",
+    filter: false,
+    countDownloads: `path_extension:".pth"`
+  },
   "stable-audio-tools": {
     prettyLabel: "Stable Audio Tools",
     repoName: "stable-audio-tools",
@@ -5754,6 +5793,13 @@ var MODEL_LIBRARIES_UI_ELEMENTS = {
     countDownloads: `path:"cvlm_llama2_tokenizer/tokenizer.model"`,
     snippets: seed_story
   },
+  soloaudio: {
+    prettyLabel: "SoloAudio",
+    repoName: "SoloAudio",
+    repoUrl: "https://github.com/WangHelin1997/SoloAudio",
+    filter: false,
+    countDownloads: `path:"soloaudio_v2.pt"`
+  },
   "stable-baselines3": {
     prettyLabel: "stable-baselines3",
     repoName: "stable-baselines3",
@@ -5825,6 +5871,13 @@ var MODEL_LIBRARIES_UI_ELEMENTS = {
     filter: true,
     countDownloads: `path_extension:"sentis"`
   },
+  "vfi-mamba": {
+    prettyLabel: "VFIMamba",
+    repoName: "VFIMamba",
+    repoUrl: "https://github.com/MCG-NJU/VFIMamba",
+    countDownloads: `path_extension:"pkl"`,
+    snippets: vfimamba
+  },
   voicecraft: {
     prettyLabel: "VoiceCraft",
     repoName: "VoiceCraft",
@@ -5846,6 +5899,14 @@ var MODEL_LIBRARIES_UI_ELEMENTS = {
     docsUrl: "https://github.com/argmaxinc/WhisperKit?tab=readme-ov-file#homebrew",
     snippets: whisperkit,
     countDownloads: `path_filename:"model" AND path_extension:"mil" AND _exists_:"path_prefix"`
+  },
+  "3dtopia-xl": {
+    prettyLabel: "3DTopia-XL",
+    repoName: "3DTopia-XL",
+    repoUrl: "https://github.com/3DTopia/3DTopia-XL",
+    filter: false,
+    countDownloads: `path:"model_vae_fp16.pt"`,
+    snippets: threedtopia_xl
   }
 };
 var ALL_MODEL_LIBRARY_KEYS = Object.keys(MODEL_LIBRARIES_UI_ELEMENTS);
@@ -6530,6 +6591,14 @@ var SKUS = {
       tflops: 14.93,
       memory: [8]
     },
+    "RTX 2070 SUPER Mobile": {
+      tflops: 14.13,
+      memory: [8]
+    },
+    "RTX 2070 SUPER": {
+      tflops: 18.12,
+      memory: [8]
+    },
     "RTX 3050 Mobile": {
       tflops: 7.639,
       memory: [6]
@@ -6632,6 +6701,23 @@ var SKUS = {
      tflops: 26.11,
       memory: [16]
     }
+  },
+  QUALCOMM: {
+    "Snapdragon X Elite X1E-00-1DE": {
+      tflops: 4.6
+    },
+    "Snapdragon X Elite X1E-84-100": {
+      tflops: 4.6
+    },
+    "Snapdragon X Elite X1E-80-100": {
+      tflops: 3.8
+    },
+    "Snapdragon X Elite X1E-78-100": {
+      tflops: 3.8
+    },
+    "Snapdragon X Plus X1P-64-100": {
+      tflops: 3.8
+    }
   }
 },
 CPU: {
package/dist/src/hardware.d.ts
CHANGED
@@ -172,6 +172,14 @@ export declare const SKUS: {
       tflops: number;
       memory: number[];
     };
+    "RTX 2070 SUPER Mobile": {
+      tflops: number;
+      memory: number[];
+    };
+    "RTX 2070 SUPER": {
+      tflops: number;
+      memory: number[];
+    };
     "RTX 3050 Mobile": {
       tflops: number;
       memory: number[];
@@ -271,6 +279,23 @@ export declare const SKUS: {
     memory: number[];
   };
 };
+QUALCOMM: {
+  "Snapdragon X Elite X1E-00-1DE": {
+    tflops: number;
+  };
+  "Snapdragon X Elite X1E-84-100": {
+    tflops: number;
+  };
+  "Snapdragon X Elite X1E-80-100": {
+    tflops: number;
+  };
+  "Snapdragon X Elite X1E-78-100": {
+    tflops: number;
+  };
+  "Snapdragon X Plus X1P-64-100": {
+    tflops: number;
+  };
+};
 };
 CPU: {
   Intel: {
package/dist/src/hardware.d.ts.map
CHANGED
@@ -1 +1 @@
-
{"version":3,"file":"hardware.d.ts","sourceRoot":"","sources":["../../src/hardware.ts"],"names":[],"mappings":"AAAA;;;GAGG;AACH,eAAO,MAAM,iDAAiD,QAAW,CAAC;AAC1E,eAAO,MAAM,yDAAyD,QAAW,CAAC;AAClF,eAAO,MAAM,oCAAoC,QAAU,CAAC;AAE5D;;;GAGG;AACH,eAAO,MAAM,+CAA+C,QAAW,CAAC;AAExE,MAAM,WAAW,YAAY;IAC5B;;;;;;;;;OASG;IACH,MAAM,EAAE,MAAM,CAAC;IACf;;;OAGG;IACH,MAAM,CAAC,EAAE,MAAM,EAAE,CAAC;CAClB;AAED,eAAO,MAAM,sBAAsB,UAAqD,CAAC;AAEzF,eAAO,MAAM,IAAI
+
{"version":3,"file":"hardware.d.ts","sourceRoot":"","sources":["../../src/hardware.ts"],"names":[],"mappings":"AAAA;;;GAGG;AACH,eAAO,MAAM,iDAAiD,QAAW,CAAC;AAC1E,eAAO,MAAM,yDAAyD,QAAW,CAAC;AAClF,eAAO,MAAM,oCAAoC,QAAU,CAAC;AAE5D;;;GAGG;AACH,eAAO,MAAM,+CAA+C,QAAW,CAAC;AAExE,MAAM,WAAW,YAAY;IAC5B;;;;;;;;;OASG;IACH,MAAM,EAAE,MAAM,CAAC;IACf;;;OAGG;IACH,MAAM,CAAC,EAAE,MAAM,EAAE,CAAC;CAClB;AAED,eAAO,MAAM,sBAAsB,UAAqD,CAAC;AAEzF,eAAO,MAAM,IAAI;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CAwauD,CAAC;AAEzE,MAAM,MAAM,OAAO,GAAG,MAAM,OAAO,IAAI,CAAC"}
package/dist/src/model-data.d.ts.map
CHANGED
@@ -1 +1 @@
-
{"version":3,"file":"model-data.d.ts","sourceRoot":"","sources":["../../src/model-data.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,YAAY,EAAE,MAAM,aAAa,CAAC;AAChD,OAAO,KAAK,EAAE,aAAa,EAAE,MAAM,kBAAkB,CAAC;AACtD,OAAO,KAAK,EAAE,eAAe,EAAE,MAAM,kBAAkB,CAAC;AAExD;;GAEG;AACH,MAAM,WAAW,SAAS;IACzB;;OAEG;IACH,EAAE,EAAE,MAAM,CAAC;IACX;;;OAGG;IACH,SAAS,EAAE,MAAM,CAAC;IAClB;;OAEG;IACH,OAAO,CAAC,EAAE,OAAO,CAAC;IAClB;;OAEG;IACH,MAAM,CAAC,EAAE;QACR,aAAa,CAAC,EAAE,MAAM,EAAE,CAAC;QACzB;;WAEG;QACH,QAAQ,CAAC,EAAE;YACV;;eAEG;YACH,CAAC,CAAC,EAAE,MAAM,GAAG,MAAM,CAAC;SACpB,CAAC;QACF,UAAU,CAAC,EAAE,MAAM,CAAC;QACpB,mBAAmB,CAAC,EAAE;YACrB,IAAI,CAAC,EAAE,MAAM,CAAC;YACd,YAAY,CAAC,EAAE,OAAO,CAAC;YACvB,YAAY,CAAC,EAAE,OAAO,CAAC;YACvB;;eAEG;YACH,YAAY,CAAC,EAAE,MAAM,CAAC;SACtB,CAAC;QACF,gBAAgB,CAAC,EAAE,eAAe,CAAC;QACnC,oBAAoB,CAAC,EAAE;YACtB,UAAU,CAAC,EAAE,MAAM,CAAC;YACpB,WAAW,CAAC,EAAE,MAAM,CAAC;SACrB,CAAC;QACF,SAAS,CAAC,EAAE;YACX,WAAW,CAAC,EAAE,MAAM,CAAC;SACrB,CAAC;QACF,OAAO,CAAC,EAAE;YACT,KAAK,CAAC,EAAE;gBACP,IAAI,CAAC,EAAE,MAAM,CAAC;aACd,CAAC;YACF,YAAY,CAAC,EAAE,MAAM,CAAC;SACtB,CAAC;QACF,WAAW,CAAC,EAAE;YACb,qBAAqB,CAAC,EAAE,MAAM,CAAC;YAC/B,iBAAiB,CAAC,EAAE,MAAM,CAAC;YAC3B,gBAAgB,CAAC,EAAE,MAAM,CAAC;SAC1B,CAAC;QACF,IAAI,CAAC,EAAE;YACN,uBAAuB,CAAC,EAAE,MAAM,CAAC;YACjC,SAAS,CAAC,EAAE,MAAM,CAAC;SACnB,CAAC;KACF,CAAC;IACF;;OAEG;IACH,IAAI,EAAE,MAAM,EAAE,CAAC;IACf;;OAEG;IACH,gBAAgB,CAAC,EAAE,gBAAgB,CAAC;IACpC;;OAEG;IACH,YAAY,CAAC,EAAE,YAAY,GAAG,SAAS,CAAC;IACxC;;OAEG;IACH,UAAU,CAAC,EAAE,MAAM,GAAG,SAAS,CAAC;IAChC;;;;;OAKG;IACH,UAAU,CAAC,EAAE,aAAa,EAAE,GAAG,SAAS,CAAC;IACzC;;;;;;;;;OASG;IACH,QAAQ,CAAC,EAAE;QACV,SAAS,CAAC,EACP,OAAO,GACP;YACA,UAAU,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;SACpC,CAAC;QACL,UAAU,CAAC,EAAE,MAAM,GAAG,MAAM,EAAE,CAAC;
+
{"version":3,"file":"model-data.d.ts","sourceRoot":"","sources":["../../src/model-data.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,YAAY,EAAE,MAAM,aAAa,CAAC;AAChD,OAAO,KAAK,EAAE,aAAa,EAAE,MAAM,kBAAkB,CAAC;AACtD,OAAO,KAAK,EAAE,eAAe,EAAE,MAAM,kBAAkB,CAAC;AAExD;;GAEG;AACH,MAAM,WAAW,SAAS;IACzB;;OAEG;IACH,EAAE,EAAE,MAAM,CAAC;IACX;;;OAGG;IACH,SAAS,EAAE,MAAM,CAAC;IAClB;;OAEG;IACH,OAAO,CAAC,EAAE,OAAO,CAAC;IAClB;;OAEG;IACH,MAAM,CAAC,EAAE;QACR,aAAa,CAAC,EAAE,MAAM,EAAE,CAAC;QACzB;;WAEG;QACH,QAAQ,CAAC,EAAE;YACV;;eAEG;YACH,CAAC,CAAC,EAAE,MAAM,GAAG,MAAM,CAAC;SACpB,CAAC;QACF,UAAU,CAAC,EAAE,MAAM,CAAC;QACpB,mBAAmB,CAAC,EAAE;YACrB,IAAI,CAAC,EAAE,MAAM,CAAC;YACd,YAAY,CAAC,EAAE,OAAO,CAAC;YACvB,YAAY,CAAC,EAAE,OAAO,CAAC;YACvB;;eAEG;YACH,YAAY,CAAC,EAAE,MAAM,CAAC;SACtB,CAAC;QACF,gBAAgB,CAAC,EAAE,eAAe,CAAC;QACnC,oBAAoB,CAAC,EAAE;YACtB,UAAU,CAAC,EAAE,MAAM,CAAC;YACpB,WAAW,CAAC,EAAE,MAAM,CAAC;SACrB,CAAC;QACF,SAAS,CAAC,EAAE;YACX,WAAW,CAAC,EAAE,MAAM,CAAC;SACrB,CAAC;QACF,OAAO,CAAC,EAAE;YACT,KAAK,CAAC,EAAE;gBACP,IAAI,CAAC,EAAE,MAAM,CAAC;aACd,CAAC;YACF,YAAY,CAAC,EAAE,MAAM,CAAC;SACtB,CAAC;QACF,WAAW,CAAC,EAAE;YACb,qBAAqB,CAAC,EAAE,MAAM,CAAC;YAC/B,iBAAiB,CAAC,EAAE,MAAM,CAAC;YAC3B,gBAAgB,CAAC,EAAE,MAAM,CAAC;SAC1B,CAAC;QACF,IAAI,CAAC,EAAE;YACN,uBAAuB,CAAC,EAAE,MAAM,CAAC;YACjC,SAAS,CAAC,EAAE,MAAM,CAAC;SACnB,CAAC;KACF,CAAC;IACF;;OAEG;IACH,IAAI,EAAE,MAAM,EAAE,CAAC;IACf;;OAEG;IACH,gBAAgB,CAAC,EAAE,gBAAgB,CAAC;IACpC;;OAEG;IACH,YAAY,CAAC,EAAE,YAAY,GAAG,SAAS,CAAC;IACxC;;OAEG;IACH,UAAU,CAAC,EAAE,MAAM,GAAG,SAAS,CAAC;IAChC;;;;;OAKG;IACH,UAAU,CAAC,EAAE,aAAa,EAAE,GAAG,SAAS,CAAC;IACzC;;;;;;;;;OASG;IACH,QAAQ,CAAC,EAAE;QACV,SAAS,CAAC,EACP,OAAO,GACP;YACA,UAAU,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;SACpC,CAAC;QACL,UAAU,CAAC,EAAE,MAAM,GAAG,MAAM,EAAE,CAAC;QAC/B,eAAe,CAAC,EAAE,MAAM,CAAC;KACzB,CAAC;IACF;;;OAGG;IACH,YAAY,CAAC,EAAE,MAAM,CAAC;IACtB,WAAW,CAAC,EAAE;QACb,UAAU,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;QACnC,KAAK,EAAE,MAAM,CAAC;QACd,OAAO,EAAE,OAAO,CAAC;KACjB,CAAC;IACF,IAAI,CAAC,EAAE;QACN,KAAK,EAAE,MAAM,CAAC;QACd,YAAY,CAAC,EAAE,MAAM,CAAC;QACtB,cAAc,CAAC,EAAE,MAAM,CAAC;KACxB,CAAC;CACF;AAED;;GAEG;AACH,MAAM,WAAW,gBAAgB;IAChC;;OAEG;IACH,UAAU,EAAE,MAAM,CAAC;IACnB;;OAEG;IACH,YAAY,CAAC,EAAE,MAAM,CAAC;IACtB;;OAEG;IACH,YAAY,CAAC,EAAE,YAAY,CAAC;IAC5B;;OAEG;IACH,SAAS,CAAC,EAAE,MAAM,CAAC;CACnB"}
package/dist/src/model-libraries-snippets.d.ts
CHANGED
@@ -51,6 +51,7 @@ export declare const fasttext: (model: ModelData) => string[];
 export declare const stableBaselines3: (model: ModelData) => string[];
 export declare const mlAgents: (model: ModelData) => string[];
 export declare const sentis: () => string[];
+export declare const vfimamba: (model: ModelData) => string[];
 export declare const voicecraft: (model: ModelData) => string[];
 export declare const chattts: () => string[];
 export declare const yolov10: (model: ModelData) => string[];
@@ -61,4 +62,5 @@ export declare const nemo: (model: ModelData) => string[];
 export declare const pythae: (model: ModelData) => string[];
 export declare const audiocraft: (model: ModelData) => string[];
 export declare const whisperkit: () => string[];
+export declare const threedtopia_xl: (model: ModelData) => string[];
 //# sourceMappingURL=model-libraries-snippets.d.ts.map
package/dist/src/model-libraries-snippets.d.ts.map
CHANGED
@@ -1 +1 @@
-
{"version":3,"file":"model-libraries-snippets.d.ts","sourceRoot":"","sources":["../../src/model-libraries-snippets.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,SAAS,EAAE,MAAM,cAAc,CAAC;
+
{"version":3,"file":"model-libraries-snippets.d.ts","sourceRoot":"","sources":["../../src/model-libraries-snippets.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,SAAS,EAAE,MAAM,cAAc,CAAC;AAe9C,eAAO,MAAM,QAAQ,UAAW,SAAS,KAAG,MAAM,EAKjD,CAAC;AAkBF,eAAO,MAAM,QAAQ,UAAW,SAAS,KAAG,MAAM,EAKjD,CAAC;AAEF,eAAO,MAAM,QAAQ,UAAW,SAAS,KAAG,MAAM,EAIjD,CAAC;AAEF,eAAO,MAAM,SAAS,UAAW,SAAS,KAAG,MAAM,EAkBlD,CAAC;AAaF,eAAO,MAAM,QAAQ,UAAW,SAAS,KAAG,MAAM,EAIjD,CAAC;AAEF,eAAO,MAAM,KAAK,UAAW,SAAS,KAAG,MAAM,EAI9C,CAAC;AAEF,eAAO,MAAM,iBAAiB,UAAW,SAAS,KAAG,MAAM,EA6C1D,CAAC;AAuCF,eAAO,MAAM,SAAS,UAAW,SAAS,KAAG,MAAM,EAUlD,CAAC;AAEF,eAAO,MAAM,YAAY,UAAW,SAAS,KAAG,MAAM,EAwCrD,CAAC;AAEF,eAAO,MAAM,gBAAgB,UAAW,SAAS,KAAG,MAAM,EAgBzD,CAAC;AAEF,eAAO,MAAM,YAAY,UAAW,SAAS,KAAG,MAAM,EAmBrD,CAAC;AAEF,eAAO,MAAM,MAAM,UAAW,SAAS,KAAG,MAAM,EAgB/C,CAAC;AAEF,eAAO,MAAM,SAAS,UAAW,SAAS,KAAG,MAAM,EAMlD,CAAC;AAEF,eAAO,MAAM,SAAS,UAAW,SAAS,KAAG,MAAM,EASlD,CAAC;AAIF,eAAO,MAAM,MAAM,UAAW,SAAS,KAAG,MAAM,EAO/C,CAAC;AAEF,eAAO,MAAM,OAAO,UAAW,SAAS,KAAG,MAAM,EAMhD,CAAC;AAEF,eAAO,MAAM,KAAK,UAAW,SAAS,KAAG,MAAM,EAI9C,CAAC;AAEF,eAAO,MAAM,MAAM,UAAW,SAAS,KAAG,MAAM,EAI/C,CAAC;AAEF,eAAO,MAAM,KAAK,UAAW,SAAS,KAAG,MAAM,EAS9C,CAAC;AAEF,eAAO,MAAM,SAAS,UAAW,SAAS,KAAG,MAAM,EAUlD,CAAC;AAEF,eAAO,MAAM,gBAAgB,UAAW,SAAS,KAAG,MAAM,EAgBzD,CAAC;AAEF,eAAO,MAAM,QAAQ,UAAW,SAAS,KAAG,MAAM,EAOjD,CAAC;AAEF,eAAO,MAAM,SAAS,UAAW,SAAS,KAAG,MAAM,EAIlD,CAAC;AAEF,eAAO,MAAM,SAAS,UAAW,SAAS,KAAG,MAAM,EAKlD,CAAC;AAEF,eAAO,MAAM,aAAa,QAAO,MAAM,EAQtC,CAAC;AAEF,eAAO,MAAM,SAAS,UAAW,SAAS,KAAG,MAAM,EAKlD,CAAC;AAEF,eAAO,MAAM,SAAS,UAAW,SAAS,KAAG,MAAM,EAsBlD,CAAC;AAEF,eAAO,MAAM,uBAAuB,UAAW,SAAS,KAAG,MAAM,EAehE,CAAC;AAiBF,eAAO,MAAM,cAAc,UAAW,SAAS,KAAG,MAAM,EAKvD,CAAC;AAEF,eAAO,MAAM,KAAK,UAAW,SAAS,KAAG,MAAM,EAI9C,CAAC;AAyBF,eAAO,MAAM,aAAa,UAAW,SAAS,KAAG,MAAM,EAOtD,CAAC;AAEF,eAAO,MAAM,IAAI,UAAW,SAAS,KAAG,MAAM,EAI7C,CAAC;AAEF,eAAO,MAAM,OAAO,QAA6B,MAAM,EAQtD,CAAC;AAEF,eAAO,MAAM,UAAU,QAAO,MAAM,EAanC,CAAC;AAsCF,eAAO,MAAM,OAAO,UAAW,SAAS,KAAG,MAAM,EAehD,CAAC;AAEF,eAAO,MAAM,kBAAkB,UAAW,SAAS,KAAG,MAAM,EAmC3D,CAAC;AAEF,eAAO,MAAM,MAAM,UAAW,SAAS,KAAG,MAAM,EAI/C,CAAC;AAEF,eAAO,MAAM,IAAI,UAAW,SAAS,KAAG,MAAM,EA2B7C,CAAC;AAEF,eAAO,MAAM,aAAa,UAAW,SAAS,KAAG,MAAM,EAEtD,CAAC;AAEF,eAAO,MAAM,oBAAoB,UAAW,SAAS,KAAG,MAAM,EAI7D,CAAC;AAEF,eAAO,MAAM,MAAM,UAAW,SAAS,KAAG,MAAM,EAI/C,CAAC;AAEF,eAAO,MAAM,KAAK,UAAW,SAAS,KAAG,MAAM,EAU9C,CAAC;AAEF,eAAO,MAAM,WAAW,UAAW,SAAS,KAAG,MAAM,EAIpD,CAAC;AAEF,eAAO,MAAM,MAAM,UAAW,SAAS,KAAG,MAAM,EAK/C,CAAC;AAkBF,eAAO,MAAM,WAAW,UAAW,SAAS,KAAG,MAAM,EAkBpD,CAAC;AAEF,eAAO,MAAM,YAAY,UAAW,SAAS,KAAG,MAAM,EA4CrD,CAAC;AAEF,eAAO,MAAM,cAAc,UAAW,SAAS,KAAG,MAAM,EAcvD,CAAC;AAiBF,eAAO,MAAM,IAAI,UAAW,SAAS,KAAG,MAAM,EAkB7C,CAAC;AAEF,eAAO,MAAM,QAAQ,UAAW,SAAS,KAAG,MAAM,EAKjD,CAAC;AAEF,eAAO,MAAM,gBAAgB,UAAW,SAAS,KAAG,MAAM,EAMzD,CAAC;AAgBF,eAAO,MAAM,QAAQ,UAAW,SAAS,KAAG,MAAM,EAEjD,CAAC;AAEF,eAAO,MAAM,MAAM,QAA6B,MAAM,EAMrD,CAAC;AAEF,eAAO,MAAM,QAAQ,UAAW,SAAS,KAAG,MAAM,EAIjD,CAAC;AAEF,eAAO,MAAM,UAAU,UAAW,SAAS,KAAG,MAAM,EAInD,CAAC;AAEF,eAAO,MAAM,OAAO,QAAO,MAAM,EAYhC,CAAC;AAEF,eAAO,MAAM,OAAO,UAAW,SAAS,KAAG,MAAM,EAOhD,CAAC;AAEF,eAAO,MAAM,QAAQ,UAAW,SAAS,KAAG,MAAM,EAYjD,CAAC;AAEF,eAAO,MAAM,GAAG,UAAW,SAAS,KAAG,MAAM,EAK5C,CAAC;AAEF,eAAO,MAAM,KAAK,UAAW,SAAS,KAAG,MAAM,EAI9C,CAAC;AAEF,eAAO,MAAM,IAAI,UAAW,SAAS,KAAG,MAAM,EAQ7C,CAAC;AAEF,eAAO,MAAM,MAAM,UAAW,SAAS,KAAG,MAAM,EAI/C,CAAC;AA6BF,eAAO,MAAM,UAAU,UAAW,SAAS,KAAG,MAAM,EAUnD,CAAC;AAEF,eAAO,MAAM,UAAU,QAAO,MAAM,EAYnC,CAAC;AAEF,eAAO,MAAM,cAAc,UAAW,SAAS,KAAG,MAAM,EAKvD,CAAC"}
package/dist/src/model-libraries.d.ts
CHANGED
@@ -452,7 +452,7 @@ export declare const MODEL_LIBRARIES_UI_ELEMENTS: {
     repoName: string;
     repoUrl: string;
     snippets: (model: ModelData) => string[];
-    filter:
+    filter: false;
   };
   recurrentgemma: {
     prettyLabel: string;
@@ -500,6 +500,13 @@ export declare const MODEL_LIBRARIES_UI_ELEMENTS: {
     filter: true;
     countDownloads: string;
   };
+  sapiens: {
+    prettyLabel: string;
+    repoName: string;
+    repoUrl: string;
+    filter: false;
+    countDownloads: string;
+  };
   "sentence-transformers": {
     prettyLabel: string;
     repoName: string;
@@ -550,6 +557,13 @@ export declare const MODEL_LIBRARIES_UI_ELEMENTS: {
     filter: true;
     countDownloads: string;
   };
+  "ssr-speech": {
+    prettyLabel: string;
+    repoName: string;
+    repoUrl: string;
+    filter: false;
+    countDownloads: string;
+  };
   "stable-audio-tools": {
     prettyLabel: string;
     repoName: string;
@@ -573,6 +587,13 @@ export declare const MODEL_LIBRARIES_UI_ELEMENTS: {
     countDownloads: string;
     snippets: () => string[];
   };
+  soloaudio: {
+    prettyLabel: string;
+    repoName: string;
+    repoUrl: string;
+    filter: false;
+    countDownloads: string;
+  };
   "stable-baselines3": {
     prettyLabel: string;
     repoName: string;
@@ -644,6 +665,13 @@ export declare const MODEL_LIBRARIES_UI_ELEMENTS: {
     filter: true;
     countDownloads: string;
   };
+  "vfi-mamba": {
+    prettyLabel: string;
+    repoName: string;
+    repoUrl: string;
+    countDownloads: string;
+    snippets: (model: ModelData) => string[];
+  };
   voicecraft: {
     prettyLabel: string;
     repoName: string;
@@ -666,8 +694,16 @@ export declare const MODEL_LIBRARIES_UI_ELEMENTS: {
     snippets: () => string[];
     countDownloads: string;
   };
+  "3dtopia-xl": {
+    prettyLabel: string;
+    repoName: string;
+    repoUrl: string;
+    filter: false;
+    countDownloads: string;
+    snippets: (model: ModelData) => string[];
+  };
 };
 export type ModelLibraryKey = keyof typeof MODEL_LIBRARIES_UI_ELEMENTS;
-
export declare const ALL_MODEL_LIBRARY_KEYS: ("adapter-transformers" | "allennlp" | "asteroid" | "audiocraft" | "audioseal" | "bertopic" | "big_vision" | "birefnet" | "bm25s" | "champ" | "chat_tts" | "colpali" | "deepforest" | "depth-anything-v2" | "diffree" | "diffusers" | "diffusionkit" | "doctr" | "cartesia_pytorch" | "cartesia_mlx" | "edsnlp" | "elm" | "espnet" | "fairseq" | "fastai" | "fasttext" | "flair" | "gemma.cpp" | "gliner" | "glyph-byt5" | "grok" | "hallo" | "hunyuan-dit" | "keras" | "tf-keras" | "keras-nlp" | "k2" | "liveportrait" | "llama-cpp-python" | "mindspore" | "mamba-ssm" | "mars5-tts" | "mesh-anything" | "ml-agents" | "mlx" | "mlx-image" | "mlc-llm" | "nemo" | "open_clip" | "paddlenlp" | "peft" | "pyannote-audio" | "py-feat" | "pythae" | "recurrentgemma" | "relik" | "refiners" | "saelens" | "sam2" | "sample-factory" | "sentence-transformers" | "setfit" | "sklearn" | "spacy" | "span-marker" | "speechbrain" | "stable-audio-tools" | "diffusion-single-file" | "seed-story" | "stable-baselines3" | "stanza" | "tensorflowtts" | "tic-clip" | "timesfm" | "timm" | "transformers" | "transformers.js" | "unity-sentis" | "voicecraft" | "yolov10" | "whisperkit")[];
-
export declare const ALL_DISPLAY_MODEL_LIBRARY_KEYS: ("adapter-transformers" | "allennlp" | "asteroid" | "audiocraft" | "audioseal" | "bertopic" | "big_vision" | "birefnet" | "bm25s" | "champ" | "chat_tts" | "colpali" | "deepforest" | "depth-anything-v2" | "diffree" | "diffusers" | "diffusionkit" | "doctr" | "cartesia_pytorch" | "cartesia_mlx" | "edsnlp" | "elm" | "espnet" | "fairseq" | "fastai" | "fasttext" | "flair" | "gemma.cpp" | "gliner" | "glyph-byt5" | "grok" | "hallo" | "hunyuan-dit" | "keras" | "tf-keras" | "keras-nlp" | "k2" | "liveportrait" | "llama-cpp-python" | "mindspore" | "mamba-ssm" | "mars5-tts" | "mesh-anything" | "ml-agents" | "mlx" | "mlx-image" | "mlc-llm" | "nemo" | "open_clip" | "paddlenlp" | "peft" | "pyannote-audio" | "py-feat" | "pythae" | "recurrentgemma" | "relik" | "refiners" | "saelens" | "sam2" | "sample-factory" | "sentence-transformers" | "setfit" | "sklearn" | "spacy" | "span-marker" | "speechbrain" | "stable-audio-tools" | "diffusion-single-file" | "seed-story" | "stable-baselines3" | "stanza" | "tensorflowtts" | "tic-clip" | "timesfm" | "timm" | "transformers" | "transformers.js" | "unity-sentis" | "voicecraft" | "yolov10" | "whisperkit")[];
+
export declare const ALL_MODEL_LIBRARY_KEYS: ("adapter-transformers" | "allennlp" | "asteroid" | "audiocraft" | "audioseal" | "bertopic" | "big_vision" | "birefnet" | "bm25s" | "champ" | "chat_tts" | "colpali" | "deepforest" | "depth-anything-v2" | "diffree" | "diffusers" | "diffusionkit" | "doctr" | "cartesia_pytorch" | "cartesia_mlx" | "edsnlp" | "elm" | "espnet" | "fairseq" | "fastai" | "fasttext" | "flair" | "gemma.cpp" | "gliner" | "glyph-byt5" | "grok" | "hallo" | "hunyuan-dit" | "keras" | "tf-keras" | "keras-nlp" | "k2" | "liveportrait" | "llama-cpp-python" | "mindspore" | "mamba-ssm" | "mars5-tts" | "mesh-anything" | "ml-agents" | "mlx" | "mlx-image" | "mlc-llm" | "nemo" | "open_clip" | "paddlenlp" | "peft" | "pyannote-audio" | "py-feat" | "pythae" | "recurrentgemma" | "relik" | "refiners" | "saelens" | "sam2" | "sample-factory" | "sapiens" | "sentence-transformers" | "setfit" | "sklearn" | "spacy" | "span-marker" | "speechbrain" | "ssr-speech" | "stable-audio-tools" | "diffusion-single-file" | "seed-story" | "soloaudio" | "stable-baselines3" | "stanza" | "tensorflowtts" | "tic-clip" | "timesfm" | "timm" | "transformers" | "transformers.js" | "unity-sentis" | "vfi-mamba" | "voicecraft" | "yolov10" | "whisperkit" | "3dtopia-xl")[];
+
export declare const ALL_DISPLAY_MODEL_LIBRARY_KEYS: ("adapter-transformers" | "allennlp" | "asteroid" | "audiocraft" | "audioseal" | "bertopic" | "big_vision" | "birefnet" | "bm25s" | "champ" | "chat_tts" | "colpali" | "deepforest" | "depth-anything-v2" | "diffree" | "diffusers" | "diffusionkit" | "doctr" | "cartesia_pytorch" | "cartesia_mlx" | "edsnlp" | "elm" | "espnet" | "fairseq" | "fastai" | "fasttext" | "flair" | "gemma.cpp" | "gliner" | "glyph-byt5" | "grok" | "hallo" | "hunyuan-dit" | "keras" | "tf-keras" | "keras-nlp" | "k2" | "liveportrait" | "llama-cpp-python" | "mindspore" | "mamba-ssm" | "mars5-tts" | "mesh-anything" | "ml-agents" | "mlx" | "mlx-image" | "mlc-llm" | "nemo" | "open_clip" | "paddlenlp" | "peft" | "pyannote-audio" | "py-feat" | "pythae" | "recurrentgemma" | "relik" | "refiners" | "saelens" | "sam2" | "sample-factory" | "sapiens" | "sentence-transformers" | "setfit" | "sklearn" | "spacy" | "span-marker" | "speechbrain" | "ssr-speech" | "stable-audio-tools" | "diffusion-single-file" | "seed-story" | "soloaudio" | "stable-baselines3" | "stanza" | "tensorflowtts" | "tic-clip" | "timesfm" | "timm" | "transformers" | "transformers.js" | "unity-sentis" | "vfi-mamba" | "voicecraft" | "yolov10" | "whisperkit" | "3dtopia-xl")[];
//# sourceMappingURL=model-libraries.d.ts.map
package/dist/src/model-libraries.d.ts.map
CHANGED
@@ -1 +1 @@
-
{"version":3,"file":"model-libraries.d.ts","sourceRoot":"","sources":["../../src/model-libraries.ts"],"names":[],"mappings":"AACA,OAAO,KAAK,EAAE,SAAS,EAAE,MAAM,cAAc,CAAC;AAC9C,OAAO,KAAK,EAAE,kBAAkB,EAAE,MAAM,6BAA6B,CAAC;AAEtE;;GAEG;AACH,MAAM,WAAW,gBAAgB;IAChC;;;;OAIG;IACH,WAAW,EAAE,MAAM,CAAC;IACpB;;OAEG;IACH,QAAQ,EAAE,MAAM,CAAC;IACjB;;OAEG;IACH,OAAO,EAAE,MAAM,CAAC;IAChB;;OAEG;IACH,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB;;OAEG;IACH,QAAQ,CAAC,EAAE,CAAC,KAAK,EAAE,SAAS,KAAK,MAAM,EAAE,CAAC;IAC1C;;;;;OAKG;IACH,cAAc,CAAC,EAAE,kBAAkB,CAAC;IACpC;;;OAGG;IACH,MAAM,CAAC,EAAE,OAAO,CAAC;CACjB;AAED;;;;;;;;;;;;;GAaG;AAEH,eAAO,MAAM,2BAA2B
+
{"version":3,"file":"model-libraries.d.ts","sourceRoot":"","sources":["../../src/model-libraries.ts"],"names":[],"mappings":"AACA,OAAO,KAAK,EAAE,SAAS,EAAE,MAAM,cAAc,CAAC;AAC9C,OAAO,KAAK,EAAE,kBAAkB,EAAE,MAAM,6BAA6B,CAAC;AAEtE;;GAEG;AACH,MAAM,WAAW,gBAAgB;IAChC;;;;OAIG;IACH,WAAW,EAAE,MAAM,CAAC;IACpB;;OAEG;IACH,QAAQ,EAAE,MAAM,CAAC;IACjB;;OAEG;IACH,OAAO,EAAE,MAAM,CAAC;IAChB;;OAEG;IACH,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB;;OAEG;IACH,QAAQ,CAAC,EAAE,CAAC,KAAK,EAAE,SAAS,KAAK,MAAM,EAAE,CAAC;IAC1C;;;;;OAKG;IACH,cAAc,CAAC,EAAE,kBAAkB,CAAC;IACpC;;;OAGG;IACH,MAAM,CAAC,EAAE,OAAO,CAAC;CACjB;AAED;;;;;;;;;;;;;GAaG;AAEH,eAAO,MAAM,2BAA2B;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CA2oBI,CAAC;AAE7C,MAAM,MAAM,eAAe,GAAG,MAAM,OAAO,2BAA2B,CAAC;AAEvE,eAAO,MAAM,sBAAsB,8rCAAgE,CAAC;AAEpG,eAAO,MAAM,8BAA8B,8rCAQ1B,CAAC"}
package/dist/src/tasks/keypoint-detection/data.d.ts.map
CHANGED
@@ -1 +1 @@
-
{"version":3,"file":"data.d.ts","sourceRoot":"","sources":["../../../../src/tasks/keypoint-detection/data.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,cAAc,EAAE,MAAM,IAAI,CAAC;AAEzC,QAAA,MAAM,QAAQ,EAAE,
+
{"version":3,"file":"data.d.ts","sourceRoot":"","sources":["../../../../src/tasks/keypoint-detection/data.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,cAAc,EAAE,MAAM,IAAI,CAAC;AAEzC,QAAA,MAAM,QAAQ,EAAE,cA6Cf,CAAC;AAEF,eAAe,QAAQ,CAAC"}
package/dist/src/tasks/video-text-to-text/data.d.ts.map
ADDED
@@ -0,0 +1 @@
+
{"version":3,"file":"data.d.ts","sourceRoot":"","sources":["../../../../src/tasks/video-text-to-text/data.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,cAAc,EAAE,MAAM,IAAI,CAAC;AAEzC,QAAA,MAAM,QAAQ,EAAE,cAqDf,CAAC;AAEF,eAAe,QAAQ,CAAC"}
package/package.json
CHANGED
@@ -1,7 +1,7 @@
 {
   "name": "@huggingface/tasks",
   "packageManager": "pnpm@8.10.5",
-  "version": "0.12.
+  "version": "0.12.5",
   "description": "List of ML tasks for huggingface.co/tasks",
   "repository": "https://github.com/huggingface/huggingface.js.git",
   "publishConfig": {
package/src/hardware.ts
CHANGED
@@ -176,6 +176,14 @@ export const SKUS = {
       tflops: 14.93,
       memory: [8],
     },
+    "RTX 2070 SUPER Mobile": {
+      tflops: 14.13,
+      memory: [8],
+    },
+    "RTX 2070 SUPER": {
+      tflops: 18.12,
+      memory: [8],
+    },
     "RTX 3050 Mobile": {
       tflops: 7.639,
       memory: [6],
@@ -275,6 +283,23 @@ export const SKUS = {
     memory: [16],
   },
 },
+QUALCOMM: {
+  "Snapdragon X Elite X1E-00-1DE": {
+    tflops: 4.6,
+  },
+  "Snapdragon X Elite X1E-84-100": {
+    tflops: 4.6,
+  },
+  "Snapdragon X Elite X1E-80-100": {
+    tflops: 3.8,
+  },
+  "Snapdragon X Elite X1E-78-100": {
+    tflops: 3.8,
+  },
+  "Snapdragon X Plus X1P-64-100": {
+    tflops: 3.8,
+  },
+},
 },
 CPU: {
   Intel: {
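For orientation, each `SKUS` entry maps a device name to its peak `tflops` and, where it applies, the possible `memory` configurations in GB; the new Snapdragon entries carry only a TFLOPs figure. A minimal sketch of reading the table, assuming (as the hunk context suggests) that the `QUALCOMM` group sits under the top-level `GPU` key and that `SKUS` is re-exported from the package root:

```typescript
import { SKUS } from "@huggingface/tasks";

// One of the NVIDIA SKUs added in this release: peak TFLOPs plus memory options in GB.
const gpu = SKUS.GPU.NVIDIA["RTX 2070 SUPER"];
console.log(gpu.tflops, gpu.memory); // 18.12 [ 8 ]

// The new Qualcomm NPU entries list only a TFLOPs figure, with no memory array.
const npu = SKUS.GPU.QUALCOMM["Snapdragon X Elite X1E-84-100"];
console.log(npu.tflops); // 4.6
```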
package/src/model-libraries-snippets.ts
CHANGED
@@ -1,4 +1,5 @@
 import type { ModelData } from "./model-data";
+import type { WidgetExampleTextInput } from "./widget-example";
 import { LIBRARY_TASK_MAPPING } from "./library-to-tasks";
 
 const TAG_CUSTOM_CODE = "custom_code";
@@ -8,6 +9,8 @@ function nameWithoutNamespace(modelId: string): string {
   return splitted.length === 1 ? splitted[0] : splitted[1];
 }
 
+const escapeStringForJson = (str: string): string => JSON.stringify(str);
+
 //#region snippets
 
 export const adapters = (model: ModelData): string[] => [
@@ -70,6 +73,13 @@ function get_base_diffusers_model(model: ModelData): string {
   return model.cardData?.base_model?.toString() ?? "fill-in-base-model";
 }
 
+function get_prompt_from_diffusers_model(model: ModelData): string | undefined {
+  const prompt = (model.widgetData?.[0] as WidgetExampleTextInput).text ?? model.cardData?.instance_prompt;
+  if (prompt) {
+    return escapeStringForJson(prompt);
+  }
+}
+
 export const bertopic = (model: ModelData): string[] => [
   `from bertopic import BERTopic
 
@@ -129,17 +139,22 @@ depth = model.infer_image(raw_img) # HxW raw depth map in numpy
 ];
 };
 
+const diffusersDefaultPrompt = "Astronaut in a jungle, cold color palette, muted colors, detailed, 8k";
+
 const diffusers_default = (model: ModelData) => [
   `from diffusers import DiffusionPipeline
 
-
+pipe = DiffusionPipeline.from_pretrained("${model.id}")
+
+prompt = "${get_prompt_from_diffusers_model(model) ?? diffusersDefaultPrompt}"
+image = pipe(prompt).images[0]`,
 ];
 
 const diffusers_controlnet = (model: ModelData) => [
   `from diffusers import ControlNetModel, StableDiffusionControlNetPipeline
 
 controlnet = ControlNetModel.from_pretrained("${model.id}")
-
+pipe = StableDiffusionControlNetPipeline.from_pretrained(
   "${get_base_diffusers_model(model)}", controlnet=controlnet
 )`,
 ];
@@ -147,15 +162,18 @@ pipeline = StableDiffusionControlNetPipeline.from_pretrained(
 const diffusers_lora = (model: ModelData) => [
   `from diffusers import DiffusionPipeline
 
-
-
+pipe = DiffusionPipeline.from_pretrained("${get_base_diffusers_model(model)}")
+pipe.load_lora_weights("${model.id}")
+
+prompt = "${get_prompt_from_diffusers_model(model) ?? diffusersDefaultPrompt}"
+image = pipe(prompt).images[0]`,
 ];
 
 const diffusers_textual_inversion = (model: ModelData) => [
   `from diffusers import DiffusionPipeline
 
-
-
+pipe = DiffusionPipeline.from_pretrained("${get_base_diffusers_model(model)}")
+pipe.load_textual_inversion("${model.id}")`,
 ];
 
 export const diffusers = (model: ModelData): string[] => {
@@ -871,6 +889,12 @@ IWorker engine = WorkerFactory.CreateWorker(BackendType.GPUCompute, model);
 `,
 ];
 
+export const vfimamba = (model: ModelData): string[] => [
+  `from Trainer_finetune import Model
+
+model = Model.from_pretrained("${model.id}")`,
+];
+
 export const voicecraft = (model: ModelData): string[] => [
   `from voicecraft import VoiceCraft
 
@@ -995,4 +1019,11 @@ whisperkit-cli transcribe --audio-path /path/to/audio.mp3
 # Or use your preferred model variant
 whisperkit-cli transcribe --model "large-v3" --model-prefix "distil" --audio-path /path/to/audio.mp3 --verbose`,
 ];
+
+export const threedtopia_xl = (model: ModelData): string[] => [
+  `from threedtopia_xl.models import threedtopia_xl
+
+model = threedtopia_xl.from_pretrained("${model.id}")
+model.generate(cond="path/to/image.png")`,
+];
 //#endregion
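The change above makes the generated diffusers snippets prompt-aware: `get_prompt_from_diffusers_model` reads the repo's first widget example, falls back to `cardData.instance_prompt`, and JSON-escapes the result, while `diffusersDefaultPrompt` fills in when neither exists. A sketch of exercising this through the exported registry; the model payload below is hypothetical, and only the fields the snippet actually reads are filled in:

```typescript
import { MODEL_LIBRARIES_UI_ELEMENTS, type ModelData } from "@huggingface/tasks";

// Hypothetical LoRA repo. The "lora" tag routes `diffusers` to the LoRA snippet;
// the widget example text feeds the generated `prompt = "..."` line.
const model = {
  id: "some-user/some-sdxl-lora",
  tags: ["lora"],
  widgetData: [{ text: "a photo of sks dog" }],
  cardData: { base_model: "stabilityai/stable-diffusion-xl-base-1.0" },
} as unknown as ModelData;

const [snippet] = MODEL_LIBRARIES_UI_ELEMENTS.diffusers.snippets(model);
// -> a Python snippet that loads the base model, attaches the LoRA weights,
//    and uses the widget prompt instead of the stock astronaut prompt.
console.log(snippet);
```

Note that `get_prompt_from_diffusers_model` dereferences `model.widgetData?.[0]` without a trailing `?.`, so a repo with no widget data at all would throw here; callers may want to guard for that.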
package/src/model-libraries.ts
CHANGED
@@ -458,7 +458,7 @@ export const MODEL_LIBRARIES_UI_ELEMENTS = {
   repoName: "pythae",
   repoUrl: "https://github.com/clementchadebec/benchmark_VAE",
   snippets: snippets.pythae,
-  filter:
+  filter: false,
 },
 recurrentgemma: {
   prettyLabel: "RecurrentGemma",
@@ -506,6 +506,13 @@ export const MODEL_LIBRARIES_UI_ELEMENTS = {
   filter: true,
   countDownloads: `path:"cfg.json"`,
 },
+sapiens: {
+  prettyLabel: "sapiens",
+  repoName: "sapiens",
+  repoUrl: "https://github.com/facebookresearch/sapiens",
+  filter: false,
+  countDownloads: `path_extension:"pt2" OR path_extension:"pth" OR path_extension:"onnx"`,
+},
 "sentence-transformers": {
   prettyLabel: "sentence-transformers",
   repoName: "sentence-transformers",
@@ -556,6 +563,13 @@ export const MODEL_LIBRARIES_UI_ELEMENTS = {
   filter: true,
   countDownloads: `path:"hyperparams.yaml"`,
 },
+"ssr-speech": {
+  prettyLabel: "SSR-Speech",
+  repoName: "SSR-Speech",
+  repoUrl: "https://github.com/WangHelin1997/SSR-Speech",
+  filter: false,
+  countDownloads: `path_extension:".pth"`,
+},
 "stable-audio-tools": {
   prettyLabel: "Stable Audio Tools",
   repoName: "stable-audio-tools",
@@ -579,6 +593,13 @@ export const MODEL_LIBRARIES_UI_ELEMENTS = {
   countDownloads: `path:"cvlm_llama2_tokenizer/tokenizer.model"`,
   snippets: snippets.seed_story,
 },
+soloaudio: {
+  prettyLabel: "SoloAudio",
+  repoName: "SoloAudio",
+  repoUrl: "https://github.com/WangHelin1997/SoloAudio",
+  filter: false,
+  countDownloads: `path:"soloaudio_v2.pt"`,
+},
 "stable-baselines3": {
   prettyLabel: "stable-baselines3",
   repoName: "stable-baselines3",
@@ -650,6 +671,13 @@ export const MODEL_LIBRARIES_UI_ELEMENTS = {
   filter: true,
   countDownloads: `path_extension:"sentis"`,
 },
+"vfi-mamba": {
+  prettyLabel: "VFIMamba",
+  repoName: "VFIMamba",
+  repoUrl: "https://github.com/MCG-NJU/VFIMamba",
+  countDownloads: `path_extension:"pkl"`,
+  snippets: snippets.vfimamba,
+},
 voicecraft: {
   prettyLabel: "VoiceCraft",
   repoName: "VoiceCraft",
@@ -672,6 +700,14 @@ export const MODEL_LIBRARIES_UI_ELEMENTS = {
   snippets: snippets.whisperkit,
   countDownloads: `path_filename:"model" AND path_extension:"mil" AND _exists_:"path_prefix"`,
 },
+"3dtopia-xl": {
+  prettyLabel: "3DTopia-XL",
+  repoName: "3DTopia-XL",
+  repoUrl: "https://github.com/3DTopia/3DTopia-XL",
+  filter: false,
+  countDownloads: `path:"model_vae_fp16.pt"`,
+  snippets: snippets.threedtopia_xl,
+},
 } satisfies Record<string, LibraryUiElement>;
 
 export type ModelLibraryKey = keyof typeof MODEL_LIBRARIES_UI_ELEMENTS;
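Each entry added above follows the `LibraryUiElement` shape: `prettyLabel` is the display name, `repoName`/`repoUrl` point at the library's code, `filter` marks whether the library shows up in the Hub's library filter, `countDownloads` is a file query that defines which file downloads count toward the library's totals, and `snippets` renders the usage snippet. A small sketch of consuming the new entries through the public exports (the key list is exactly the one registered in this diff):

```typescript
import { ALL_MODEL_LIBRARY_KEYS, MODEL_LIBRARIES_UI_ELEMENTS } from "@huggingface/tasks";

// The five libraries registered in this release are now valid registry keys.
for (const key of ["sapiens", "ssr-speech", "soloaudio", "vfi-mamba", "3dtopia-xl"] as const) {
  const entry = MODEL_LIBRARIES_UI_ELEMENTS[key];
  // e.g. `path:"model_vae_fp16.pt"` for 3dtopia-xl: only downloads of files
  // matching this query are counted for repos tagged with the library.
  console.log(entry.prettyLabel, entry.countDownloads);
  console.log(ALL_MODEL_LIBRARY_KEYS.includes(key)); // true
}
```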
package/src/tasks/keypoint-detection/about.md
CHANGED
@@ -36,16 +36,14 @@ model = SuperPointForKeypointDetection.from_pretrained("magic-leap-community/sup
 inputs = processor(image, return_tensors="pt").to(model.device, model.dtype)
 outputs = model(**inputs)
 
-#
+# postprocess
+image_sizes = [(image.size[1], image.size[0])]
+outputs = processor.post_process_keypoint_detection(model_outputs, image_sizes)
+keypoints = outputs[0]["keypoints"].detach().numpy()
+scores = outputs[0]["scores"].detach().numpy()
 image_width, image_height = image.size
-image_mask = outputs.mask
-image_indices = torch.nonzero(image_mask).squeeze()
-
-image_scores = outputs.scores.squeeze()
-image_keypoints = outputs.keypoints.squeeze()
-keypoints = image_keypoints.detach().numpy()
-scores = image_scores.detach().numpy()
 
+# plot
 plt.axis('off')
 plt.imshow(image)
 plt.scatter(
package/src/tasks/keypoint-detection/data.ts
CHANGED
@@ -37,6 +37,10 @@ const taskData: TaskDataCustom = {
   description: "An application that detects hand keypoints in real-time.",
   id: "datasciencedojo/Hand-Keypoint-Detection-Realtime",
 },
+{
+  description: "An application to try a universal keypoint detection model.",
+  id: "merve/SuperPoint",
+},
 ],
 summary: "Keypoint detection is the task of identifying meaningful distinctive points or features in an image.",
 widgetModels: [],
package/src/tasks/text-to-image/about.md
CHANGED
@@ -2,7 +2,7 @@
 
 ### Data Generation
 
-Businesses can generate data for their
+Businesses can generate data for their use cases by inputting text and getting image outputs.
 
 ### Immersive Conversational Chatbots
 
@@ -16,9 +16,27 @@ Different patterns can be generated to obtain unique pieces of fashion. Text-to-
 
 Architects can utilise the models to construct an environment based out on the requirements of the floor plan. This can also include the furniture that has to be placed in that environment.
 
-##
+## Task Variants
 
-
+### Image Editing
+
+Image editing with text-to-image models involves modifying an image following edit instructions provided in a text prompt.
+
+- **Synthetic image editing**: Adjusting images that were initially created using an input prompt while preserving the overall meaning or context of the original image.
+
+![Synthetic Image Editing]()
+_Figure taken from ["InstructPix2Pix: Learning to Follow Image Editing Instructions"](https://www.timothybrooks.com/instruct-pix2pix)_
+
+- **Real image editing**: Similar to synthetic image editing, except we're using real photos/images. This task is usually more complex.
+
+![Real Image Editing]()
+_Figure taken from ["Prompt-to-Prompt Image Editing with Cross-Attention Control"](https://prompt-to-prompt.github.io)_
+
+### Personalization
+
+Personalization refers to techniques used to customize text-to-image models. We introduce new subjects or concepts to the model, which the model can then generate when we refer to them with a text prompt.
+
+For example, you can use these techniques to generate images of your dog in imaginary settings, after you have taught the model using a few reference images of the subject (or just one in some cases). Teaching the model a new concept can be achieved through fine-tuning, or by using training-free techniques.
 
 ## Inference
 
@@ -65,11 +83,14 @@ await inference.textToImage({
 - [Introducing Würstchen: Fast Diffusion for Image Generation](https://huggingface.co/blog/wuerstchen)
 - [Efficient Controllable Generation for SDXL with T2I-Adapters](https://huggingface.co/blog/t2i-sdxl-adapters)
 - [Welcome aMUSEd: Efficient Text-to-Image Generation](https://huggingface.co/blog/amused)
+- Image Editing Demos: [LEDITS++](https://huggingface.co/spaces/editing-images/leditsplusplus), [Turbo Edit](https://huggingface.co/spaces/turboedit/turbo_edit), [InstructPix2Pix](https://huggingface.co/spaces/timbrooks/instruct-pix2pix), [CosXL](https://huggingface.co/spaces/multimodalart/cosxl)
+- Training free Personalization Demos: [Face-to-All](https://huggingface.co/spaces/multimodalart/face-to-all), [InstantStyle](https://huggingface.co/spaces/InstantX/InstantStyle), [RB-modulation](https://huggingface.co/spaces/fffiloni/RB-Modulation), [Photomaker v2](https://huggingface.co/spaces/TencentARC/PhotoMaker-V2)
 
 ### Model Fine-tuning
 
 - [Finetune Stable Diffusion Models with DDPO via TRL](https://huggingface.co/blog/pref-tuning)
 - [LoRA training scripts of the world, unite!](https://huggingface.co/blog/sdxl_lora_advanced_script)
 - [Using LoRA for Efficient Stable Diffusion Fine-Tuning](https://huggingface.co/blog/lora)
+- LoRA fine tuning Spaces: [FLUX.1 finetuning](https://huggingface.co/spaces/autotrain-projects/train-flux-lora-ease), [SDXL finetuning](https://huggingface.co/spaces/multimodalart/lora-ease)
 
 This page was made possible thanks to the efforts of [Ishan Dutta](https://huggingface.co/ishandutta), [Enrique Elias Ubaldo](https://huggingface.co/herrius) and [Oğuz Akif](https://huggingface.co/oguzakif).
@@ -92,7 +92,7 @@ const taskData: TaskDataCustom = {
 	},
 	],
 	summary:
-		"
+		"Text-to-image is the task of generating images from input text. These pipelines can also be used to modify and edit images based on text prompts.",
 	widgetModels: ["black-forest-labs/FLUX.1-dev"],
 	youtubeId: "",
 };
@@ -0,0 +1,98 @@
+Most video language models can take a single video, multiple videos, a single image, or multiple images as input. Some of these models can also take interleaved inputs, where images and videos appear inside the text, so that the text prompt can refer back to each input image and video.
+
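For illustration, an interleaved prompt in the chat-template format used by Transformers processors might look like the sketch below; the exact content types a given checkpoint supports vary by model.

```python
# A sketch of an interleaved chat-template prompt: the user turn mixes a
# video, text, and an image, and the text refers back to both inputs.
# This structure is passed to processor.apply_chat_template(...).
conversation = [
    {
        "role": "user",
        "content": [
            {"type": "video"},
            {"type": "text", "text": "Does the image below show the same cat as this video?"},
            {"type": "image"},
        ],
    },
]
```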
+## Different Types of Video Language Models
+
+Video language models come in three types:
+
+- **Base:** Pre-trained models that can be fine-tuned.
+- **Instruction:** Base models fine-tuned on video-instruction pairs and answers.
+- **Chatty/Conversational:** Base models fine-tuned on video conversation datasets.
+
+## Use Cases
+
+### Video Question Answering
+
+Video language models trained on video-question-answer pairs can be used for video question answering and generating captions for videos.
+
+### Video Chat
+
+Video language models can be used to have a dialogue about a video.
+
+### Video Recognition with Instructions
+
+Video language models can recognize entities through descriptions. When given detailed descriptions of specific entities, they can classify those entities in a video.
+
+## Inference
+
+You can use the Transformers library to interact with video-language models.
+Below we load [a video language model](https://huggingface.co/llava-hf/LLaVA-NeXT-Video-7B-hf), write a small utility to sample frames from a video, use the chat template to format the text prompt, process the video together with the text prompt, and run inference. To run the snippet below, please install [OpenCV](https://pypi.org/project/opencv-python/) and Pillow by running `pip install opencv-python pillow`.
+
+```python
+import uuid
+
+import cv2
+import requests
+import torch
+from PIL import Image  # needed for Image.fromarray below
+from transformers import LlavaNextVideoProcessor, LlavaNextVideoForConditionalGeneration
+
+device = "cuda" if torch.cuda.is_available() else "cpu"
+model_id = "llava-hf/LLaVA-NeXT-Video-7B-hf"
+
+model = LlavaNextVideoForConditionalGeneration.from_pretrained(
+    model_id,
+    torch_dtype=torch.float16,
+    low_cpu_mem_usage=True,
+).to(device)
+
+processor = LlavaNextVideoProcessor.from_pretrained(model_id)
+
+def sample_frames(url, num_frames):
+    # Download the video to a temporary local file.
+    response = requests.get(url)
+    path = f"./{uuid.uuid4()}.mp4"
+    with open(path, "wb") as f:
+        f.write(response.content)
+
+    # Sample `num_frames` frames, evenly spaced across the video.
+    video = cv2.VideoCapture(path)
+    total_frames = int(video.get(cv2.CAP_PROP_FRAME_COUNT))
+    interval = max(total_frames // num_frames, 1)  # avoid division by zero on short clips
+    frames = []
+    for i in range(total_frames):
+        ret, frame = video.read()
+        if not ret:
+            continue
+        if i % interval == 0:
+            # OpenCV reads BGR; convert to RGB before building a PIL image.
+            frames.append(Image.fromarray(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)))
+    video.release()
+    return frames
+
+conversation = [
+    {
+        "role": "user",
+        "content": [
+            {"type": "text", "text": "Why is this video funny?"},
+            {"type": "video"},
+        ],
+    },
+]
+
+prompt = processor.apply_chat_template(conversation, add_generation_prompt=True)
+
+video_url = "https://huggingface.co/spaces/merve/llava-interleave/resolve/main/cats_1.mp4"
+video = sample_frames(video_url, 8)
+
+inputs = processor(text=prompt, videos=video, padding=True, return_tensors="pt").to(model.device)
+
+output = model.generate(**inputs, max_new_tokens=100, do_sample=False)
+print(processor.decode(output[0][2:], skip_special_tokens=True))
+
+# Why is this video funny? ASSISTANT: The humor in this video comes from the cat's facial expression and body language. The cat appears to be making a funny face, with its eyes squinted and mouth open, which can be interpreted as a playful or mischievous expression. Cats often make such faces when they are in a good mood or are playful, and this can be amusing to people who are familiar with their behavior. The combination of the cat's expression and the close-
+
+```
+
+## Useful Resources
+
+- [Transformers task guide on video-text-to-text](https://huggingface.co/docs/transformers/tasks/video_text_to_text)
@@ -0,0 +1,58 @@
+import type { TaskDataCustom } from "..";
+
+const taskData: TaskDataCustom = {
+	datasets: [
+		{
+			description: "Multiple-choice questions and answers about videos.",
+			id: "lmms-lab/Video-MME",
+		},
+		{
+			description: "A dataset of instructions and question-answer pairs about videos.",
+			id: "lmms-lab/VideoChatGPT",
+		},
+	],
+	demo: {
+		inputs: [
+			{
+				filename: "video-text-to-text-input.gif",
+				type: "img",
+			},
+			{
+				label: "Text Prompt",
+				content: "What is happening in this video?",
+				type: "text",
+			},
+		],
+		outputs: [
+			{
+				label: "Answer",
+				content:
+					"The video shows a series of images showing a fountain with water jets and a variety of colorful flowers and butterflies in the background.",
+				type: "text",
+			},
+		],
+	},
+	metrics: [],
+	models: [
+		{
+			description: "A robust video-text-to-text model that can take in image and video inputs.",
+			id: "llava-hf/llava-onevision-qwen2-72b-ov-hf",
+		},
+		{
+			description: "Large and powerful video-text-to-text model that can take in image and video inputs.",
+			id: "llava-hf/LLaVA-NeXT-Video-34B-hf",
+		},
+	],
+	spaces: [
+		{
+			description: "An application to chat with a video-text-to-text model.",
+			id: "llava-hf/video-llava",
+		},
+	],
+	summary:
+		"Video-text-to-text models take in a video and a text prompt and output text. These models are also called video-language models.",
+	widgetModels: [""],
+	youtubeId: "",
+};
+
+export default taskData;