@huggingface/tasks 0.12.23 → 0.12.24

This diff reflects the changes between two publicly released versions of the package, as published to a supported registry. It is provided for informational purposes only.
Files changed (44)
  1. package/dist/index.cjs +476 -123
  2. package/dist/index.js +476 -123
  3. package/dist/src/hardware.d.ts +20 -0
  4. package/dist/src/hardware.d.ts.map +1 -1
  5. package/dist/src/model-libraries-snippets.d.ts +1 -0
  6. package/dist/src/model-libraries-snippets.d.ts.map +1 -1
  7. package/dist/src/model-libraries.d.ts +9 -2
  8. package/dist/src/model-libraries.d.ts.map +1 -1
  9. package/dist/src/snippets/common.d.ts +20 -0
  10. package/dist/src/snippets/common.d.ts.map +1 -0
  11. package/dist/src/snippets/curl.d.ts +15 -8
  12. package/dist/src/snippets/curl.d.ts.map +1 -1
  13. package/dist/src/snippets/js.d.ts +17 -10
  14. package/dist/src/snippets/js.d.ts.map +1 -1
  15. package/dist/src/snippets/python.d.ts +20 -13
  16. package/dist/src/snippets/python.d.ts.map +1 -1
  17. package/dist/src/snippets/types.d.ts +4 -0
  18. package/dist/src/snippets/types.d.ts.map +1 -1
  19. package/dist/src/tasks/depth-estimation/data.d.ts.map +1 -1
  20. package/dist/src/tasks/image-text-to-text/data.d.ts.map +1 -1
  21. package/dist/src/tasks/text-to-speech/data.d.ts.map +1 -1
  22. package/dist/src/tasks/video-text-to-text/data.d.ts.map +1 -1
  23. package/dist/src/tasks/visual-question-answering/inference.d.ts +0 -1
  24. package/dist/src/tasks/visual-question-answering/inference.d.ts.map +1 -1
  25. package/package.json +1 -1
  26. package/src/hardware.ts +20 -0
  27. package/src/model-libraries-snippets.ts +7 -1
  28. package/src/model-libraries.ts +8 -1
  29. package/src/snippets/common.ts +63 -0
  30. package/src/snippets/curl.ts +71 -26
  31. package/src/snippets/js.ts +165 -40
  32. package/src/snippets/python.ts +186 -48
  33. package/src/snippets/types.ts +5 -0
  34. package/src/tasks/depth-estimation/data.ts +15 -7
  35. package/src/tasks/image-segmentation/data.ts +5 -5
  36. package/src/tasks/image-text-to-text/data.ts +17 -9
  37. package/src/tasks/keypoint-detection/data.ts +1 -1
  38. package/src/tasks/text-generation/data.ts +7 -7
  39. package/src/tasks/text-to-image/data.ts +2 -2
  40. package/src/tasks/text-to-speech/data.ts +5 -1
  41. package/src/tasks/text-to-video/data.ts +10 -10
  42. package/src/tasks/video-text-to-text/data.ts +8 -0
  43. package/src/tasks/visual-question-answering/inference.ts +0 -1
  44. package/src/tasks/visual-question-answering/spec/output.json +1 -1
package/dist/index.cjs CHANGED
@@ -2224,20 +2224,24 @@ var taskData11 = {
  id: "meta-llama/Llama-3.2-11B-Vision-Instruct"
  },
  {
- description: "Cutting-edge conversational vision language model that can take multiple image inputs.",
- id: "HuggingFaceM4/idefics2-8b-chatty"
+ description: "Cutting-edge vision language models.",
+ id: "allenai/Molmo-7B-D-0924"
  },
  {
  description: "Small yet powerful model.",
  id: "vikhyatk/moondream2"
  },
  {
- description: "Strong image-text-to-text model made to understand documents.",
- id: "mPLUG/DocOwl1.5"
+ description: "Strong image-text-to-text model.",
+ id: "Qwen/Qwen2-VL-7B-Instruct"
  },
  {
  description: "Strong image-text-to-text model.",
- id: "microsoft/Phi-3.5-vision-instruct"
+ id: "mistralai/Pixtral-12B-2409"
+ },
+ {
+ description: "Strong image-text-to-text model focused on documents.",
+ id: "stepfun-ai/GOT-OCR2_0"
  }
  ],
  spaces: [
@@ -2251,19 +2255,23 @@ var taskData11 = {
  },
  {
  description: "Powerful vision-language model assistant.",
- id: "liuhaotian/LLaVA-1.6"
+ id: "akhaliq/Molmo-7B-D-0924"
+ },
+ {
+ description: "An image-text-to-text application focused on documents.",
+ id: "stepfun-ai/GOT_official_online_demo"
  },
  {
  description: "An application to compare outputs of different vision language models.",
  id: "merve/compare_VLMs"
  },
  {
- description: "An application for document vision language tasks.",
- id: "mPLUG/DocOwl"
+ description: "An application for chatting with an image-text-to-text model.",
+ id: "GanymedeNil/Qwen2-VL-7B"
  }
  ],
  summary: "Image-text-to-text models take in an image and text prompt and output text. These models are also called vision-language models, or VLMs. The difference from image-to-text models is that these models take an additional text input, not restricting the model to certain use cases like image captioning, and may also be trained to accept a conversation as input.",
- widgetModels: ["microsoft/kosmos-2-patch14-224"],
+ widgetModels: ["meta-llama/Llama-3.2-11B-Vision-Instruct"],
  youtubeId: "IoGaGfU1CIg"
  };
  var data_default11 = taskData11;
@@ -2323,11 +2331,11 @@ var taskData12 = {
  id: "ZhengPeng7/BiRefNet"
  },
  {
- description: "Semantic segmentation model trained on ADE20k dataset.",
- id: "nvidia/segformer-b0-finetuned-ade-512-512"
+ description: "Powerful human-centric image segmentation model.",
+ id: "facebook/sapiens-seg-1b"
  },
  {
- description: "Panoptic segmentation model trained COCO (common objects) dataset.",
+ description: "Panoptic segmentation model trained on the COCO (common objects) dataset.",
  id: "facebook/mask2former-swin-large-coco-panoptic"
  }
  ],
@@ -2341,8 +2349,8 @@ var taskData12 = {
  id: "jbrinkma/segment-anything"
  },
  {
- description: "A semantic segmentation application that predicts human silhouettes.",
- id: "keras-io/Human-Part-Segmentation"
+ description: "A human-centric segmentation model.",
+ id: "facebook/sapiens-pose"
  },
  {
  description: "An instance segmentation application to predict neuronal cell types from microscopy images.",
@@ -2531,11 +2539,15 @@ var taskData15 = {
  },
  {
  description: "A strong monocular depth estimation model.",
- id: "Bingxin/Marigold"
+ id: "jingheya/lotus-depth-g-v1-0"
  },
  {
- description: "A metric depth estimation model trained on NYU dataset.",
- id: "Intel/zoedepth-nyu"
+ description: "A depth estimation model that predicts depth in videos.",
+ id: "tencent/DepthCrafter"
+ },
+ {
+ description: "A robust depth estimation model.",
+ id: "apple/DepthPro"
  }
  ],
  spaces: [
@@ -2544,12 +2556,16 @@ var taskData15 = {
  id: "radames/dpt-depth-estimation-3d-voxels"
  },
  {
- description: "An application on cutting-edge depth estimation.",
- id: "depth-anything/Depth-Anything-V2"
+ description: "An application for bleeding-edge depth estimation.",
+ id: "akhaliq/depth-pro"
+ },
+ {
+ description: "An application on cutting-edge depth estimation in videos.",
+ id: "tencent/DepthCrafter"
  },
  {
- description: "An application to try state-of-the-art depth estimation.",
- id: "merve/compare_depth_models"
+ description: "A human-centric depth estimation application.",
+ id: "facebook/sapiens-depth"
  }
  ],
  summary: "Depth estimation is the task of predicting depth of the objects present in an image.",
@@ -3127,8 +3143,8 @@ var taskData24 = {
  id: "jbilcke-hf/ai-comic-factory"
  },
  {
- description: "A text-to-image application that can generate coherent text inside the image.",
- id: "DeepFloyd/IF"
+ description: "An application to match multiple custom image generation models.",
+ id: "multimodalart/flux-lora-lab"
  },
  {
  description: "A powerful yet very fast image generation application.",
@@ -3211,9 +3227,13 @@ var taskData25 = {
  id: "suno/bark"
  },
  {
- description: "XTTS is a Voice generation model that lets you clone voices into different languages.",
+ description: "An application on XTTS, a voice generation model that lets you clone voices into different languages.",
  id: "coqui/xtts"
  },
+ {
+ description: "An application that generates speech in different styles in English and Chinese.",
+ id: "mrfakename/E2-F5-TTS"
+ },
  {
  description: "An application that synthesizes speech for diverse speaker prompts.",
  id: "parler-tts/parler_tts_mini"
@@ -3532,10 +3552,6 @@ var taskData29 = {
  description: "A text-generation model trained to follow instructions.",
  id: "google/gemma-2-2b-it"
  },
- {
- description: "A code generation model that can generate code in 80+ languages.",
- id: "bigcode/starcoder"
- },
  {
  description: "Very powerful text generation model trained to follow instructions.",
  id: "meta-llama/Meta-Llama-3.1-8B-Instruct"
@@ -3549,12 +3565,12 @@ var taskData29 = {
  id: "AI-MO/NuminaMath-7B-TIR"
  },
  {
- description: "Strong coding assistant model.",
- id: "HuggingFaceH4/starchat2-15b-v0.1"
+ description: "Strong text generation model to follow instructions.",
+ id: "Qwen/Qwen2.5-7B-Instruct"
  },
  {
  description: "Very strong open-source large language model.",
- id: "mistralai/Mistral-Nemo-Instruct-2407"
+ id: "nvidia/Llama-3.1-Nemotron-70B-Instruct"
  }
  ],
  spaces: [
@@ -3562,6 +3578,10 @@ var taskData29 = {
  description: "A leaderboard to compare different open-source text generation models based on various benchmarks.",
  id: "open-llm-leaderboard/open_llm_leaderboard"
  },
+ {
+ description: "A leaderboard for comparing chain-of-thought performance of models.",
+ id: "logikon/open_cot_leaderboard"
+ },
  {
  description: "An text generation based application based on a very powerful LLaMA2 model.",
  id: "ysharma/Explore_llamav2_with_TGI"
@@ -3648,30 +3668,30 @@ var taskData30 = {
  ],
  models: [
  {
- description: "A strong model for video generation.",
- id: "Vchitect/LaVie"
+ description: "A strong model for consistent video generation.",
+ id: "rain1011/pyramid-flow-sd3"
  },
  {
  description: "A robust model for text-to-video generation.",
- id: "damo-vilab/text-to-video-ms-1.7b"
+ id: "VideoCrafter/VideoCrafter2"
  },
  {
- description: "A text-to-video generation model with high quality and smooth outputs.",
- id: "hotshotco/Hotshot-XL"
+ description: "A cutting-edge text-to-video generation model.",
+ id: "TIGER-Lab/T2V-Turbo-V2"
  }
  ],
  spaces: [
  {
  description: "An application that generates video from text.",
- id: "fffiloni/zeroscope"
+ id: "VideoCrafter/VideoCrafter"
  },
  {
- description: "An application that generates video from image and text.",
- id: "Vchitect/LaVie"
+ description: "Consistent video generation application.",
+ id: "TIGER-Lab/T2V-Turbo-V2"
  },
  {
- description: "An application that generates videos from text and provides multi-model support.",
- id: "ArtGAN/Video-Diffusion-WebUI"
+ description: "A cutting edge video generation application.",
+ id: "Pyramid-Flow/pyramid-flow"
  }
  ],
  summary: "Text-to-video models can be used in any application that requires generating consistent sequence of images from text. "
@@ -4288,7 +4308,7 @@ var taskData39 = {
  },
  {
  description: "Strong keypoint detection model used to detect human pose.",
- id: "qualcomm/MediaPipe-Pose-Estimation"
+ id: "facebook/sapiens-pose-1b"
  }
  ],
  spaces: [
@@ -4317,6 +4337,10 @@ var taskData40 = {
  {
  description: "A dataset of instructions and question-answer pairs about videos.",
  id: "lmms-lab/VideoChatGPT"
+ },
+ {
+ description: "Large video understanding dataset.",
+ id: "HuggingFaceFV/finevideo"
  }
  ],
  demo: {
@@ -4354,6 +4378,10 @@ var taskData40 = {
  {
  description: "An application to chat with a video-text-to-text model.",
  id: "llava-hf/video-llava"
+ },
+ {
+ description: "A leaderboard for various video-text-to-text models.",
+ id: "opencompass/openvlm_video_leaderboard"
  }
  ],
  summary: "Video-text-to-text models take in a video and a text prompt and output text. These models are also called video-language models."
@@ -5243,7 +5271,7 @@ var transformersJS = (model) => {
  if (!model.pipeline_tag) {
  return [`// \u26A0\uFE0F Unknown pipeline tag`];
  }
- const libName = "@xenova/transformers";
+ const libName = "@huggingface/transformers";
  return [
  `// npm i ${libName}
  import { pipeline } from '${libName}';
@@ -5387,6 +5415,11 @@ var nemo = (model) => {
  }
  return command ?? [`# tag did not correspond to a valid NeMo domain.`];
  };
+ var pxia = (model) => [
+ `from pxia import AutoModel
+
+ model = AutoModel.from_pretrained("${model.id}")`
+ ];
  var pythae = (model) => [
  `from pythae.models import AutoModel

@@ -5872,6 +5905,13 @@ var MODEL_LIBRARIES_UI_ELEMENTS = {
  filter: true,
  countDownloads: `path:"adapter_config.json"`
  },
+ pxia: {
+ prettyLabel: "pxia",
+ repoName: "pxia",
+ repoUrl: "https://github.com/not-lain/pxia",
+ snippets: pxia,
+ filter: false
+ },
  "pyannote-audio": {
  prettyLabel: "pyannote.audio",
  repoName: "pyannote-audio",
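The new pxia registry entry above pairs the MODEL_LIBRARIES_UI_ELEMENTS record with the pxia snippet function added earlier in this diff. A minimal sketch of what that snippet function returns, assuming a purely illustrative model id:

  const model = { id: "not-lain/some-pxia-model" }; // hypothetical, for illustration only
  const [snippet] = pxia(model);
  // snippet:
  // from pxia import AutoModel
  //
  // model = AutoModel.from_pretrained("not-lain/some-pxia-model")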
@@ -6104,7 +6144,7 @@ var MODEL_LIBRARIES_UI_ELEMENTS = {
  "transformers.js": {
  prettyLabel: "Transformers.js",
  repoName: "transformers.js",
- repoUrl: "https://github.com/xenova/transformers.js",
+ repoUrl: "https://github.com/huggingface/transformers.js",
  docsUrl: "https://huggingface.co/docs/hub/transformers-js",
  snippets: transformersJS,
  filter: true
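With the library renamed from @xenova/transformers to @huggingface/transformers, the transformersJS snippet generator now emits the new package name. Only the template lines visible in this diff are shown below; the model id is illustrative:

  // transformersJS({ id: "user/some-model", pipeline_tag: "text-classification" }) begins with:
  // npm i @huggingface/transformers
  import { pipeline } from '@huggingface/transformers';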
@@ -6293,30 +6333,91 @@ __export(curl_exports, {
  snippetTextGeneration: () => snippetTextGeneration,
  snippetZeroShotClassification: () => snippetZeroShotClassification
  });
- var snippetBasic = (model, accessToken) => `curl https://api-inference.huggingface.co/models/${model.id} \\
+
+ // src/snippets/common.ts
+ function stringifyMessages(messages, opts) {
+ const keyRole = opts.attributeKeyQuotes ? `"role"` : "role";
+ const keyContent = opts.attributeKeyQuotes ? `"content"` : "content";
+ const messagesStringified = messages.map(({ role, content }) => {
+ if (typeof content === "string") {
+ content = JSON.stringify(content).slice(1, -1);
+ if (opts.customContentEscaper) {
+ content = opts.customContentEscaper(content);
+ }
+ return `{ ${keyRole}: "${role}", ${keyContent}: "${content}" }`;
+ } else {
+ 2;
+ content = content.map(({ image_url, text, type }) => ({
+ type,
+ image_url,
+ ...text ? { text: JSON.stringify(text).slice(1, -1) } : void 0
+ }));
+ content = JSON.stringify(content).slice(1, -1);
+ if (opts.customContentEscaper) {
+ content = opts.customContentEscaper(content);
+ }
+ return `{ ${keyRole}: "${role}", ${keyContent}: ${content} }`;
+ }
+ });
+ return opts.start + messagesStringified.join(opts.sep) + opts.end;
+ }
+ function stringifyGenerationConfig(config, opts) {
+ const quote = opts.attributeKeyQuotes ? `"` : "";
+ return opts.start + Object.entries(config).map(([key, val]) => `${quote}${key}${quote}${opts.attributeValueConnector}${val}`).join(opts.sep) + opts.end;
+ }
+
+ // src/snippets/curl.ts
+ var snippetBasic = (model, accessToken) => ({
+ content: `curl https://api-inference.huggingface.co/models/${model.id} \\
  -X POST \\
  -d '{"inputs": ${getModelInputSnippet(model, true)}}' \\
  -H 'Content-Type: application/json' \\
- -H "Authorization: Bearer ${accessToken || `{API_TOKEN}`}"`;
- var snippetTextGeneration = (model, accessToken) => {
+ -H "Authorization: Bearer ${accessToken || `{API_TOKEN}`}"`
+ });
+ var snippetTextGeneration = (model, accessToken, opts) => {
  if (model.tags.includes("conversational")) {
- return `curl 'https://api-inference.huggingface.co/models/${model.id}/v1/chat/completions' \\
+ const streaming = opts?.streaming ?? true;
+ const messages = opts?.messages ?? [
+ { role: "user", content: "What is the capital of France?" }
+ ];
+ const config = {
+ ...opts?.temperature ? { temperature: opts.temperature } : void 0,
+ max_tokens: opts?.max_tokens ?? 500,
+ ...opts?.top_p ? { top_p: opts.top_p } : void 0
+ };
+ return {
+ content: `curl 'https://api-inference.huggingface.co/models/${model.id}/v1/chat/completions' \\
  -H "Authorization: Bearer ${accessToken || `{API_TOKEN}`}" \\
  -H 'Content-Type: application/json' \\
- -d '{
- "model": "${model.id}",
- "messages": [{"role": "user", "content": "What is the capital of France?"}],
- "max_tokens": 500,
- "stream": false
- }'
- `;
+ --data '{
+ "model": "${model.id}",
+ "messages": ${stringifyMessages(messages, {
+ sep: ",\n ",
+ start: `[
+ `,
+ end: `
+ ]`,
+ attributeKeyQuotes: true,
+ customContentEscaper: (str) => str.replace(/'/g, "'\\''")
+ })},
+ ${stringifyGenerationConfig(config, {
+ sep: ",\n ",
+ start: "",
+ end: "",
+ attributeKeyQuotes: true,
+ attributeValueConnector: ": "
+ })},
+ "stream": ${!!streaming}
+ }'`
+ };
  } else {
  return snippetBasic(model, accessToken);
  }
  };
  var snippetImageTextToTextGeneration = (model, accessToken) => {
  if (model.tags.includes("conversational")) {
- return `curl 'https://api-inference.huggingface.co/models/${model.id}/v1/chat/completions' \\
+ return {
+ content: `curl 'https://api-inference.huggingface.co/models/${model.id}/v1/chat/completions' \\
  -H "Authorization: Bearer ${accessToken || `{API_TOKEN}`}" \\
  -H 'Content-Type: application/json' \\
  -d '{
@@ -6333,20 +6434,25 @@ var snippetImageTextToTextGeneration = (model, accessToken) => {
  "max_tokens": 500,
  "stream": false
  }'
- `;
+ `
+ };
  } else {
  return snippetBasic(model, accessToken);
  }
  };
- var snippetZeroShotClassification = (model, accessToken) => `curl https://api-inference.huggingface.co/models/${model.id} \\
+ var snippetZeroShotClassification = (model, accessToken) => ({
+ content: `curl https://api-inference.huggingface.co/models/${model.id} \\
  -X POST \\
  -d '{"inputs": ${getModelInputSnippet(model, true)}, "parameters": {"candidate_labels": ["refund", "legal", "faq"]}}' \\
  -H 'Content-Type: application/json' \\
- -H "Authorization: Bearer ${accessToken || `{API_TOKEN}`}"`;
- var snippetFile = (model, accessToken) => `curl https://api-inference.huggingface.co/models/${model.id} \\
+ -H "Authorization: Bearer ${accessToken || `{API_TOKEN}`}"`
+ });
+ var snippetFile = (model, accessToken) => ({
+ content: `curl https://api-inference.huggingface.co/models/${model.id} \\
  -X POST \\
  --data-binary '@${getModelInputSnippet(model, true, true)}' \\
- -H "Authorization: Bearer ${accessToken || `{API_TOKEN}`}"`;
+ -H "Authorization: Bearer ${accessToken || `{API_TOKEN}`}"`
+ });
  var curlSnippets = {
  // Same order as in js/src/lib/interfaces/Types.ts
  "text-classification": snippetBasic,
@@ -6374,7 +6480,7 @@ var curlSnippets = {
  "image-segmentation": snippetFile
  };
  function getCurlInferenceSnippet(model, accessToken) {
- return model.pipeline_tag && model.pipeline_tag in curlSnippets ? curlSnippets[model.pipeline_tag]?.(model, accessToken) ?? "" : "";
+ return model.pipeline_tag && model.pipeline_tag in curlSnippets ? curlSnippets[model.pipeline_tag]?.(model, accessToken) ?? { content: "" } : { content: "" };
  }
  function hasCurlInferenceSnippet(model) {
  return !!model.pipeline_tag && model.pipeline_tag in curlSnippets;
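The curl helpers above now return { content } objects instead of bare strings, with message and generation-config serialization centralized in the new common.ts helpers. A rough sketch of what those helpers produce, with illustrative inputs:

  stringifyMessages([{ role: "user", content: "Hi" }], { sep: ", ", start: "[", end: "]", attributeKeyQuotes: true });
  // -> '[{ "role": "user", "content": "Hi" }]'

  stringifyGenerationConfig({ max_tokens: 500 }, { sep: ", ", start: "", end: "", attributeKeyQuotes: true, attributeValueConnector: ": " });
  // -> '"max_tokens": 500'

  getCurlInferenceSnippet(model, accessToken); // now { content: "curl https://api-inference.huggingface.co/..." }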
@@ -6397,18 +6503,114 @@ __export(python_exports, {
  snippetZeroShotClassification: () => snippetZeroShotClassification2,
  snippetZeroShotImageClassification: () => snippetZeroShotImageClassification
  });
- var snippetConversational = (model, accessToken) => `from huggingface_hub import InferenceClient
+ var snippetConversational = (model, accessToken, opts) => {
+ const streaming = opts?.streaming ?? true;
+ const messages = opts?.messages ?? [
+ { role: "user", content: "What is the capital of France?" }
+ ];
+ const messagesStr = stringifyMessages(messages, {
+ sep: ",\n ",
+ start: `[
+ `,
+ end: `
+ ]`,
+ attributeKeyQuotes: true
+ });
+ const config = {
+ ...opts?.temperature ? { temperature: opts.temperature } : void 0,
+ max_tokens: opts?.max_tokens ?? 500,
+ ...opts?.top_p ? { top_p: opts.top_p } : void 0
+ };
+ const configStr = stringifyGenerationConfig(config, {
+ sep: ",\n ",
+ start: "",
+ end: "",
+ attributeValueConnector: "="
+ });
+ if (streaming) {
+ return [
+ {
+ client: "huggingface_hub",
+ content: `from huggingface_hub import InferenceClient

  client = InferenceClient(api_key="${accessToken || "{API_TOKEN}"}")

- for message in client.chat_completion(
- model="${model.id}",
- messages=[{"role": "user", "content": "What is the capital of France?"}],
- max_tokens=500,
- stream=True,
- ):
- print(message.choices[0].delta.content, end="")`;
- var snippetConversationalWithImage = (model, accessToken) => `from huggingface_hub import InferenceClient
+ messages = ${messagesStr}
+
+ stream = client.chat.completions.create(
+ model="${model.id}",
+ messages=messages,
+ ${configStr},
+ stream=True
+ )
+
+ for chunk in stream:
+ print(chunk.choices[0].delta.content)`
+ },
+ {
+ client: "openai",
+ content: `from openai import OpenAI
+
+ client = OpenAI(
+ base_url="https://api-inference.huggingface.co/v1/",
+ api_key="${accessToken || "{API_TOKEN}"}"
+ )
+
+ messages = ${messagesStr}
+
+ stream = client.chat.completions.create(
+ model="${model.id}",
+ messages=messages,
+ ${configStr},
+ stream=True
+ )
+
+ for chunk in stream:
+ print(chunk.choices[0].delta.content)`
+ }
+ ];
+ } else {
+ return [
+ {
+ client: "huggingface_hub",
+ content: `from huggingface_hub import InferenceClient
+
+ client = InferenceClient(api_key="${accessToken || "{API_TOKEN}"}")
+
+ messages = ${messagesStr}
+
+ completion = client.chat.completions.create(
+ model="${model.id}",
+ messages=messages,
+ ${configStr}
+ )
+
+ print(completion.choices[0].message)`
+ },
+ {
+ client: "openai",
+ content: `from openai import OpenAI
+
+ client = OpenAI(
+ base_url="https://api-inference.huggingface.co/v1/",
+ api_key="${accessToken || "{API_TOKEN}"}"
+ )
+
+ messages = ${messagesStr}
+
+ completion = client.chat.completions.create(
+ model="${model.id}",
+ messages=messages,
+ ${configStr}
+ )
+
+ print(completion.choices[0].message)`
+ }
+ ];
+ }
+ };
+ var snippetConversationalWithImage = (model, accessToken) => ({
+ content: `from huggingface_hub import InferenceClient

  client = InferenceClient(api_key="${accessToken || "{API_TOKEN}"}")

@@ -6428,16 +6630,20 @@ for message in client.chat_completion(
  max_tokens=500,
  stream=True,
  ):
- print(message.choices[0].delta.content, end="")`;
- var snippetZeroShotClassification2 = (model) => `def query(payload):
+ print(message.choices[0].delta.content, end="")`
+ });
+ var snippetZeroShotClassification2 = (model) => ({
+ content: `def query(payload):
  response = requests.post(API_URL, headers=headers, json=payload)
  return response.json()

  output = query({
  "inputs": ${getModelInputSnippet(model)},
  "parameters": {"candidate_labels": ["refund", "legal", "faq"]},
- })`;
- var snippetZeroShotImageClassification = (model) => `def query(data):
+ })`
+ });
+ var snippetZeroShotImageClassification = (model) => ({
+ content: `def query(data):
  with open(data["image_path"], "rb") as f:
  img = f.read()
  payload={
@@ -6450,22 +6656,28 @@ var snippetZeroShotImageClassification = (model) => `def query(data):
  output = query({
  "image_path": ${getModelInputSnippet(model)},
  "parameters": {"candidate_labels": ["cat", "dog", "llama"]},
- })`;
- var snippetBasic2 = (model) => `def query(payload):
+ })`
+ });
+ var snippetBasic2 = (model) => ({
+ content: `def query(payload):
  response = requests.post(API_URL, headers=headers, json=payload)
  return response.json()

  output = query({
  "inputs": ${getModelInputSnippet(model)},
- })`;
- var snippetFile2 = (model) => `def query(filename):
+ })`
+ });
+ var snippetFile2 = (model) => ({
+ content: `def query(filename):
  with open(filename, "rb") as f:
  data = f.read()
  response = requests.post(API_URL, headers=headers, data=data)
  return response.json()

- output = query(${getModelInputSnippet(model)})`;
- var snippetTextToImage = (model) => `def query(payload):
+ output = query(${getModelInputSnippet(model)})`
+ });
+ var snippetTextToImage = (model) => ({
+ content: `def query(payload):
  response = requests.post(API_URL, headers=headers, json=payload)
  return response.content
  image_bytes = query({
@@ -6474,16 +6686,20 @@ image_bytes = query({
  # You can access the image with PIL.Image for example
  import io
  from PIL import Image
- image = Image.open(io.BytesIO(image_bytes))`;
- var snippetTabular = (model) => `def query(payload):
+ image = Image.open(io.BytesIO(image_bytes))`
+ });
+ var snippetTabular = (model) => ({
+ content: `def query(payload):
  response = requests.post(API_URL, headers=headers, json=payload)
  return response.content
  response = query({
  "inputs": {"data": ${getModelInputSnippet(model)}},
- })`;
+ })`
+ });
  var snippetTextToAudio = (model) => {
  if (model.library_name === "transformers") {
- return `def query(payload):
+ return {
+ content: `def query(payload):
  response = requests.post(API_URL, headers=headers, json=payload)
  return response.content

@@ -6492,9 +6708,11 @@ audio_bytes = query({
  })
  # You can access the audio with IPython.display for example
  from IPython.display import Audio
- Audio(audio_bytes)`;
+ Audio(audio_bytes)`
+ };
  } else {
- return `def query(payload):
+ return {
+ content: `def query(payload):
  response = requests.post(API_URL, headers=headers, json=payload)
  return response.json()

@@ -6503,10 +6721,12 @@ audio, sampling_rate = query({
  })
  # You can access the audio with IPython.display for example
  from IPython.display import Audio
- Audio(audio, rate=sampling_rate)`;
+ Audio(audio, rate=sampling_rate)`
+ };
  }
  };
- var snippetDocumentQuestionAnswering = (model) => `def query(payload):
+ var snippetDocumentQuestionAnswering = (model) => ({
+ content: `def query(payload):
  with open(payload["image"], "rb") as f:
  img = f.read()
  payload["image"] = base64.b64encode(img).decode("utf-8")
@@ -6515,7 +6735,8 @@ var snippetDocumentQuestionAnswering = (model) => `def query(payload):

  output = query({
  "inputs": ${getModelInputSnippet(model)},
- })`;
+ })`
+ });
  var pythonSnippets = {
  // Same order as in tasks/src/pipelines.ts
  "text-classification": snippetBasic2,
@@ -6546,19 +6767,25 @@ var pythonSnippets = {
  "image-to-text": snippetFile2,
  "zero-shot-image-classification": snippetZeroShotImageClassification
  };
- function getPythonInferenceSnippet(model, accessToken) {
+ function getPythonInferenceSnippet(model, accessToken, opts) {
  if (model.pipeline_tag === "text-generation" && model.tags.includes("conversational")) {
- return snippetConversational(model, accessToken);
+ return snippetConversational(model, accessToken, opts);
  } else if (model.pipeline_tag === "image-text-to-text" && model.tags.includes("conversational")) {
  return snippetConversationalWithImage(model, accessToken);
  } else {
- const body = model.pipeline_tag && model.pipeline_tag in pythonSnippets ? pythonSnippets[model.pipeline_tag]?.(model, accessToken) ?? "" : "";
- return `import requests
-
+ let snippets = model.pipeline_tag && model.pipeline_tag in pythonSnippets ? pythonSnippets[model.pipeline_tag]?.(model, accessToken) ?? { content: "" } : { content: "" };
+ snippets = Array.isArray(snippets) ? snippets : [snippets];
+ return snippets.map((snippet) => {
+ return {
+ ...snippet,
+ content: `import requests
+
  API_URL = "https://api-inference.huggingface.co/models/${model.id}"
  headers = {"Authorization": ${accessToken ? `"Bearer ${accessToken}"` : `f"Bearer {API_TOKEN}"`}}
-
- ${body}`;
+
+ ${snippet.content}`
+ };
+ });
  }
  }
  function hasPythonInferenceSnippet(model) {
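Since conversational text-generation models now yield one snippet per client (huggingface_hub and openai, both pointed at the same OpenAI-compatible endpoint), getPythonInferenceSnippet returns an array of { client, content } objects. A hedged consumer sketch with an illustrative model object and token:

  const model = { id: "some-org/chat-model", pipeline_tag: "text-generation", tags: ["conversational"] };
  const snippets = getPythonInferenceSnippet(model, "hf_xxx", { streaming: false, max_tokens: 256 });
  for (const { client, content } of snippets) {
    console.log(`# client: ${client}`);
    console.log(content);
  }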
@@ -6579,7 +6806,8 @@ __export(js_exports, {
  snippetTextToImage: () => snippetTextToImage2,
  snippetZeroShotClassification: () => snippetZeroShotClassification3
  });
- var snippetBasic3 = (model, accessToken) => `async function query(data) {
+ var snippetBasic3 = (model, accessToken) => ({
+ content: `async function query(data) {
  const response = await fetch(
  "https://api-inference.huggingface.co/models/${model.id}",
  {
@@ -6597,27 +6825,120 @@ var snippetBasic3 = (model, accessToken) => `async function query(data) {

  query({"inputs": ${getModelInputSnippet(model)}}).then((response) => {
  console.log(JSON.stringify(response));
- });`;
- var snippetTextGeneration2 = (model, accessToken) => {
+ });`
+ });
+ var snippetTextGeneration2 = (model, accessToken, opts) => {
  if (model.tags.includes("conversational")) {
- return `import { HfInference } from "@huggingface/inference";
+ const streaming = opts?.streaming ?? true;
+ const messages = opts?.messages ?? [
+ { role: "user", content: "What is the capital of France?" }
+ ];
+ const messagesStr = stringifyMessages(messages, { sep: ",\n ", start: "[\n ", end: "\n ]" });
+ const config = {
+ ...opts?.temperature ? { temperature: opts.temperature } : void 0,
+ max_tokens: opts?.max_tokens ?? 500,
+ ...opts?.top_p ? { top_p: opts.top_p } : void 0
+ };
+ const configStr = stringifyGenerationConfig(config, {
+ sep: ",\n ",
+ start: "",
+ end: "",
+ attributeValueConnector: ": "
+ });
+ if (streaming) {
+ return [
+ {
+ client: "huggingface_hub",
+ content: `import { HfInference } from "@huggingface/inference"

- const inference = new HfInference("${accessToken || `{API_TOKEN}`}");
+ const client = new HfInference("${accessToken || `{API_TOKEN}`}")

- for await (const chunk of inference.chatCompletionStream({
+ let out = "";
+
+ const stream = client.chatCompletionStream({
  model: "${model.id}",
- messages: [{ role: "user", content: "What is the capital of France?" }],
- max_tokens: 500,
- })) {
- process.stdout.write(chunk.choices[0]?.delta?.content || "");
- }`;
+ messages: ${messagesStr},
+ ${configStr}
+ });
+
+ for await (const chunk of stream) {
+ if (chunk.choices && chunk.choices.length > 0) {
+ const newContent = chunk.choices[0].delta.content;
+ out += newContent;
+ console.log(newContent);
+ }
+ }`
+ },
+ {
+ client: "openai",
+ content: `import { OpenAI } from "openai"
+
+ const client = new OpenAI({
+ baseURL: "https://api-inference.huggingface.co/v1/",
+ apiKey: "${accessToken || `{API_TOKEN}`}"
+ })
+
+ let out = "";
+
+ const stream = await client.chat.completions.create({
+ model: "${model.id}",
+ messages: ${messagesStr},
+ ${configStr},
+ stream: true,
+ });
+
+ for await (const chunk of stream) {
+ if (chunk.choices && chunk.choices.length > 0) {
+ const newContent = chunk.choices[0].delta.content;
+ out += newContent;
+ console.log(newContent);
+ }
+ }`
+ }
+ ];
+ } else {
+ return [
+ {
+ client: "huggingface_hub",
+ content: `import { HfInference } from '@huggingface/inference'
+
+ const client = new HfInference("${accessToken || `{API_TOKEN}`}")
+
+ const chatCompletion = await client.chatCompletion({
+ model: "${model.id}",
+ messages: ${messagesStr},
+ ${configStr}
+ });
+
+ console.log(chatCompletion.choices[0].message);`
+ },
+ {
+ client: "openai",
+ content: `import { OpenAI } from "openai"
+
+ const client = new OpenAI({
+ baseURL: "https://api-inference.huggingface.co/v1/",
+ apiKey: "${accessToken || `{API_TOKEN}`}"
+ })
+
+ const chatCompletion = await client.chat.completions.create({
+ model: "${model.id}",
+ messages: ${messagesStr},
+ ${configStr}
+ });
+
+ console.log(chatCompletion.choices[0].message);`
+ }
+ ];
+ }
  } else {
  return snippetBasic3(model, accessToken);
  }
  };
  var snippetImageTextToTextGeneration2 = (model, accessToken) => {
  if (model.tags.includes("conversational")) {
- return `import { HfInference } from "@huggingface/inference";
+ return {
+ content: `import { HfInference } from "@huggingface/inference";

  const inference = new HfInference("${accessToken || `{API_TOKEN}`}");
  const imageUrl = "https://cdn.britannica.com/61/93061-050-99147DCE/Statue-of-Liberty-Island-New-York-Bay.jpg";
@@ -6636,12 +6957,14 @@ for await (const chunk of inference.chatCompletionStream({
  max_tokens: 500,
  })) {
  process.stdout.write(chunk.choices[0]?.delta?.content || "");
- }`;
+ }`
+ };
  } else {
  return snippetBasic3(model, accessToken);
  }
  };
- var snippetZeroShotClassification3 = (model, accessToken) => `async function query(data) {
+ var snippetZeroShotClassification3 = (model, accessToken) => ({
+ content: `async function query(data) {
  const response = await fetch(
  "https://api-inference.huggingface.co/models/${model.id}",
  {
@@ -6658,11 +6981,13 @@ var snippetZeroShotClassification3 = (model, accessToken) => `async function que
  }

  query({"inputs": ${getModelInputSnippet(
- model
- )}, "parameters": {"candidate_labels": ["refund", "legal", "faq"]}}).then((response) => {
+ model
+ )}, "parameters": {"candidate_labels": ["refund", "legal", "faq"]}}).then((response) => {
  console.log(JSON.stringify(response));
- });`;
- var snippetTextToImage2 = (model, accessToken) => `async function query(data) {
+ });`
+ });
+ var snippetTextToImage2 = (model, accessToken) => ({
+ content: `async function query(data) {
  const response = await fetch(
  "https://api-inference.huggingface.co/models/${model.id}",
  {
@@ -6679,7 +7004,8 @@ var snippetTextToImage2 = (model, accessToken) => `async function query(data) {
  }
  query({"inputs": ${getModelInputSnippet(model)}}).then((response) => {
  // Use image
- });`;
+ });`
+ });
  var snippetTextToAudio2 = (model, accessToken) => {
  const commonSnippet = `async function query(data) {
  const response = await fetch(
@@ -6694,25 +7020,30 @@ var snippetTextToAudio2 = (model, accessToken) => {
  }
  );`;
  if (model.library_name === "transformers") {
- return commonSnippet + `
+ return {
+ content: commonSnippet + `
  const result = await response.blob();
  return result;
  }
  query({"inputs": ${getModelInputSnippet(model)}}).then((response) => {
  // Returns a byte object of the Audio wavform. Use it directly!
- });`;
+ });`
+ };
  } else {
- return commonSnippet + `
+ return {
+ content: commonSnippet + `
  const result = await response.json();
  return result;
  }

  query({"inputs": ${getModelInputSnippet(model)}}).then((response) => {
  console.log(JSON.stringify(response));
- });`;
+ });`
+ };
  }
  };
- var snippetFile3 = (model, accessToken) => `async function query(filename) {
+ var snippetFile3 = (model, accessToken) => ({
+ content: `async function query(filename) {
  const data = fs.readFileSync(filename);
  const response = await fetch(
  "https://api-inference.huggingface.co/models/${model.id}",
@@ -6731,7 +7062,8 @@ var snippetFile3 = (model, accessToken) => `async function query(filename) {

  query(${getModelInputSnippet(model)}).then((response) => {
  console.log(JSON.stringify(response));
- });`;
+ });`
+ });
  var jsSnippets = {
  // Same order as in js/src/lib/interfaces/Types.ts
  "text-classification": snippetBasic3,
@@ -6759,7 +7091,7 @@ var jsSnippets = {
  "image-segmentation": snippetFile3
  };
  function getJsInferenceSnippet(model, accessToken) {
- return model.pipeline_tag && model.pipeline_tag in jsSnippets ? jsSnippets[model.pipeline_tag]?.(model, accessToken) ?? "" : "";
+ return model.pipeline_tag && model.pipeline_tag in jsSnippets ? jsSnippets[model.pipeline_tag]?.(model, accessToken) ?? { content: "" } : { content: "" };
  }
  function hasJsInferenceSnippet(model) {
  return !!model.pipeline_tag && model.pipeline_tag in jsSnippets;
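As with the Python side, getJsInferenceSnippet returns a single { content } object for most tasks but an array of { client, content } pairs for conversational text generation, so callers should normalize before rendering. A minimal sketch:

  const result = getJsInferenceSnippet(model, accessToken);
  const snippets = Array.isArray(result) ? result : [result];
  for (const s of snippets) console.log(s.content);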
@@ -6826,6 +7158,11 @@ var SKUS = {
  tflops: 31.24,
  memory: [24]
  },
+ A2: {
+ tflops: 4.531,
+ // source: https://www.techpowerup.com/gpu-specs/a2.c3848
+ memory: [16]
+ },
  "RTX 4090": {
  tflops: 82.58,
  memory: [24]
@@ -6988,6 +7325,14 @@ var SKUS = {
  tflops: 184.6,
  memory: [32]
  },
+ MI60: {
+ tflops: 29.5,
+ memory: [32]
+ },
+ MI50: {
+ tflops: 26.5,
+ memory: [16]
+ },
  "RX 7900 XTX": {
  tflops: 122.8,
  memory: [24]
@@ -7020,6 +7365,14 @@ var SKUS = {
  tflops: 32.33,
  memory: [16]
  },
+ "RX 6700 XT": {
+ tflops: 26.43,
+ memory: [12]
+ },
+ "RX 6700": {
+ tflops: 22.58,
+ memory: [10]
+ },
  "Radeon Pro VII": {
  tflops: 26.11,
  memory: [16]
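The new GPU entries (A2, MI60, MI50, RX 6700 XT, RX 6700) follow the existing SKU shape: peak tflops plus a list of memory configurations in GB. A hedged sketch of a memory-fit check over such a table — the fp16 sizing rule (2 bytes per parameter) is an illustrative assumption, not something this package computes:

  // `skus` is assumed to be one vendor's table containing entries like those above
  function fitsInMemory(skus, name, paramsBillions) {
    const weightsGB = paramsBillions * 2; // fp16 weights only; ignores activations and KV cache
    return skus[name].memory.some((gb) => gb >= weightsGB);
  }
  // fitsInMemory(skus, "A2", 7)      -> true  (16 GB >= ~14 GB)
  // fitsInMemory(skus, "RX 6700", 7) -> false (10 GB <  ~14 GB)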