ipex-llm 2.2.0b20250114__py3-none-win_amd64.whl → 2.2.0b20250116__py3-none-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (43)
  1. ipex_llm/ggml/quantize.py +1 -0
  2. ipex_llm/libs/bloom-api.dll +0 -0
  3. ipex_llm/libs/bloom.dll +0 -0
  4. ipex_llm/libs/gptneox-api.dll +0 -0
  5. ipex_llm/libs/gptneox.dll +0 -0
  6. ipex_llm/libs/libbloom_avx.dll +0 -0
  7. ipex_llm/libs/libbloom_vnni.dll +0 -0
  8. ipex_llm/libs/libgptneox_avx.dll +0 -0
  9. ipex_llm/libs/libgptneox_vnni.dll +0 -0
  10. ipex_llm/libs/libllama_avx.dll +0 -0
  11. ipex_llm/libs/libllama_vnni.dll +0 -0
  12. ipex_llm/libs/libstarcoder_avx.dll +0 -0
  13. ipex_llm/libs/libstarcoder_vnni.dll +0 -0
  14. ipex_llm/libs/llama-api.dll +0 -0
  15. ipex_llm/libs/llama.dll +0 -0
  16. ipex_llm/libs/main-bloom.exe +0 -0
  17. ipex_llm/libs/main-gptneox.exe +0 -0
  18. ipex_llm/libs/main-llama.exe +0 -0
  19. ipex_llm/libs/main-starcoder.exe +0 -0
  20. ipex_llm/libs/pipeline.dll +0 -0
  21. ipex_llm/libs/quantize-bloom.exe +0 -0
  22. ipex_llm/libs/quantize-bloom_vnni.exe +0 -0
  23. ipex_llm/libs/quantize-gptneox.exe +0 -0
  24. ipex_llm/libs/quantize-gptneox_vnni.exe +0 -0
  25. ipex_llm/libs/quantize-llama.exe +0 -0
  26. ipex_llm/libs/quantize-llama_vnni.exe +0 -0
  27. ipex_llm/libs/quantize-starcoder.exe +0 -0
  28. ipex_llm/libs/quantize-starcoder_vnni.exe +0 -0
  29. ipex_llm/libs/starcoder-api.dll +0 -0
  30. ipex_llm/libs/starcoder.dll +0 -0
  31. ipex_llm/transformers/convert.py +29 -1
  32. ipex_llm/transformers/low_bit_linear.py +7 -6
  33. ipex_llm/transformers/models/llama.py +13 -2
  34. ipex_llm/transformers/models/utils.py +4 -4
  35. ipex_llm/transformers/models/whisper.py +103 -0
  36. {ipex_llm-2.2.0b20250114.dist-info → ipex_llm-2.2.0b20250116.dist-info}/METADATA +23 -20
  37. {ipex_llm-2.2.0b20250114.dist-info → ipex_llm-2.2.0b20250116.dist-info}/RECORD +43 -42
  38. {ipex_llm-2.2.0b20250114.data → ipex_llm-2.2.0b20250116.data}/scripts/ipex-llm-init.bat +0 -0
  39. {ipex_llm-2.2.0b20250114.data → ipex_llm-2.2.0b20250116.data}/scripts/llm-chat.ps1 +0 -0
  40. {ipex_llm-2.2.0b20250114.data → ipex_llm-2.2.0b20250116.data}/scripts/llm-cli.ps1 +0 -0
  41. {ipex_llm-2.2.0b20250114.dist-info → ipex_llm-2.2.0b20250116.dist-info}/WHEEL +0 -0
  42. {ipex_llm-2.2.0b20250114.dist-info → ipex_llm-2.2.0b20250116.dist-info}/entry_points.txt +0 -0
  43. {ipex_llm-2.2.0b20250114.dist-info → ipex_llm-2.2.0b20250116.dist-info}/top_level.txt +0 -0
ipex_llm/ggml/quantize.py CHANGED
@@ -53,6 +53,7 @@ ggml_tensor_qtype = {"sym_int4": 2, # q4_0 in ggml
                      "sym_int4_rtn": 31,
                      "sym_int8_rtn": 32,
                      "asym_int4_rtn": 33,
+                     "woq_int4": 34,
                      }

 # mixed precison from llama.cpp
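Note: the keys of ggml_tensor_qtype are the same strings ipex-llm accepts for low-bit loading, so the new entry should be requestable at load time. A minimal sketch, assuming "woq_int4" is wired through load_in_low_bit like the existing keys (the model id is illustrative):

# Sketch only: assumes the new "woq_int4" key is accepted by
# load_in_low_bit like the existing ggml_tensor_qtype entries.
from ipex_llm.transformers import AutoModelForCausalLM

model = AutoModelForCausalLM.from_pretrained(
    "meta-llama/Llama-2-7b-chat-hf",  # illustrative model id
    load_in_low_bit="woq_int4",       # new qtype, id 34 in this release
    trust_remote_code=True,
)
model = model.to("xpu")  # the new id is gated to XPU kernel paths below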
ipex_llm/libs/*.dll, ipex_llm/libs/*.exe CHANGED
Binary files (entries 2-30 in the file list above) differ between the two wheels; no textual diff is available for them. Their new hashes appear in the RECORD diff below.
ipex_llm/transformers/convert.py CHANGED
@@ -995,8 +995,9 @@ def _optimize_pre(model, qtype=None):
         from ipex_llm.transformers.models.gemma2 import merge_qkv
         model.apply(merge_qkv)
     elif model.config.model_type == "llama":
-        from ipex_llm.transformers.models.llama import merge_qkv
+        from ipex_llm.transformers.models.llama import merge_qkv, pre_compute_inv_freq
         model.apply(merge_qkv)
+        model.apply(pre_compute_inv_freq)
     elif model.config.model_type == "mllama":
         from ipex_llm.transformers.models.mllama import merge_qkv
         model.apply(merge_qkv)
@@ -1027,6 +1028,15 @@ def _optimize_pre(model, qtype=None):
         model.llm.config.model_type = "minicpm"
         _optimize_pre(model.llm, qtype=qtype)
         model.llm.config.model_type = "minicpmv"
+    elif model.config.model_type == "minicpmo":
+        # vpm opt
+        if hasattr(model, "vpm"):
+            from ipex_llm.transformers.models.minicpmv import merge_qkv
+            model.vpm.apply(merge_qkv)
+        # llm opt
+        model.llm.config.model_type = "qwen2"
+        _optimize_pre(model.llm, qtype=qtype)
+        model.llm.config.model_type = "minicpmo"
     elif model.config.model_type == "megrezo":
         from ipex_llm.transformers.models.minicpmv import merge_qkv
         model.vision.apply(merge_qkv)
@@ -1943,6 +1953,24 @@ def _optimize_post(model):
         convert_forward(model.vpm, vpm_module.Idefics2VisionAttention, siglip_attention_forward)
         minicpmv_chat = minicpmv_chat_wrapper(module.MiniCPMV.chat)
         model.chat = MethodType(minicpmv_chat, model)
+    elif model.config.model_type == "minicpmo":
+        # vpm opt
+        if hasattr(model, "vpm"):
+            vpm_modeling_module_name = model.vpm.__class__.__module__
+            vpm_module = importlib.import_module(vpm_modeling_module_name)
+            from ipex_llm.transformers.models.minicpmv import siglip_attention_forward
+            convert_forward(model.vpm, vpm_module.SiglipAttention, siglip_attention_forward)
+        # apm opt
+        if hasattr(model, "apm"):
+            apm_modeling_module_name = model.apm.__class__.__module__
+            apm_module = importlib.import_module(apm_modeling_module_name)
+            from transformers.models.whisper.modeling_whisper import WhisperSdpaAttention
+            from ipex_llm.transformers.models.whisper import whisper_attention_forward
+            convert_forward(model.apm, WhisperSdpaAttention, whisper_attention_forward)
+        # llm opt
+        model.llm.config.model_type = "qwen2"
+        _optimize_post(model.llm)
+        model.llm.config.model_type = "minicpmo"
     elif model.config.model_type == "megrezo":
         modeling_module_name = model.__class__.__module__
         module = importlib.import_module(modeling_module_name)
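Note: both minicpmo branches above reuse the existing qwen2 optimizations by temporarily relabeling the language tower's config.model_type, then restoring it. A hedged sketch of that relabel-and-restore pattern (the helper below is illustrative, not part of the diff):

def _optimize_as(llm, borrowed_type, optimize_fn, **kwargs):
    # Hypothetical helper showing the pattern used in _optimize_pre and
    # _optimize_post above; not part of ipex-llm itself.
    original_type = llm.config.model_type
    llm.config.model_type = borrowed_type
    try:
        optimize_fn(llm, **kwargs)
    finally:
        llm.config.model_type = original_type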
ipex_llm/transformers/low_bit_linear.py CHANGED
@@ -84,6 +84,7 @@ FP6_K = ggml_tensor_qtype["fp6_k"]
 SYM_INT4_RTN = ggml_tensor_qtype["sym_int4_rtn"]
 SYM_INT8_RTN = ggml_tensor_qtype["sym_int8_rtn"]
 ASYM_INT4_RTN = ggml_tensor_qtype["asym_int4_rtn"]
+WOQ_INT4 = ggml_tensor_qtype["woq_int4"]
 RTN_DTYPE = {
     SYM_INT4_RTN: torch.uint8,
     ASYM_INT4_RTN: torch.uint8,
@@ -187,7 +188,7 @@ def ggml_q_format_convet_cpu2xpu(tensor: torch.Tensor, num_elem: int, qtype: int
     src = ctypes.c_void_p(tensor.data.data_ptr())

     if qtype in [SYM_INT4, ASYM_INT4, SYM_INT8, NF4, NF3, FP4, FP6, FP8E4, FP8E5,
-                 Q4_K, Q6_K, FP6_K]:
+                 Q4_K, Q6_K, FP6_K, WOQ_INT4]:
         dst_tensor = torch.empty_like(tensor)
     elif qtype == ggml_tensor_qtype["sym_int5"]:
         QK = ggml.ggml_qk_size(qtype)
@@ -213,7 +214,7 @@ def ggml_q_format_convet_xpu2cpu(tensor: torch.Tensor, num_elem: int, qtype: int
     src = ctypes.c_void_p(tensor.data.data_ptr())

     if qtype in [SYM_INT4, ASYM_INT4, SYM_INT8, NF4, NF3, FP4, FP6, FP8E4, FP8E5,
-                 Q4_K, Q6_K, FP6_K]:
+                 Q4_K, Q6_K, FP6_K, WOQ_INT4]:
         dst_tensor = torch.empty_like(tensor)
     elif qtype == ggml_tensor_qtype["sym_int5"]:
         QK = ggml.ggml_qk_size(ggml_tensor_qtype["asym_int5"])
@@ -272,7 +273,7 @@ def use_batch_forward(x: torch.Tensor, qtype: int, output_len: int):
         and x.shape[1] % 128 == 0
         and (
             (
-                qtype in [SYM_INT4, ASYM_INT4, FP8E5, FP8E4]
+                qtype in [SYM_INT4, ASYM_INT4, FP8E5, FP8E4, WOQ_INT4]
                 and (
                     batch_size <= 48
                     or (
@@ -283,7 +284,7 @@ def use_batch_forward(x: torch.Tensor, qtype: int, output_len: int):
                 )
             )
             or (
-                qtype in [SYM_INT8, FP4, FP6, Q4_K, Q6_K]
+                qtype in [SYM_INT8, FP4, FP6, Q4_K, Q6_K, WOQ_INT4]
                 and batch_size <= 48
                 and device_name in ["arc", "pvc", "mtl", "arl"]
                 and x.shape[1] % 256 == 0
@@ -296,8 +297,8 @@ def use_batch_forward(x: torch.Tensor, qtype: int, output_len: int):
             batch_size > 1
             or (device_name in ["arc"] and qtype in [SYM_INT8, FP4])
             or (device_name in ["arc", "mtl"] and qtype in [FP8E4])
-            or (device_name in ["lnl"] and qtype in [SYM_INT4] and x.shape[1] % 512 == 0)
-            or (device_name in ["bmg"] and qtype in [SYM_INT4, FP8E5])
+            or (device_name in ["lnl"] and qtype in [SYM_INT4, WOQ_INT4] and x.shape[1] % 512 == 0)
+            or (device_name in ["bmg"] and qtype in [SYM_INT4, WOQ_INT4, FP8E5])
         )
     return False

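All of the gating changes above key off a single new constant, resolved from the qtype table extended in quantize.py. A quick sanity check, using only names present in this diff:

from ipex_llm.ggml.quantize import ggml_tensor_qtype

WOQ_INT4 = ggml_tensor_qtype["woq_int4"]
assert WOQ_INT4 == 34  # id introduced in this release, per the hunk above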
ipex_llm/transformers/models/llama.py CHANGED
@@ -119,6 +119,13 @@ def merge_qkv(module: torch.nn.Module):
     merge_qkv_base(module, LlamaAttention)


+def pre_compute_inv_freq(module: torch.nn.Module):
+    if module.__class__.__name__ == "LlamaLinearScalingRotaryEmbedding":
+        if hasattr(module, "scaling_factor"):
+            module.register_buffer("inv_freq_scaled", None, persistent=False)
+            module.inv_freq_scaled = module.inv_freq / module.scaling_factor
+
+
 def llama_attention_forward(
     self,
     hidden_states: torch.Tensor,
@@ -147,8 +154,12 @@ def llama_attention_forward(
         import xe_addons
         if hasattr(self, "rotary_emb"):
             # transformers < 4.46
-            xe_addons.rotary_half_inplaced(self.rotary_emb.inv_freq, position_ids,
-                                           query_states, key_states)
+            if hasattr(self.rotary_emb, "inv_freq_scaled"):
+                xe_addons.rotary_half_inplaced(self.rotary_emb.inv_freq_scaled, position_ids,
+                                               query_states, key_states)
+            else:
+                xe_addons.rotary_half_inplaced(self.rotary_emb.inv_freq, position_ids,
+                                               query_states, key_states)
         else:
             # transformers >= 4.46
             cos, sin = position_embeddings
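Note: HF's LlamaLinearScalingRotaryEmbedding divides position ids by scaling_factor, and since each rotary angle is position * inv_freq, dividing inv_freq once up front is algebraically identical. That is what pre_compute_inv_freq caches, so the fused xe_addons kernel can keep consuming a plain inv_freq tensor. A small self-contained check of the identity:

import torch

# angle(p / s, f) == angle(p, f / s) for every position p and frequency f
inv_freq = 1.0 / (10000.0 ** (torch.arange(0, 64, 2).float() / 64))
scaling_factor = 4.0
position_ids = torch.arange(32).float()

a = torch.outer(position_ids / scaling_factor, inv_freq)   # scale positions
b = torch.outer(position_ids, inv_freq / scaling_factor)   # scale frequencies
assert torch.allclose(a, b)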
ipex_llm/transformers/models/utils.py CHANGED
@@ -21,7 +21,7 @@ from ipex_llm.utils.common import invalidInputError
 from ipex_llm.ggml.quantize import ggml_tensor_qtype
 from ipex_llm.transformers.utils import get_xpu_device_name
 from ipex_llm.transformers.low_bit_linear import SYM_INT4, SYM_INT8, FP8E5, IQ2_XXS, FP4, FP8E4,\
-    FP6, ASYM_INT4
+    FP6, ASYM_INT4, WOQ_INT4

 FP8_KV_ALLOC_LENGTH = 512
 KV_CACHE_ALLOC_BLOCK_LENGTH = int(os.environ.get("KV_CACHE_ALLOC_BLOCK_LENGTH", 256))
@@ -33,7 +33,7 @@ GELU = 1

 def decoding_fast_path_qtype_check(proj):
     qtype = getattr(proj, "qtype", None)
-    return qtype in [SYM_INT4, FP8E5, FP4]
+    return qtype in [SYM_INT4, FP8E5, FP4, WOQ_INT4]


 def init_kv_cache(batch_size, num_heads, head_dim, current_length, max_length, dtype, device):
@@ -248,7 +248,7 @@ def mlp_fusion_check(x, qtype, training):
         return False
     if x.device.type != 'xpu':
         return False
-    if qtype not in [SYM_INT4, FP8E5, FP4, IQ2_XXS, FP6]:
+    if qtype not in [SYM_INT4, FP8E5, FP4, IQ2_XXS, FP6, WOQ_INT4]:
         return False
     if training or x.requires_grad:
         return False
@@ -263,7 +263,7 @@ def use_xmx(x: torch.Tensor, qtype: int):
     device = get_xpu_device_name(x.device)
     return (
         device in ["arc", "pvc"]
-        and qtype in [SYM_INT4, SYM_INT8, FP8E4, FP8E5]
+        and qtype in [SYM_INT4, SYM_INT8, FP8E4, FP8E5, WOQ_INT4]
         and (
             (device == "pvc" and 1 < x.size(0) <= 16)
             or
ipex_llm/transformers/models/whisper.py ADDED
@@ -0,0 +1,103 @@
+#
+# Copyright 2016 The BigDL Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+# Some parts of this file is adapted from
+# https://github.com/huggingface/transformers/blob/main/src/transformers/models/whisper/modeling_whisper.py
+# which is licensed under Apache License 2.0:
+#
+# Copyright 2022 The OpenAI Authors and The HuggingFace Inc. team. All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+import torch
+
+from typing import Optional, Tuple
+from transformers.cache_utils import EncoderDecoderCache
+
+from ipex_llm.transformers.utils import invalidInputError
+from ipex_llm.transformers.models.common import scaled_dot_product_attention
+
+
+def whisper_attention_forward(
+    self,
+    hidden_states: torch.Tensor,
+    key_value_states: Optional[torch.Tensor] = None,
+    past_key_value: Optional[EncoderDecoderCache] = None,
+    attention_mask: Optional[torch.Tensor] = None,
+    layer_head_mask: Optional[torch.Tensor] = None,
+    output_attentions: bool = False,
+    cache_position: Optional[torch.LongTensor] = None,
+) -> Tuple[torch.Tensor, Optional[torch.Tensor], Optional[Tuple[torch.Tensor]]]:
+    invalidInputError(not output_attentions and layer_head_mask is None,
+                      "`output_attentions` and `layer_head_mask` are not supported")
+
+    # if key_value_states are provided this layer is used as a cross-attention layer
+    # for the decoder
+    is_cross_attention = key_value_states is not None
+    bsz, tgt_len, _ = hidden_states.size()
+
+    # get query proj
+    query_states = self._shape(self.q_proj(hidden_states), tgt_len, bsz)
+
+    if past_key_value is not None:
+        is_updated = past_key_value.is_updated.get(self.layer_idx)
+        if is_cross_attention:
+            past_key_value.is_updated[self.layer_idx] = True
+            past_key_value = past_key_value.cross_attention_cache
+        else:
+            past_key_value = past_key_value.self_attention_cache
+
+    # use key_value_states if cross attention
+    current_states = key_value_states if key_value_states is not None else hidden_states
+    if is_cross_attention and past_key_value and is_updated:
+        # reuse k,v, cross_attentions
+        key_states = past_key_value.key_cache[self.layer_idx]
+        value_states = past_key_value.value_cache[self.layer_idx]
+    else:
+        key_states = self._shape(self.k_proj(current_states), -1, bsz)
+        value_states = self._shape(self.v_proj(current_states), -1, bsz)
+        if past_key_value is not None:
+            cache_position = cache_position if not is_cross_attention else None
+            key_states, value_states = past_key_value.update(
+                key_states, value_states, self.layer_idx, {"cache_position": cache_position}
+            )
+
+    # IPEX-LLM OPT: sdpa
+    is_causal = True if self.is_causal and attention_mask is None and tgt_len > 1 else False
+    attn_output = scaled_dot_product_attention(
+        query_states,
+        key_states.contiguous(),
+        value_states.contiguous(),
+        attention_mask,
+        is_causal
+    )
+
+    attn_output = attn_output.transpose(1, 2)
+    attn_output = attn_output.reshape(bsz, tgt_len, self.embed_dim)
+
+    attn_output = self.out_proj(attn_output)
+
+    return attn_output, None, past_key_value
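Note: the forward above delegates the attention math to ipex_llm's scaled_dot_product_attention helper. Assuming it follows the same tensor contract as torch.nn.functional.scaled_dot_product_attention (the standard operator it optimizes over, which is an assumption here), the shape flow mirrors this:

import torch
import torch.nn.functional as F

# Assumed contract: SDPA takes (bsz, num_heads, seq_len, head_dim) tensors
# and returns the same layout, which the forward then transposes and
# reshapes back to (bsz, tgt_len, embed_dim).
bsz, num_heads, tgt_len, head_dim = 1, 8, 16, 64
q = torch.randn(bsz, num_heads, tgt_len, head_dim)
k = torch.randn(bsz, num_heads, tgt_len, head_dim)
v = torch.randn(bsz, num_heads, tgt_len, head_dim)

out = F.scaled_dot_product_attention(q, k, v, is_causal=True)
out = out.transpose(1, 2).reshape(bsz, tgt_len, num_heads * head_dim)
assert out.shape == (bsz, tgt_len, num_heads * head_dim)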
{ipex_llm-2.2.0b20250114.dist-info → ipex_llm-2.2.0b20250116.dist-info}/METADATA CHANGED
@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: ipex-llm
-Version: 2.2.0b20250114
+Version: 2.2.0b20250116
 Summary: Large Language Model Develop Toolkit
 Home-page: https://github.com/intel-analytics/ipex-llm
 Author: BigDL Authors
@@ -27,10 +27,10 @@ Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine
 Requires-Dist: torch ==2.1.2+cpu ; (platform_system == "Linux") and extra == 'all'
 Requires-Dist: torch ==2.1.2 ; (platform_system == "Windows") and extra == 'all'
 Provides-Extra: cpp
-Requires-Dist: bigdl-core-cpp ==2.6.0b20250114 ; extra == 'cpp'
+Requires-Dist: bigdl-core-cpp ==2.6.0b20250116 ; extra == 'cpp'
 Requires-Dist: setuptools ; extra == 'cpp'
 Provides-Extra: cpp-arl
-Requires-Dist: bigdl-core-cpp ==2.6.0b20250114 ; extra == 'cpp-arl'
+Requires-Dist: bigdl-core-cpp ==2.6.0b20250116 ; extra == 'cpp-arl'
 Requires-Dist: setuptools ; extra == 'cpp-arl'
 Requires-Dist: onednn-devel ==2024.1.1 ; (platform_system == "Windows") and extra == 'cpp-arl'
 Requires-Dist: onednn ==2024.1.1 ; (platform_system == "Windows") and extra == 'cpp-arl'
@@ -67,7 +67,7 @@ Requires-Dist: transformers ==4.40.0 ; extra == 'npu'
 Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'npu'
 Requires-Dist: torch ==2.1.2+cpu ; (platform_system == "Linux") and extra == 'npu'
 Requires-Dist: torch ==2.1.2 ; (platform_system == "Windows") and extra == 'npu'
-Requires-Dist: bigdl-core-npu ==2.6.0b20250114 ; (platform_system == "Windows") and extra == 'npu'
+Requires-Dist: bigdl-core-npu ==2.6.0b20250116 ; (platform_system == "Windows") and extra == 'npu'
 Provides-Extra: serving
 Requires-Dist: py-cpuinfo ; extra == 'serving'
 Requires-Dist: fschat[model_worker,webui] ==0.2.36 ; extra == 'serving'
@@ -87,9 +87,9 @@ Requires-Dist: setuptools <70.0.0 ; extra == 'xpu'
 Requires-Dist: torch ==2.1.0a0 ; extra == 'xpu'
 Requires-Dist: torchvision ==0.16.0a0 ; extra == 'xpu'
 Requires-Dist: intel-extension-for-pytorch ==2.1.10+xpu ; extra == 'xpu'
-Requires-Dist: bigdl-core-xe-21 ==2.6.0b20250114 ; extra == 'xpu'
-Requires-Dist: bigdl-core-xe-batch-21 ==2.6.0b20250114 ; extra == 'xpu'
-Requires-Dist: bigdl-core-xe-addons-21 ==2.6.0b20250114 ; extra == 'xpu'
+Requires-Dist: bigdl-core-xe-21 ==2.6.0b20250116 ; extra == 'xpu'
+Requires-Dist: bigdl-core-xe-batch-21 ==2.6.0b20250116 ; extra == 'xpu'
+Requires-Dist: bigdl-core-xe-addons-21 ==2.6.0b20250116 ; extra == 'xpu'
 Provides-Extra: xpu-2-1
 Requires-Dist: py-cpuinfo ; extra == 'xpu-2-1'
 Requires-Dist: protobuf ; extra == 'xpu-2-1'
@@ -104,9 +104,9 @@ Requires-Dist: setuptools <70.0.0 ; extra == 'xpu-2-1'
 Requires-Dist: torch ==2.1.0a0 ; extra == 'xpu-2-1'
 Requires-Dist: torchvision ==0.16.0a0 ; extra == 'xpu-2-1'
 Requires-Dist: intel-extension-for-pytorch ==2.1.10+xpu ; extra == 'xpu-2-1'
-Requires-Dist: bigdl-core-xe-21 ==2.6.0b20250114 ; extra == 'xpu-2-1'
-Requires-Dist: bigdl-core-xe-batch-21 ==2.6.0b20250114 ; extra == 'xpu-2-1'
-Requires-Dist: bigdl-core-xe-addons-21 ==2.6.0b20250114 ; extra == 'xpu-2-1'
+Requires-Dist: bigdl-core-xe-21 ==2.6.0b20250116 ; extra == 'xpu-2-1'
+Requires-Dist: bigdl-core-xe-batch-21 ==2.6.0b20250116 ; extra == 'xpu-2-1'
+Requires-Dist: bigdl-core-xe-addons-21 ==2.6.0b20250116 ; extra == 'xpu-2-1'
 Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'xpu-2-1'
 Requires-Dist: dpcpp-cpp-rt ==2024.0.2 ; (platform_system == "Windows") and extra == 'xpu-2-1'
 Requires-Dist: mkl-dpcpp ==2024.0.0 ; (platform_system == "Windows") and extra == 'xpu-2-1'
@@ -124,7 +124,10 @@ Requires-Dist: setuptools ; extra == 'xpu-2-6'
 Requires-Dist: torch ==2.6.0+xpu ; extra == 'xpu-2-6'
 Requires-Dist: torchvision ==0.21.0+xpu ; extra == 'xpu-2-6'
 Requires-Dist: torchaudio ==2.6.0+xpu ; extra == 'xpu-2-6'
-Requires-Dist: bigdl-core-xe-all ==2.6.0b20250114 ; extra == 'xpu-2-6'
+Requires-Dist: bigdl-core-xe-all ==2.6.0b20250116 ; extra == 'xpu-2-6'
+Requires-Dist: onednn-devel ==2025.0.1 ; extra == 'xpu-2-6'
+Requires-Dist: onednn ==2025.0.1 ; extra == 'xpu-2-6'
+Requires-Dist: dpcpp-cpp-rt ==2025.0.2 ; extra == 'xpu-2-6'
 Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'xpu-2-6'
 Provides-Extra: xpu-arc
 Requires-Dist: py-cpuinfo ; extra == 'xpu-arc'
@@ -137,9 +140,9 @@ Requires-Dist: tokenizers ==0.15.2 ; extra == 'xpu-arc'
 Requires-Dist: accelerate ==0.23.0 ; extra == 'xpu-arc'
 Requires-Dist: tabulate ; extra == 'xpu-arc'
 Requires-Dist: setuptools ; extra == 'xpu-arc'
-Requires-Dist: bigdl-core-xe-23 ==2.6.0b20250114 ; extra == 'xpu-arc'
-Requires-Dist: bigdl-core-xe-batch-23 ==2.6.0b20250114 ; extra == 'xpu-arc'
-Requires-Dist: bigdl-core-xe-addons-23 ==2.6.0b20250114 ; extra == 'xpu-arc'
+Requires-Dist: bigdl-core-xe-23 ==2.6.0b20250116 ; extra == 'xpu-arc'
+Requires-Dist: bigdl-core-xe-batch-23 ==2.6.0b20250116 ; extra == 'xpu-arc'
+Requires-Dist: bigdl-core-xe-addons-23 ==2.6.0b20250116 ; extra == 'xpu-arc'
 Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'xpu-arc'
 Requires-Dist: torch ==2.3.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-arc'
 Requires-Dist: torchvision ==0.18.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-arc'
@@ -160,9 +163,9 @@ Requires-Dist: tokenizers ==0.15.2 ; extra == 'xpu-arl'
 Requires-Dist: accelerate ==0.23.0 ; extra == 'xpu-arl'
 Requires-Dist: tabulate ; extra == 'xpu-arl'
 Requires-Dist: setuptools ; extra == 'xpu-arl'
-Requires-Dist: bigdl-core-xe-23 ==2.6.0b20250114 ; extra == 'xpu-arl'
-Requires-Dist: bigdl-core-xe-batch-23 ==2.6.0b20250114 ; extra == 'xpu-arl'
-Requires-Dist: bigdl-core-xe-addons-23 ==2.6.0b20250114 ; extra == 'xpu-arl'
+Requires-Dist: bigdl-core-xe-23 ==2.6.0b20250116 ; extra == 'xpu-arl'
+Requires-Dist: bigdl-core-xe-batch-23 ==2.6.0b20250116 ; extra == 'xpu-arl'
+Requires-Dist: bigdl-core-xe-addons-23 ==2.6.0b20250116 ; extra == 'xpu-arl'
 Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'xpu-arl'
 Requires-Dist: torch ==2.3.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-arl'
 Requires-Dist: torchvision ==0.18.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-arl'
@@ -183,9 +186,9 @@ Requires-Dist: tokenizers ==0.15.2 ; extra == 'xpu-lnl'
 Requires-Dist: accelerate ==0.23.0 ; extra == 'xpu-lnl'
 Requires-Dist: tabulate ; extra == 'xpu-lnl'
 Requires-Dist: setuptools ; extra == 'xpu-lnl'
-Requires-Dist: bigdl-core-xe-23 ==2.6.0b20250114 ; extra == 'xpu-lnl'
-Requires-Dist: bigdl-core-xe-batch-23 ==2.6.0b20250114 ; extra == 'xpu-lnl'
-Requires-Dist: bigdl-core-xe-addons-23 ==2.6.0b20250114 ; extra == 'xpu-lnl'
+Requires-Dist: bigdl-core-xe-23 ==2.6.0b20250116 ; extra == 'xpu-lnl'
+Requires-Dist: bigdl-core-xe-batch-23 ==2.6.0b20250116 ; extra == 'xpu-lnl'
+Requires-Dist: bigdl-core-xe-addons-23 ==2.6.0b20250116 ; extra == 'xpu-lnl'
 Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'xpu-lnl'
 Requires-Dist: torch ==2.3.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-lnl'
 Requires-Dist: torchvision ==0.18.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-lnl'
{ipex_llm-2.2.0b20250114.dist-info → ipex_llm-2.2.0b20250116.dist-info}/RECORD CHANGED
@@ -9,7 +9,7 @@ ipex_llm/cli/prompts/chat-with-llm.txt,sha256=PpSyd4FQQd-T7ptfXL9jZp7dgstevu1fsx
 ipex_llm/ggml/__init__.py,sha256=FzapYBUiTdZf0LzlN9hfJI-HE1OTi_2dzaYELJ9Mw8s,1272
 ipex_llm/ggml/convert.py,sha256=xfWH1E_hivbsxVo8h00STjH1Rlu9-dZQkCLLeIs1TWA,5286
 ipex_llm/ggml/convert_model.py,sha256=t-tGK9w8ZRi9dlDLTutput3ZBKj3ji94WUJi2KG8hkA,5955
-ipex_llm/ggml/quantize.py,sha256=TOoSe1w7tqAoV_fuqQhXIYb1S02A6udeud6IX0kLSic,6330
+ipex_llm/ggml/quantize.py,sha256=Cvk1R771rRDhSW7BRWcmb4ImY6TWDl_u9Vkdh7rYSuM,6367
 ipex_llm/ggml/model/__init__.py,sha256=T-EbRT6GJ_8RCu-iLmSzcftOimXSPQf2d5X72AUAy2Y,874
 ipex_llm/ggml/model/bloom/__init__.py,sha256=291QHI19FMw7Z1oaKBAf2YJ0M51iYqWC4IT1ejI-OGg,900
 ipex_llm/ggml/model/bloom/bloom.py,sha256=fUxgZd_Uc4RXaMC_naYdjekwNprM1TpURmQ8VbocShc,17975
@@ -41,35 +41,35 @@ ipex_llm/langchain/llms/transformerspipelinellm.py,sha256=vm522YPPwWxxAPVvQBtxRf
 ipex_llm/langchain/vllm/__init__.py,sha256=T-EbRT6GJ_8RCu-iLmSzcftOimXSPQf2d5X72AUAy2Y,874
 ipex_llm/langchain/vllm/vllm.py,sha256=6dxc-ZISZQrJilEa_HA827l75Dv9rcHpY_G6FdJ8BVs,7793
 ipex_llm/libs/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-ipex_llm/libs/bloom-api.dll,sha256=_INZo-YdawiFT4W8ycNSvfZGX7PyacE1FdWqdZ8ACBs,36352
-ipex_llm/libs/bloom.dll,sha256=rJwoSwgB6yXZBD98zjINiMMriV_HrsGtV-qUE7Lvfko,506880
-ipex_llm/libs/gptneox-api.dll,sha256=s5DlqOac9kaIpVCHI2R2y_GMz3ywntM2Z5JxC8CdByc,24576
-ipex_llm/libs/gptneox.dll,sha256=QH5m60fW8LZ6eDe-e66TIajdVNvh0KBjgFVlkJ-Hg_8,567296
-ipex_llm/libs/libbloom_avx.dll,sha256=3pTsql6-EovdJ4V7_RhYPHFNA2sNmdd3o6JiX_ZRB8A,535040
-ipex_llm/libs/libbloom_vnni.dll,sha256=_s9QDl8PwDk2i0HlAXAc4zNPSD-QP8CYuGlFNlW3kqw,506880
-ipex_llm/libs/libgptneox_avx.dll,sha256=5OFhG019GnKBSunLFj8Hdl3y74vYN9U166yH5jzq02o,595456
-ipex_llm/libs/libgptneox_vnni.dll,sha256=cO_uJK9ryOZCq1Mkis0JeeoXL7ELO4_5wwR2CsnLduM,567808
-ipex_llm/libs/libllama_avx.dll,sha256=rnzeKhvjPsR9yAqA2iGzeyTzJHsGqkzUhlWsLTKO-L0,589824
-ipex_llm/libs/libllama_vnni.dll,sha256=MpFGU7izhp3cjAV3dilxSawboR4h8YToQs-zLmVp09U,561664
-ipex_llm/libs/libstarcoder_avx.dll,sha256=_2mioTJ9PKfBnE7ePf_DXbf1nnv0kQvPWfH6Em8F2Dc,626688
-ipex_llm/libs/libstarcoder_vnni.dll,sha256=uCzy3zuwkJ9kpMsfjASte0AEAfANfMfy2QPO2_sU7iA,598528
-ipex_llm/libs/llama-api.dll,sha256=G9AOyrQqXM0sNyvuenC2AsltfyOGu7PUVP49Cd51Alw,25600
-ipex_llm/libs/llama.dll,sha256=2RsqXu5FuTFYV0-xfAT6p4W0rTpn_CLgPfY7_FOf6H0,561152
-ipex_llm/libs/main-bloom.exe,sha256=Oip9lCr0Z9E9JtNmmSfcpeIpa9u8QqljDoA6J26iyOs,103424
-ipex_llm/libs/main-gptneox.exe,sha256=HPSbPmvCZG7hsC6Cl5Aq2KIXwJ9x1C1rQKy-bXfsPvI,98816
-ipex_llm/libs/main-llama.exe,sha256=Ae1q1zudFru-aw8scEAByyfTNJysBJ8ok4gPM9QHgeg,99840
-ipex_llm/libs/main-starcoder.exe,sha256=_aCei2KKCjkY4eN8M-4uNBnmjSPCRCV4l5HzPuXKVyg,157696
-ipex_llm/libs/pipeline.dll,sha256=YNiP5VgCJurVeo7w-Ry3rfSW5a7XiXu_auJP6iPRNsE,72704
-ipex_llm/libs/quantize-bloom.exe,sha256=-BPVLMa469h23MFGald10g70gCzuAxsxYORFaov3iRs,126464
-ipex_llm/libs/quantize-bloom_vnni.exe,sha256=zOw0ZBktkMBZT1XuDrbmoAdNr1MgD-Sv7_0SjROSqUc,127488
-ipex_llm/libs/quantize-gptneox.exe,sha256=8-ZWZMSejey3NZYEgICAGB1_Ypb0g_sSSE7oEVRJBqU,104448
-ipex_llm/libs/quantize-gptneox_vnni.exe,sha256=6q4jDAT4eRgVmlb-bTA2N2HUmtWv1X2D6CjzYxtayCI,104960
-ipex_llm/libs/quantize-llama.exe,sha256=0lKm4Iq-CfHORbiQHcANIzsthrDt5PovjMYMIeRTk9I,109568
-ipex_llm/libs/quantize-llama_vnni.exe,sha256=wMP_pOkyNOPvHSAuWFr5f07SRLKbrkgbGo41O3hv5a4,110592
-ipex_llm/libs/quantize-starcoder.exe,sha256=mbh4bLwkWbtddyPdCz0jYNUf8vMFPZxFShOxtCqMzV4,127488
-ipex_llm/libs/quantize-starcoder_vnni.exe,sha256=AxO1y6ERwky9UJpjylpQ43U_xgxdX8PAdKXbyx1xsYI,128512
-ipex_llm/libs/starcoder-api.dll,sha256=_6xipNB_cWOy0iF7YmC10akPFNIpV_ymVDc5HcdUZtg,21504
-ipex_llm/libs/starcoder.dll,sha256=d3a-7_HMs7Mivq2719k7Unc5TEvLg2GwVIr7FgwiO7U,598016
+ipex_llm/libs/bloom-api.dll,sha256=KZO8E1UaDCnft7K0TDoh_3zTx42ISTU4D2bSqoPEV2s,36352
+ipex_llm/libs/bloom.dll,sha256=svReLrk8rOmuItKNyhldKdx-DoMPMO642_h_Ug5UxD0,507904
+ipex_llm/libs/gptneox-api.dll,sha256=O-N2Ia1UysaymHfImedI_WjOeJ2NTbxNn9q6yGXOQAI,24576
+ipex_llm/libs/gptneox.dll,sha256=fcBWhf3KmAqkmyf_F7NKa5lT0gO57-9BcC_rfeT-LwU,568320
+ipex_llm/libs/libbloom_avx.dll,sha256=zPvCrNZlhMXpWarLFBhmhybT54is_iiolIPrIwDWw2c,536576
+ipex_llm/libs/libbloom_vnni.dll,sha256=zJNPHctPT5i42tPNOSLeeMpllG30GGqI9v8iD1BYi4k,508416
+ipex_llm/libs/libgptneox_avx.dll,sha256=aM2pIFvj3JR3UtH_jaOfR7voUuPS3uxvmOEnplOBdbc,596992
+ipex_llm/libs/libgptneox_vnni.dll,sha256=SaC4qbKMRIqV_3NUcIYLV1gRZNsduV90DzovwmNY1UE,568832
+ipex_llm/libs/libllama_avx.dll,sha256=X-RoQ1vnzW0HEFDYJ8OyrMq9Nw080zXmM4RCOtNyx_E,591360
+ipex_llm/libs/libllama_vnni.dll,sha256=Is1ykadevzNjGRZTZtExJk8iAIXGjq-GJ7zHOpuNtzI,563200
+ipex_llm/libs/libstarcoder_avx.dll,sha256=kDSsXFnvGc0tqkv9uU3sO-JWYLYdeqq5mVe4aA_KB30,627712
+ipex_llm/libs/libstarcoder_vnni.dll,sha256=srj1INioPm8WX8WqsW1m5CrtvXfuySliylZH2bpCF08,599552
+ipex_llm/libs/llama-api.dll,sha256=LdTvWWTBx5z6a9WPJPLIuJ_y6KpjrSfq0weehc3VdwU,25600
+ipex_llm/libs/llama.dll,sha256=wYzQK-oATn1zwBuNu57FWSgVEOdNabU4PgU5O9SVm_Y,562688
+ipex_llm/libs/main-bloom.exe,sha256=_iCwL1VqzrOWnBDuilurts1prZwopIxPwqcMPUwuPIw,103424
+ipex_llm/libs/main-gptneox.exe,sha256=TQ4SKDSTZ811jn2ZlAcDj9uksjYbL9DQVKdo3_94NRQ,98816
+ipex_llm/libs/main-llama.exe,sha256=bQGz9gMIjKMMH5zTqpj3M8Mh_FCWdeyFUcK66usqqlI,99840
+ipex_llm/libs/main-starcoder.exe,sha256=siUfDQYwB9zmcsaqgccks4-_ylIeN4RIAcJdIFgfOSU,157696
+ipex_llm/libs/pipeline.dll,sha256=2WR7LimvR1WHIgoetcO2RO3uXmng752cZ9L9hr6iGoE,72704
+ipex_llm/libs/quantize-bloom.exe,sha256=2-S0X9dnWH1WYvTV0bWlZKTwC5PfMC5fLNWouC-UiPw,126464
+ipex_llm/libs/quantize-bloom_vnni.exe,sha256=5Oy_AOS8K7FDGXqUQj1aoAZ-NpZj5rDx4oXkYJU9zfs,128000
+ipex_llm/libs/quantize-gptneox.exe,sha256=3OXhZHW7T6x0JTT7R6mu9EmLZDmyymKK7SbLV4IW0L0,104448
+ipex_llm/libs/quantize-gptneox_vnni.exe,sha256=8u0qGmF64EqIBZcYKFve3LzF94r-ag1-gp1poZ-UqTQ,104960
+ipex_llm/libs/quantize-llama.exe,sha256=SZps0VsS4RG1N_5lcCicfAMEI5RwdLMH7CZUVVVbdfQ,110080
+ipex_llm/libs/quantize-llama_vnni.exe,sha256=b_YXBMvuKfHX96Y31M8MdeUoGS__2e2NZSX1Kr0yCzM,110592
+ipex_llm/libs/quantize-starcoder.exe,sha256=Txap-heal5Q1pMJfrC1To8IcHktSboCReD8aLyT8u5A,127488
+ipex_llm/libs/quantize-starcoder_vnni.exe,sha256=SEh_V-9nXaD5QlDZPQ6HdoStp1krtNc1vtIg0E-OPuo,128512
+ipex_llm/libs/starcoder-api.dll,sha256=obLtkGPijemfhwOHIu8iIwt6UdGeGg0PnuvDBoIhR0Q,21504
+ipex_llm/libs/starcoder.dll,sha256=pEZDz8kqNxmyyRd4LCVnvVsyM1Q2d5TnAV1fYbugGJI,599040
 ipex_llm/llamaindex/__init__.py,sha256=T-EbRT6GJ_8RCu-iLmSzcftOimXSPQf2d5X72AUAy2Y,874
 ipex_llm/llamaindex/llms/__init__.py,sha256=KP1lEdGqDuxPoxL1ZSH25Pm2kKMPJBWUTLR0ckSLMIU,1139
 ipex_llm/llamaindex/llms/bigdlllm.py,sha256=FQBzq1KOjfc6uofTXAha3O7TqpJkNfOFepXQmOVlbnI,26314
@@ -87,14 +87,14 @@ ipex_llm/serving/fastchat/tgi_api_protocol.py,sha256=brT3k3-V0NJrU4fRqUwWjC0O3iO
 ipex_llm/serving/fastchat/tgi_api_server.py,sha256=agNTAEiZPSuj3dEdIdYKwkoY0cXOUDX06DiM9VP2knQ,24418
 ipex_llm/serving/fastchat/vllm_worker.py,sha256=ZLz2Q9GxJO6r_LOiP6epgCRjBGk-K4EB1SNEWSJp5DA,11091
 ipex_llm/transformers/__init__.py,sha256=pJHs6GZXHIObVE4BUCuej-6BKBZZg9pYWKPrkhWSfB4,1192
-ipex_llm/transformers/convert.py,sha256=i2IOmDnQBKNtcfUL95l8w4rNBMiU4SqX_9uz_LtPHMI,98086
+ipex_llm/transformers/convert.py,sha256=RVW8PIKpLrdMbvqKuUtWswyECTvDP7IM-o6I-Ez3TZ4,99554
 ipex_llm/transformers/convert_ipex.py,sha256=_nSnUTQy-yfkKaqGdqnBdWztZf3NGmnbZ0TKaDrF4X4,14617
 ipex_llm/transformers/embedding.py,sha256=bdgk59DvD4ZZyxRzewXOR7g56nThgO6uhIwk8QL7f-s,9299
 ipex_llm/transformers/kv.py,sha256=k4TU18LlA-Sbq9WNNQnfuzu3RSFBwFhmaV3BcGN5bAo,19191
 ipex_llm/transformers/lisa.py,sha256=F5WxbtXQ7RdKulj83h_2DnEIgKiKGZf7zvOmg6QBl2s,3289
 ipex_llm/transformers/loader.py,sha256=AwjV5RpI2t2bedlv7ZhLm8cfd-QJZm5hny-XyjIvdnk,6876
 ipex_llm/transformers/lookup.py,sha256=b6OlZ9OV10R9qeWw8mVryVpDxszkjwLkldvi7GPMJY8,19614
-ipex_llm/transformers/low_bit_linear.py,sha256=1diyN_5OTViAmi8CRIUh5j1s5Z9j3Umcz2MEiideV4U,40863
+ipex_llm/transformers/low_bit_linear.py,sha256=2FhbDODYaw0D2RXfYCx3B9NyDep2D50tzQm6pYDxpzQ,40964
 ipex_llm/transformers/model.py,sha256=64eRLtbFftku9kcN5xSNerbZ3jAFUjCbNlM8Ly54ygE,41079
 ipex_llm/transformers/modelling_bigdl.py,sha256=7JpNVMuyq_OmtNUaMFMXdxPWZp2q0QHC02QeA-VTPOw,6709
 ipex_llm/transformers/npu_model.py,sha256=X8ZtvZJpzz64XrSPhUYXXZmdJcbZ9X6G3Vlzw-zgN1Q,39749
@@ -154,7 +154,7 @@ ipex_llm/transformers/models/gptbigcode.py,sha256=cP1_qGWoa43R2WacAMblShjku4Qupc
 ipex_llm/transformers/models/gptneox.py,sha256=loRh1x_5S6BCeOr_s5xr-N_1SQHL3Y5IiUBAEyoMUqQ,6172
 ipex_llm/transformers/models/internlm.py,sha256=JZFrI2HXsIAfM-6pA2RO0wcXopOliC1FggLMzNzaDZ4,17404
 ipex_llm/transformers/models/internvl.py,sha256=Vx0vENIEQLX2M6P398mw5TOhpks0U8xf8rtRQvy94go,8154
-ipex_llm/transformers/models/llama.py,sha256=NzpyQve_RC9ez1W-jWPLGZ80k_S1I5Rx5saAzCsDIoI,8558
+ipex_llm/transformers/models/llama.py,sha256=rqrNjuZb_jeb9MKx0z-FSVoGx8YDBxQzPJ9ZUvYhgx0,9138
 ipex_llm/transformers/models/minicpm.py,sha256=eaPNVNrep0_xGoELhZd886ff0ceoKqB6cusdAhd52eE,10145
 ipex_llm/transformers/models/minicpm3.py,sha256=11cYl8KM2hoIJNMAOZMxiwCu6dMhup9ric_OEn8-VrQ,9363
 ipex_llm/transformers/models/minicpmv.py,sha256=PP05b5iTnrMpiseCn8iJcxKJDnfq7WqXp9Mrch0kKZ0,9876
@@ -174,7 +174,8 @@ ipex_llm/transformers/models/rwkv5.py,sha256=OkRNj1pCAZg1z2Fw-I0DEnxLEdZyPeRSQ6m
 ipex_llm/transformers/models/sd.py,sha256=VvHV5u-0k2MgHu3NL9113hPj7DgfxqctuKzEEeNfRDU,5981
 ipex_llm/transformers/models/stablelm.py,sha256=fj-XtOnR6kggnFUQTMPCOOzolkPztN06WAv8QW-XRnI,7054
 ipex_llm/transformers/models/starcoder2.py,sha256=ONKvD7JCkRM0DI-R56x28QFBJ7CjD5hOZBQ_3WfOcNk,6626
-ipex_llm/transformers/models/utils.py,sha256=WYBc26vSiy_CzV07z-eT5ts90Kko2yUmS3DDZtfGcRk,15065
+ipex_llm/transformers/models/utils.py,sha256=Rdn9T4zk6Hz8ybJp6kvlyfPwgHwdxEZ8R4zGtMeozWg,15105
+ipex_llm/transformers/models/whisper.py,sha256=ju3WP8Eq-KvD7kb3Qy51r4FOfSX3NBxfp5RBcq__gzc,4241
 ipex_llm/transformers/models/yuan.py,sha256=JYAn_ZaSGK0NBJLEIxCACfAq084a66GFJkdd5NbpmMA,7732
 ipex_llm/transformers/npu_models/__init__.py,sha256=ulEUGLjaP48LCrVeury3UxLjXxKzRi0UpSG4bYu-7f8,585
 ipex_llm/transformers/npu_models/baichuan.py,sha256=fJtd7fBrttySghRUgfZTAdxLjsSNC-XL08HISsXigLE,4685
@@ -243,11 +244,11 @@ ipex_llm/vllm/xpu/engine/__init__.py,sha256=pY_CpyuZd72fr6s32ejeKHKFW0K4vUU2rzZj
 ipex_llm/vllm/xpu/engine/engine.py,sha256=k4-D27WS_Gk3mA--w3HWAjPjb4Aiu043MVPi0ZoAUBc,5984
 ipex_llm/vllm/xpu/entrypoints/openai/api_server.py,sha256=GshTZFB8e4PWvqckfbmTOU6b0oLkNn7A-vzLuG9--j8,21544
 ipex_llm/vllm/xpu/entrypoints/openai/cli_args.py,sha256=2rENA2ucynMaIjiZBEh2ez1o5vR32GaP514t39CD7KM,8676
-ipex_llm-2.2.0b20250114.data/scripts/ipex-llm-init.bat,sha256=HPtCYuDYwEatq7dAwOvdfVcHYCpAVdbj75K1qh0vQek,2578
-ipex_llm-2.2.0b20250114.data/scripts/llm-chat.ps1,sha256=6qrs-hGVAV8IKh7Jx8nq_XrnZcjd7qGU5wndArM7Yag,2769
-ipex_llm-2.2.0b20250114.data/scripts/llm-cli.ps1,sha256=3qBtTLs_EjYDnM8YyCpJhzLnGCKTEGssu9UNqfkjVXs,3009
-ipex_llm-2.2.0b20250114.dist-info/METADATA,sha256=CsE0v0mVfDVChkqM_ovKZkcfFq2zcg1yL3xthEnO7JM,12705
-ipex_llm-2.2.0b20250114.dist-info/WHEEL,sha256=6iYPr8vTHsyDK75jr9X0V3I9wPSVmtwr_8fdATBciGk,98
-ipex_llm-2.2.0b20250114.dist-info/entry_points.txt,sha256=TiUyBB2MRmfF3ko-pyAEzqeBCRnyhu27bNOAsWPp3e8,61
-ipex_llm-2.2.0b20250114.dist-info/top_level.txt,sha256=CGCMHM-SyqUabU4h8RqJ2KTYckQUO3LvIWwmUQ6Qbzw,9
-ipex_llm-2.2.0b20250114.dist-info/RECORD,,
+ipex_llm-2.2.0b20250116.data/scripts/ipex-llm-init.bat,sha256=HPtCYuDYwEatq7dAwOvdfVcHYCpAVdbj75K1qh0vQek,2578
+ipex_llm-2.2.0b20250116.data/scripts/llm-chat.ps1,sha256=6qrs-hGVAV8IKh7Jx8nq_XrnZcjd7qGU5wndArM7Yag,2769
+ipex_llm-2.2.0b20250116.data/scripts/llm-cli.ps1,sha256=3qBtTLs_EjYDnM8YyCpJhzLnGCKTEGssu9UNqfkjVXs,3009
+ipex_llm-2.2.0b20250116.dist-info/METADATA,sha256=-88ot5J1vrH5lxaRqG7J_H4AODcB6syYq9PHArHcHw4,12879
+ipex_llm-2.2.0b20250116.dist-info/WHEEL,sha256=6iYPr8vTHsyDK75jr9X0V3I9wPSVmtwr_8fdATBciGk,98
+ipex_llm-2.2.0b20250116.dist-info/entry_points.txt,sha256=TiUyBB2MRmfF3ko-pyAEzqeBCRnyhu27bNOAsWPp3e8,61
+ipex_llm-2.2.0b20250116.dist-info/top_level.txt,sha256=CGCMHM-SyqUabU4h8RqJ2KTYckQUO3LvIWwmUQ6Qbzw,9
+ipex_llm-2.2.0b20250116.dist-info/RECORD,,