ipex-llm 2.3.0b20250407__py3-none-manylinux2010_x86_64.whl → 2.3.0b20250413__py3-none-manylinux2010_x86_64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- ipex_llm/transformers/kv.py +51 -1
- ipex_llm/transformers/models/common.py +3 -3
- ipex_llm/transformers/models/utils.py +43 -0
- {ipex_llm-2.3.0b20250407.dist-info → ipex_llm-2.3.0b20250413.dist-info}/METADATA +20 -20
- {ipex_llm-2.3.0b20250407.dist-info → ipex_llm-2.3.0b20250413.dist-info}/RECORD +11 -11
- {ipex_llm-2.3.0b20250407.data → ipex_llm-2.3.0b20250413.data}/scripts/ipex-llm-init +0 -0
- {ipex_llm-2.3.0b20250407.data → ipex_llm-2.3.0b20250413.data}/scripts/llm-chat +0 -0
- {ipex_llm-2.3.0b20250407.data → ipex_llm-2.3.0b20250413.data}/scripts/llm-cli +0 -0
- {ipex_llm-2.3.0b20250407.dist-info → ipex_llm-2.3.0b20250413.dist-info}/WHEEL +0 -0
- {ipex_llm-2.3.0b20250407.dist-info → ipex_llm-2.3.0b20250413.dist-info}/entry_points.txt +0 -0
- {ipex_llm-2.3.0b20250407.dist-info → ipex_llm-2.3.0b20250413.dist-info}/top_level.txt +0 -0
ipex_llm/transformers/kv.py
CHANGED
@@ -22,7 +22,8 @@ import math
|
|
22
22
|
|
23
23
|
from .models.utils import (
|
24
24
|
init_fp8_kv_cache, append_fp8_kv_cache,
|
25
|
-
init_kv_cache, append_kv_cache, extend_kv_cache
|
25
|
+
init_kv_cache, append_kv_cache, extend_kv_cache,
|
26
|
+
init_unbalanced_fp8_kv_cache, append_unbalanced_fp8_kv_cache,
|
26
27
|
)
|
27
28
|
from typing import Optional, Dict, Tuple, Any, List
|
28
29
|
from transformers.cache_utils import DynamicCache
|
@@ -151,6 +152,55 @@ class DynamicNormalCache(DynamicCache):
|
|
151
152
|
return past_key_values
|
152
153
|
|
153
154
|
|
155
|
+
class DynamicUnbalancedFp8Cache(DynamicCache):
    """Dynamic KV cache backed by the "unbalanced" FP8 cache helpers.

    "Unbalanced" means the key head dim and the value head dim are read
    separately from the incoming tensors and may differ. Buffer creation
    and growth are delegated to ``init_unbalanced_fp8_kv_cache`` and
    ``append_unbalanced_fp8_kv_cache``.
    """

    def __init__(self, num_hidden_layers: Optional[int] = None) -> None:
        # `num_hidden_layers` is accepted but intentionally not forwarded
        # to the parent (fix for transformers >= 4.45).
        super().__init__()

    def update(
        self,
        key_states: torch.Tensor,
        value_states: torch.Tensor,
        layer_idx: int,
        cache_kwargs: Optional[Dict[str, Any]]=None,
    ) -> Tuple[torch.Tensor, torch.Tensor]:
        """Append new key/value states for ``layer_idx`` and return the
        layer's full cached key and value tensors.

        ``cache_kwargs`` is accepted for interface compatibility and is
        not used here.
        """
        # An empty DynamicCache may be converted in transformers >= 4.45;
        # in that case hand the inputs straight back.
        if key_states == []:
            return key_states, value_states

        bsz, n_heads, n_new, k_dim = key_states.shape
        _, _, _, v_dim = value_states.shape

        # The token counter is advanced once per step, on the first layer.
        if layer_idx == 0:
            # 4.39 uses `_seen_tokens`, 4.37 uses `seen_tokens`
            counter = "_seen_tokens" if hasattr(self, "_seen_tokens") else "seen_tokens"
            setattr(self, counter, getattr(self, counter) + n_new)

        # Fetch the layer's buffers, creating them on first use.
        first_visit = len(self.key_cache) <= layer_idx
        if first_visit:
            k_buf, v_buf = init_unbalanced_fp8_kv_cache(
                bsz, n_heads, n_new, k_dim, v_dim,
                device=key_states.device,
            )
        else:
            k_buf = self.key_cache[layer_idx]
            v_buf = self.value_cache[layer_idx]

        k_buf, v_buf = append_unbalanced_fp8_kv_cache(k_buf, v_buf,
                                                      key_states, value_states)

        # Store the (possibly re-allocated) buffers back on the cache.
        if first_visit:
            self.key_cache.append(k_buf)
            self.value_cache.append(v_buf)
        else:
            self.key_cache[layer_idx] = k_buf
            self.value_cache[layer_idx] = v_buf

        return self.key_cache[layer_idx], self.value_cache[layer_idx]
|
202
|
+
|
203
|
+
|
154
204
|
# Copied from transformers.models.llama.modeling_llama.repeat_kv
|
155
205
|
def repeat_kv(hidden_states: torch.Tensor, n_rep: int) -> torch.Tensor:
|
156
206
|
"""
|
@@ -273,11 +273,11 @@ def scaled_dot_product_attention(query: torch.Tensor, key: torch.Tensor,
|
|
273
273
|
else:
|
274
274
|
attn_output = xe_addons.sdp_causal(query, key, value, mask, scale)
|
275
275
|
elif seq_length != kv_length and seq_length <= 32:
|
276
|
-
# todo: add scale support
|
276
|
+
# todo: add further scale support
|
277
277
|
if key.dtype == torch.uint8:
|
278
|
-
attn_output = xe_addons.sdp_fp8(query, key, value, mask)
|
278
|
+
attn_output = xe_addons.sdp_fp8(query, key, value, mask, scale)
|
279
279
|
else:
|
280
|
-
attn_output = xe_addons.sdp(query, key, value, mask)
|
280
|
+
attn_output = xe_addons.sdp(query, key, value, mask, scale)
|
281
281
|
else:
|
282
282
|
if key.dtype == torch.uint8:
|
283
283
|
attn_output = xe_addons.sdp_fp8_non_causal(query, key, value, mask, scale)
|
@@ -138,6 +138,49 @@ def append_fp8_kv_cache(k_cache, v_cache, key, value):
|
|
138
138
|
return new_k_cache, new_v_cache
|
139
139
|
|
140
140
|
|
141
|
+
def init_unbalanced_fp8_kv_cache(batch_size, num_heads, current_length,
                                 k_head_dim, v_head_dim, device):
    """Allocate empty uint8 key/value cache views for the case where the
    key head dim differs from the value head dim.

    Each backing buffer has room for ``current_length + FP8_KV_ALLOC_LENGTH``
    positions along dim 2. The returned tensors are zero-length views over
    those buffers (size 0 on dim 2) that keep the buffers' strides.

    Returns:
        Tuple ``(k_cache, v_cache)``.
    """
    capacity = current_length + FP8_KV_ALLOC_LENGTH

    def _empty_view(head_dim):
        # Reserve the full-capacity buffer, then expose it as a view with
        # zero positions so later appends can widen it.
        backing = torch.empty(batch_size, num_heads, capacity, head_dim,
                              dtype=torch.uint8, device=device)
        return backing.as_strided((batch_size, num_heads, 0, head_dim),
                                  backing.stride(), storage_offset=0)

    k_cache = _empty_view(k_head_dim)
    v_cache = _empty_view(v_head_dim)
    return k_cache, v_cache
|
156
|
+
|
157
|
+
|
158
|
+
def append_unbalanced_fp8_kv_cache(k_cache, v_cache, key, value):
    """Append ``key``/``value`` to the uint8 caches along dim 2.

    If the key cache's stride on dim 1 can hold the grown length, both
    caches are widened in place as strided views. Otherwise new buffers
    are allocated via ``init_unbalanced_fp8_kv_cache`` and the existing
    contents are copied over. The new entries are then written by
    ``xe_addons.quantize_key_value`` into the tail slices.

    Returns:
        Tuple ``(new_k_cache, new_v_cache)`` covering old + new positions.
    """
    batch_size, num_heads, old_len, k_head_dim = k_cache.shape
    _, _, _, v_head_dim = v_cache.shape
    total_len = old_len + key.size(2)
    k_shape = (batch_size, num_heads, total_len, k_head_dim)
    v_shape = (batch_size, num_heads, total_len, v_head_dim)

    # Capacity is judged from the key cache only; both caches are created
    # together by init_unbalanced_fp8_kv_cache.
    fits_in_place = k_cache.stride(1) >= total_len * k_cache.size(3)
    if fits_in_place:
        grown_k = k_cache.as_strided(k_shape, k_cache.stride(), storage_offset=0)
        grown_v = v_cache.as_strided(v_shape, v_cache.stride(), storage_offset=0)
    else:
        fresh_k, fresh_v = init_unbalanced_fp8_kv_cache(batch_size, num_heads, total_len,
                                                        k_head_dim, v_head_dim, key.device)
        grown_k = fresh_k.as_strided(k_shape, fresh_k.stride(), storage_offset=0)
        grown_v = fresh_v.as_strided(v_shape, fresh_v.stride(), storage_offset=0)
        # Carry the already-cached entries over to the new buffers.
        grown_k[:, :, :old_len, :] = k_cache
        grown_v[:, :, :old_len, :] = v_cache

    import xe_addons
    k_tail = grown_k[:, :, old_len:total_len, :]
    v_tail = grown_v[:, :, old_len:total_len, :]
    xe_addons.quantize_key_value(key, value, k_tail, v_tail)

    return grown_k, grown_v
|
182
|
+
|
183
|
+
|
141
184
|
def restore_fp8_kv_cache(k_cache, v_cache, dtype):
|
142
185
|
key_states = torch.empty(k_cache.shape, device=k_cache.device, dtype=dtype)
|
143
186
|
value_states = torch.empty(v_cache.shape, device=v_cache.device, dtype=dtype)
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: ipex-llm
|
3
|
-
Version: 2.3.0b20250407
|
3
|
+
Version: 2.3.0b20250413
|
4
4
|
Summary: Large Language Model Develop Toolkit
|
5
5
|
Home-page: https://github.com/intel-analytics/ipex-llm
|
6
6
|
Author: BigDL Authors
|
@@ -27,7 +27,7 @@ Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine
|
|
27
27
|
Requires-Dist: torch ==2.1.2+cpu ; (platform_system == "Linux") and extra == 'all'
|
28
28
|
Requires-Dist: torch ==2.1.2 ; (platform_system == "Windows") and extra == 'all'
|
29
29
|
Provides-Extra: cpp
|
30
|
-
Requires-Dist: bigdl-core-cpp ==2.7.
|
30
|
+
Requires-Dist: bigdl-core-cpp ==2.7.0b20250413 ; extra == 'cpp'
|
31
31
|
Requires-Dist: setuptools ; extra == 'cpp'
|
32
32
|
Requires-Dist: onednn-devel ==2025.0.1 ; (platform_system == "Windows") and extra == 'cpp'
|
33
33
|
Requires-Dist: onednn ==2025.0.1 ; (platform_system == "Windows") and extra == 'cpp'
|
@@ -60,7 +60,7 @@ Requires-Dist: transformers ==4.40.0 ; extra == 'npu'
|
|
60
60
|
Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'npu'
|
61
61
|
Requires-Dist: torch ==2.1.2+cpu ; (platform_system == "Linux") and extra == 'npu'
|
62
62
|
Requires-Dist: torch ==2.1.2 ; (platform_system == "Windows") and extra == 'npu'
|
63
|
-
Requires-Dist: bigdl-core-npu ==2.7.
|
63
|
+
Requires-Dist: bigdl-core-npu ==2.7.0b20250413 ; (platform_system == "Windows") and extra == 'npu'
|
64
64
|
Provides-Extra: serving
|
65
65
|
Requires-Dist: py-cpuinfo ; extra == 'serving'
|
66
66
|
Requires-Dist: fschat[model_worker,webui] ==0.2.36 ; extra == 'serving'
|
@@ -80,9 +80,9 @@ Requires-Dist: setuptools <70.0.0 ; extra == 'xpu'
|
|
80
80
|
Requires-Dist: torch ==2.1.0a0 ; extra == 'xpu'
|
81
81
|
Requires-Dist: torchvision ==0.16.0a0 ; extra == 'xpu'
|
82
82
|
Requires-Dist: intel-extension-for-pytorch ==2.1.10+xpu ; extra == 'xpu'
|
83
|
-
Requires-Dist: bigdl-core-xe-21 ==2.7.
|
84
|
-
Requires-Dist: bigdl-core-xe-batch-21 ==2.7.
|
85
|
-
Requires-Dist: bigdl-core-xe-addons-21 ==2.7.
|
83
|
+
Requires-Dist: bigdl-core-xe-21 ==2.7.0b20250413 ; extra == 'xpu'
|
84
|
+
Requires-Dist: bigdl-core-xe-batch-21 ==2.7.0b20250413 ; extra == 'xpu'
|
85
|
+
Requires-Dist: bigdl-core-xe-addons-21 ==2.7.0b20250413 ; extra == 'xpu'
|
86
86
|
Provides-Extra: xpu-2-1
|
87
87
|
Requires-Dist: py-cpuinfo ; extra == 'xpu-2-1'
|
88
88
|
Requires-Dist: protobuf ; extra == 'xpu-2-1'
|
@@ -97,9 +97,9 @@ Requires-Dist: setuptools <70.0.0 ; extra == 'xpu-2-1'
|
|
97
97
|
Requires-Dist: torch ==2.1.0a0 ; extra == 'xpu-2-1'
|
98
98
|
Requires-Dist: torchvision ==0.16.0a0 ; extra == 'xpu-2-1'
|
99
99
|
Requires-Dist: intel-extension-for-pytorch ==2.1.10+xpu ; extra == 'xpu-2-1'
|
100
|
-
Requires-Dist: bigdl-core-xe-21 ==2.7.
|
101
|
-
Requires-Dist: bigdl-core-xe-batch-21 ==2.7.
|
102
|
-
Requires-Dist: bigdl-core-xe-addons-21 ==2.7.
|
100
|
+
Requires-Dist: bigdl-core-xe-21 ==2.7.0b20250413 ; extra == 'xpu-2-1'
|
101
|
+
Requires-Dist: bigdl-core-xe-batch-21 ==2.7.0b20250413 ; extra == 'xpu-2-1'
|
102
|
+
Requires-Dist: bigdl-core-xe-addons-21 ==2.7.0b20250413 ; extra == 'xpu-2-1'
|
103
103
|
Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'xpu-2-1'
|
104
104
|
Requires-Dist: dpcpp-cpp-rt ==2024.0.2 ; (platform_system == "Windows") and extra == 'xpu-2-1'
|
105
105
|
Requires-Dist: mkl-dpcpp ==2024.0.0 ; (platform_system == "Windows") and extra == 'xpu-2-1'
|
@@ -117,7 +117,7 @@ Requires-Dist: setuptools ; extra == 'xpu-2-6'
|
|
117
117
|
Requires-Dist: torch ==2.6.0+xpu ; extra == 'xpu-2-6'
|
118
118
|
Requires-Dist: torchvision ==0.21.0+xpu ; extra == 'xpu-2-6'
|
119
119
|
Requires-Dist: torchaudio ==2.6.0+xpu ; extra == 'xpu-2-6'
|
120
|
-
Requires-Dist: bigdl-core-xe-all ==2.7.
|
120
|
+
Requires-Dist: bigdl-core-xe-all ==2.7.0b20250413 ; extra == 'xpu-2-6'
|
121
121
|
Requires-Dist: onednn-devel ==2025.0.1 ; extra == 'xpu-2-6'
|
122
122
|
Requires-Dist: onednn ==2025.0.1 ; extra == 'xpu-2-6'
|
123
123
|
Requires-Dist: dpcpp-cpp-rt ==2025.0.2 ; extra == 'xpu-2-6'
|
@@ -132,7 +132,7 @@ Requires-Dist: tokenizers ==0.15.2 ; extra == 'xpu-2-6-arl'
|
|
132
132
|
Requires-Dist: accelerate ==0.23.0 ; extra == 'xpu-2-6-arl'
|
133
133
|
Requires-Dist: tabulate ; extra == 'xpu-2-6-arl'
|
134
134
|
Requires-Dist: setuptools ; extra == 'xpu-2-6-arl'
|
135
|
-
Requires-Dist: bigdl-core-xe-all ==2.7.
|
135
|
+
Requires-Dist: bigdl-core-xe-all ==2.7.0b20250413 ; extra == 'xpu-2-6-arl'
|
136
136
|
Requires-Dist: onednn-devel ==2025.0.1 ; extra == 'xpu-2-6-arl'
|
137
137
|
Requires-Dist: onednn ==2025.0.1 ; extra == 'xpu-2-6-arl'
|
138
138
|
Requires-Dist: dpcpp-cpp-rt ==2025.0.2 ; extra == 'xpu-2-6-arl'
|
@@ -155,9 +155,9 @@ Requires-Dist: tokenizers ==0.15.2 ; extra == 'xpu-arc'
|
|
155
155
|
Requires-Dist: accelerate ==0.23.0 ; extra == 'xpu-arc'
|
156
156
|
Requires-Dist: tabulate ; extra == 'xpu-arc'
|
157
157
|
Requires-Dist: setuptools ; extra == 'xpu-arc'
|
158
|
-
Requires-Dist: bigdl-core-xe-23 ==2.7.
|
159
|
-
Requires-Dist: bigdl-core-xe-batch-23 ==2.7.
|
160
|
-
Requires-Dist: bigdl-core-xe-addons-23 ==2.7.
|
158
|
+
Requires-Dist: bigdl-core-xe-23 ==2.7.0b20250413 ; extra == 'xpu-arc'
|
159
|
+
Requires-Dist: bigdl-core-xe-batch-23 ==2.7.0b20250413 ; extra == 'xpu-arc'
|
160
|
+
Requires-Dist: bigdl-core-xe-addons-23 ==2.7.0b20250413 ; extra == 'xpu-arc'
|
161
161
|
Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'xpu-arc'
|
162
162
|
Requires-Dist: torch ==2.3.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-arc'
|
163
163
|
Requires-Dist: torchvision ==0.18.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-arc'
|
@@ -178,9 +178,9 @@ Requires-Dist: tokenizers ==0.15.2 ; extra == 'xpu-arl'
|
|
178
178
|
Requires-Dist: accelerate ==0.23.0 ; extra == 'xpu-arl'
|
179
179
|
Requires-Dist: tabulate ; extra == 'xpu-arl'
|
180
180
|
Requires-Dist: setuptools ; extra == 'xpu-arl'
|
181
|
-
Requires-Dist: bigdl-core-xe-23 ==2.7.
|
182
|
-
Requires-Dist: bigdl-core-xe-batch-23 ==2.7.
|
183
|
-
Requires-Dist: bigdl-core-xe-addons-23 ==2.7.
|
181
|
+
Requires-Dist: bigdl-core-xe-23 ==2.7.0b20250413 ; extra == 'xpu-arl'
|
182
|
+
Requires-Dist: bigdl-core-xe-batch-23 ==2.7.0b20250413 ; extra == 'xpu-arl'
|
183
|
+
Requires-Dist: bigdl-core-xe-addons-23 ==2.7.0b20250413 ; extra == 'xpu-arl'
|
184
184
|
Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'xpu-arl'
|
185
185
|
Requires-Dist: torch ==2.3.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-arl'
|
186
186
|
Requires-Dist: torchvision ==0.18.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-arl'
|
@@ -201,9 +201,9 @@ Requires-Dist: tokenizers ==0.15.2 ; extra == 'xpu-lnl'
|
|
201
201
|
Requires-Dist: accelerate ==0.23.0 ; extra == 'xpu-lnl'
|
202
202
|
Requires-Dist: tabulate ; extra == 'xpu-lnl'
|
203
203
|
Requires-Dist: setuptools ; extra == 'xpu-lnl'
|
204
|
-
Requires-Dist: bigdl-core-xe-23 ==2.7.
|
205
|
-
Requires-Dist: bigdl-core-xe-batch-23 ==2.7.
|
206
|
-
Requires-Dist: bigdl-core-xe-addons-23 ==2.7.
|
204
|
+
Requires-Dist: bigdl-core-xe-23 ==2.7.0b20250413 ; extra == 'xpu-lnl'
|
205
|
+
Requires-Dist: bigdl-core-xe-batch-23 ==2.7.0b20250413 ; extra == 'xpu-lnl'
|
206
|
+
Requires-Dist: bigdl-core-xe-addons-23 ==2.7.0b20250413 ; extra == 'xpu-lnl'
|
207
207
|
Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'xpu-lnl'
|
208
208
|
Requires-Dist: torch ==2.3.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-lnl'
|
209
209
|
Requires-Dist: torchvision ==0.18.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-lnl'
|
@@ -97,7 +97,7 @@ ipex_llm/transformers/__init__.py,sha256=BreA3EY6hkNq0rVixb_sUuTLzMrcWXTt3yRsshC
|
|
97
97
|
ipex_llm/transformers/convert.py,sha256=xqqZFGcdDRko2IYgfSgDRs8ef4THUR25IAhSyDV0VUs,106933
|
98
98
|
ipex_llm/transformers/convert_ipex.py,sha256=_nSnUTQy-yfkKaqGdqnBdWztZf3NGmnbZ0TKaDrF4X4,14617
|
99
99
|
ipex_llm/transformers/embedding.py,sha256=bdgk59DvD4ZZyxRzewXOR7g56nThgO6uhIwk8QL7f-s,9299
|
100
|
-
ipex_llm/transformers/kv.py,sha256=
|
100
|
+
ipex_llm/transformers/kv.py,sha256=src_HcVDKFwQ1V8hdTrFQw5RIwUewM9VOR47GVTPJG4,21187
|
101
101
|
ipex_llm/transformers/lisa.py,sha256=F5WxbtXQ7RdKulj83h_2DnEIgKiKGZf7zvOmg6QBl2s,3289
|
102
102
|
ipex_llm/transformers/loader.py,sha256=c9qfJSC6-in-mkd-iKb1igk3nHWUYS3QtyH2cOazmKc,6825
|
103
103
|
ipex_llm/transformers/lookup.py,sha256=b6OlZ9OV10R9qeWw8mVryVpDxszkjwLkldvi7GPMJY8,19614
|
@@ -153,7 +153,7 @@ ipex_llm/transformers/models/chatglm.py,sha256=UHai1t2AUtGmF765_eHF8LUMVQzp_oCBx
|
|
153
153
|
ipex_llm/transformers/models/chatglm2.py,sha256=KyAIX7zGVQDQuwwM3QMBNWZbTeMHEzKUIgAryT0voHc,14933
|
154
154
|
ipex_llm/transformers/models/chatglm4.py,sha256=QvUehdaCePB3MNHyWg3dneDxmjtBdxYeKUyQUVcsgfM,16886
|
155
155
|
ipex_llm/transformers/models/chatglm4v.py,sha256=Ba9Xtzwtzk_rzg5khGqDrlHfJsDwc5YcM5_yPoord7o,13324
|
156
|
-
ipex_llm/transformers/models/common.py,sha256=
|
156
|
+
ipex_llm/transformers/models/common.py,sha256=LVA9nL_qJ61NEkEn9T985PjrrWPGpDTCALknH4Qv5aw,13040
|
157
157
|
ipex_llm/transformers/models/decilm.py,sha256=P-PBuDPf07GvKggLwJx_wPwIn6esN3rX8ai2JxRuZmE,5246
|
158
158
|
ipex_llm/transformers/models/deepseek.py,sha256=w6tGeyJ9joD7lQBiZ6A01Z00g8hAXC1N2yGtJh8kyuk,13096
|
159
159
|
ipex_llm/transformers/models/deepseek_v3.py,sha256=CTgwIKQlUPlUCbOxc9Id5GapWkXOP6pMtkguYrWpCio,10003
|
@@ -187,7 +187,7 @@ ipex_llm/transformers/models/rwkv5.py,sha256=OkRNj1pCAZg1z2Fw-I0DEnxLEdZyPeRSQ6m
|
|
187
187
|
ipex_llm/transformers/models/sd.py,sha256=VvHV5u-0k2MgHu3NL9113hPj7DgfxqctuKzEEeNfRDU,5981
|
188
188
|
ipex_llm/transformers/models/stablelm.py,sha256=fj-XtOnR6kggnFUQTMPCOOzolkPztN06WAv8QW-XRnI,7054
|
189
189
|
ipex_llm/transformers/models/starcoder2.py,sha256=ONKvD7JCkRM0DI-R56x28QFBJ7CjD5hOZBQ_3WfOcNk,6626
|
190
|
-
ipex_llm/transformers/models/utils.py,sha256=
|
190
|
+
ipex_llm/transformers/models/utils.py,sha256=Rj7QK1s3QxsTT4HzGNR00Q7izG5xYiZEX29YoQIM1tA,16998
|
191
191
|
ipex_llm/transformers/models/whisper.py,sha256=ju3WP8Eq-KvD7kb3Qy51r4FOfSX3NBxfp5RBcq__gzc,4241
|
192
192
|
ipex_llm/transformers/models/yuan.py,sha256=JYAn_ZaSGK0NBJLEIxCACfAq084a66GFJkdd5NbpmMA,7732
|
193
193
|
ipex_llm/transformers/npu_models/__init__.py,sha256=ulEUGLjaP48LCrVeury3UxLjXxKzRi0UpSG4bYu-7f8,585
|
@@ -263,11 +263,11 @@ ipex_llm/vllm/xpu/engine/__init__.py,sha256=pY_CpyuZd72fr6s32ejeKHKFW0K4vUU2rzZj
|
|
263
263
|
ipex_llm/vllm/xpu/engine/engine.py,sha256=NvCMbp0X8NVrOqbwm4FTvXOptTRLzu9jQsy37ZHnTk8,9493
|
264
264
|
ipex_llm/vllm/xpu/entrypoints/openai/api_server.py,sha256=IjiSze9vzBCAkLu_VwIcJwuO1jyFna7DLrj6aSL7RaQ,35220
|
265
265
|
ipex_llm/vllm/xpu/entrypoints/openai/cli_args.py,sha256=hB398yYtKauASRzevctScdbFIjiiSGMAe1bwEuIHrhY,10893
|
266
|
-
ipex_llm-2.3.
|
267
|
-
ipex_llm-2.3.
|
268
|
-
ipex_llm-2.3.
|
269
|
-
ipex_llm-2.3.
|
270
|
-
ipex_llm-2.3.
|
271
|
-
ipex_llm-2.3.
|
272
|
-
ipex_llm-2.3.
|
273
|
-
ipex_llm-2.3.
|
266
|
+
ipex_llm-2.3.0b20250413.data/scripts/ipex-llm-init,sha256=fLQsT2dRL6H5bThb4GuIWotAuqoLsIxFwA-0c2qmaO8,6672
|
267
|
+
ipex_llm-2.3.0b20250413.data/scripts/llm-chat,sha256=TdUnUmNapzuoe1c8IzrdVOQwWEg8IqsMSBRlOD3daZM,2249
|
268
|
+
ipex_llm-2.3.0b20250413.data/scripts/llm-cli,sha256=RXGPlLElHxcKzoUxljEMBIAXbzCDysXL-Nxw-xF-7LU,2457
|
269
|
+
ipex_llm-2.3.0b20250413.dist-info/METADATA,sha256=BcY-pLNYgB5lBm5wiYwAn7Y8UBeb5vcMLnTJsjK177A,13917
|
270
|
+
ipex_llm-2.3.0b20250413.dist-info/WHEEL,sha256=PPJcBMAZibF_2GFE9NmOJGqiaSMPiNFbJd6QaJjdA6Y,109
|
271
|
+
ipex_llm-2.3.0b20250413.dist-info/entry_points.txt,sha256=TiUyBB2MRmfF3ko-pyAEzqeBCRnyhu27bNOAsWPp3e8,61
|
272
|
+
ipex_llm-2.3.0b20250413.dist-info/top_level.txt,sha256=CGCMHM-SyqUabU4h8RqJ2KTYckQUO3LvIWwmUQ6Qbzw,9
|
273
|
+
ipex_llm-2.3.0b20250413.dist-info/RECORD,,
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|