ipex-llm 2.3.0b20250414__py3-none-manylinux2010_x86_64.whl → 2.3.0b20250415__py3-none-manylinux2010_x86_64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- ipex_llm/transformers/models/baichuan.py +5 -2
- ipex_llm/transformers/models/chatglm.py +3 -1
- ipex_llm/transformers/models/qwen_vl.py +3 -1
- {ipex_llm-2.3.0b20250414.dist-info → ipex_llm-2.3.0b20250415.dist-info}/METADATA +20 -20
- {ipex_llm-2.3.0b20250414.dist-info → ipex_llm-2.3.0b20250415.dist-info}/RECORD +11 -11
- {ipex_llm-2.3.0b20250414.data → ipex_llm-2.3.0b20250415.data}/scripts/ipex-llm-init +0 -0
- {ipex_llm-2.3.0b20250414.data → ipex_llm-2.3.0b20250415.data}/scripts/llm-chat +0 -0
- {ipex_llm-2.3.0b20250414.data → ipex_llm-2.3.0b20250415.data}/scripts/llm-cli +0 -0
- {ipex_llm-2.3.0b20250414.dist-info → ipex_llm-2.3.0b20250415.dist-info}/WHEEL +0 -0
- {ipex_llm-2.3.0b20250414.dist-info → ipex_llm-2.3.0b20250415.dist-info}/entry_points.txt +0 -0
- {ipex_llm-2.3.0b20250414.dist-info → ipex_llm-2.3.0b20250415.dist-info}/top_level.txt +0 -0
@@ -326,14 +326,17 @@ def baichuan_attention_forward_13b(
|
|
326
326
|
else:
|
327
327
|
attention_mask = attention_mask[None, :, -q_len:, :]
|
328
328
|
|
329
|
+
head_dim = query_states.shape[-1]
|
330
|
+
scale = 1 / math.sqrt(head_dim)
|
331
|
+
|
329
332
|
if use_sdp(q_len, kv_seq_len, self.head_dim, query_states):
|
330
333
|
import xe_addons
|
331
334
|
if use_quantize_kv:
|
332
335
|
attn_output = xe_addons.sdp_fp8(query_states, key_states, value_states,
|
333
|
-
attention_mask)
|
336
|
+
attention_mask, scale)
|
334
337
|
else:
|
335
338
|
attn_output = xe_addons.sdp(query_states, key_states, value_states,
|
336
|
-
attention_mask)
|
339
|
+
attention_mask, scale)
|
337
340
|
attn_weights = None
|
338
341
|
else:
|
339
342
|
if use_quantize_kv:
|
@@ -68,7 +68,9 @@ def glm_sdpa(query, key, value, attention_mask=None, is_causal=False):
|
|
68
68
|
if use_sdp(query.shape[2], key.shape[2],
|
69
69
|
query.shape[-1], query):
|
70
70
|
import xe_addons
|
71
|
-
attn_output = xe_addons.sdp(query, key, value, attn_bias)
|
71
|
+
head_dim = query.shape[-1]
|
72
|
+
scale = 1 / math.sqrt(head_dim)
|
73
|
+
attn_output = xe_addons.sdp(query, key, value, attn_bias, scale)
|
72
74
|
context_layer = attn_output.view(query.shape)
|
73
75
|
else:
|
74
76
|
head_dim = query.size(-1)
|
@@ -164,7 +164,9 @@ def qwen_attention_forward_vl(
|
|
164
164
|
if not self.training and not hidden_states.requires_grad and \
|
165
165
|
use_sdp(q_len, key.shape[2], self.head_dim, query):
|
166
166
|
import xe_addons
|
167
|
-
attn_output = xe_addons.sdp(query, key, value, attention_mask)
|
167
|
+
head_dim = query.shape[-1]
|
168
|
+
scale = 1 / math.sqrt(head_dim)
|
169
|
+
attn_output = xe_addons.sdp(query, key, value, attention_mask, scale)
|
168
170
|
attn_output = attn_output.view(query.shape)
|
169
171
|
attn_output = attn_output.transpose(1, 2)
|
170
172
|
attn_weight = None
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.1
|
2
2
|
Name: ipex-llm
|
3
|
-
Version: 2.3.0b20250414
|
3
|
+
Version: 2.3.0b20250415
|
4
4
|
Summary: Large Language Model Develop Toolkit
|
5
5
|
Home-page: https://github.com/intel-analytics/ipex-llm
|
6
6
|
Author: BigDL Authors
|
@@ -27,7 +27,7 @@ Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine
|
|
27
27
|
Requires-Dist: torch ==2.1.2+cpu ; (platform_system == "Linux") and extra == 'all'
|
28
28
|
Requires-Dist: torch ==2.1.2 ; (platform_system == "Windows") and extra == 'all'
|
29
29
|
Provides-Extra: cpp
|
30
|
-
Requires-Dist: bigdl-core-cpp ==2.7.0b20250414 ; extra == 'cpp'
|
30
|
+
Requires-Dist: bigdl-core-cpp ==2.7.0b20250415 ; extra == 'cpp'
|
31
31
|
Requires-Dist: setuptools ; extra == 'cpp'
|
32
32
|
Requires-Dist: onednn-devel ==2025.0.1 ; (platform_system == "Windows") and extra == 'cpp'
|
33
33
|
Requires-Dist: onednn ==2025.0.1 ; (platform_system == "Windows") and extra == 'cpp'
|
@@ -60,7 +60,7 @@ Requires-Dist: transformers ==4.40.0 ; extra == 'npu'
|
|
60
60
|
Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'npu'
|
61
61
|
Requires-Dist: torch ==2.1.2+cpu ; (platform_system == "Linux") and extra == 'npu'
|
62
62
|
Requires-Dist: torch ==2.1.2 ; (platform_system == "Windows") and extra == 'npu'
|
63
|
-
Requires-Dist: bigdl-core-npu ==2.7.0b20250414 ; (platform_system == "Windows") and extra == 'npu'
|
63
|
+
Requires-Dist: bigdl-core-npu ==2.7.0b20250415 ; (platform_system == "Windows") and extra == 'npu'
|
64
64
|
Provides-Extra: serving
|
65
65
|
Requires-Dist: py-cpuinfo ; extra == 'serving'
|
66
66
|
Requires-Dist: fschat[model_worker,webui] ==0.2.36 ; extra == 'serving'
|
@@ -80,9 +80,9 @@ Requires-Dist: setuptools <70.0.0 ; extra == 'xpu'
|
|
80
80
|
Requires-Dist: torch ==2.1.0a0 ; extra == 'xpu'
|
81
81
|
Requires-Dist: torchvision ==0.16.0a0 ; extra == 'xpu'
|
82
82
|
Requires-Dist: intel-extension-for-pytorch ==2.1.10+xpu ; extra == 'xpu'
|
83
|
-
Requires-Dist: bigdl-core-xe-21 ==2.7.0b20250414 ; extra == 'xpu'
|
84
|
-
Requires-Dist: bigdl-core-xe-batch-21 ==2.7.0b20250414 ; extra == 'xpu'
|
85
|
-
Requires-Dist: bigdl-core-xe-addons-21 ==2.7.0b20250414 ; extra == 'xpu'
|
83
|
+
Requires-Dist: bigdl-core-xe-21 ==2.7.0b20250415 ; extra == 'xpu'
|
84
|
+
Requires-Dist: bigdl-core-xe-batch-21 ==2.7.0b20250415 ; extra == 'xpu'
|
85
|
+
Requires-Dist: bigdl-core-xe-addons-21 ==2.7.0b20250415 ; extra == 'xpu'
|
86
86
|
Provides-Extra: xpu-2-1
|
87
87
|
Requires-Dist: py-cpuinfo ; extra == 'xpu-2-1'
|
88
88
|
Requires-Dist: protobuf ; extra == 'xpu-2-1'
|
@@ -97,9 +97,9 @@ Requires-Dist: setuptools <70.0.0 ; extra == 'xpu-2-1'
|
|
97
97
|
Requires-Dist: torch ==2.1.0a0 ; extra == 'xpu-2-1'
|
98
98
|
Requires-Dist: torchvision ==0.16.0a0 ; extra == 'xpu-2-1'
|
99
99
|
Requires-Dist: intel-extension-for-pytorch ==2.1.10+xpu ; extra == 'xpu-2-1'
|
100
|
-
Requires-Dist: bigdl-core-xe-21 ==2.7.0b20250414 ; extra == 'xpu-2-1'
|
101
|
-
Requires-Dist: bigdl-core-xe-batch-21 ==2.7.0b20250414 ; extra == 'xpu-2-1'
|
102
|
-
Requires-Dist: bigdl-core-xe-addons-21 ==2.7.0b20250414 ; extra == 'xpu-2-1'
|
100
|
+
Requires-Dist: bigdl-core-xe-21 ==2.7.0b20250415 ; extra == 'xpu-2-1'
|
101
|
+
Requires-Dist: bigdl-core-xe-batch-21 ==2.7.0b20250415 ; extra == 'xpu-2-1'
|
102
|
+
Requires-Dist: bigdl-core-xe-addons-21 ==2.7.0b20250415 ; extra == 'xpu-2-1'
|
103
103
|
Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'xpu-2-1'
|
104
104
|
Requires-Dist: dpcpp-cpp-rt ==2024.0.2 ; (platform_system == "Windows") and extra == 'xpu-2-1'
|
105
105
|
Requires-Dist: mkl-dpcpp ==2024.0.0 ; (platform_system == "Windows") and extra == 'xpu-2-1'
|
@@ -117,7 +117,7 @@ Requires-Dist: setuptools ; extra == 'xpu-2-6'
|
|
117
117
|
Requires-Dist: torch ==2.6.0+xpu ; extra == 'xpu-2-6'
|
118
118
|
Requires-Dist: torchvision ==0.21.0+xpu ; extra == 'xpu-2-6'
|
119
119
|
Requires-Dist: torchaudio ==2.6.0+xpu ; extra == 'xpu-2-6'
|
120
|
-
Requires-Dist: bigdl-core-xe-all ==2.7.0b20250414 ; extra == 'xpu-2-6'
|
120
|
+
Requires-Dist: bigdl-core-xe-all ==2.7.0b20250415 ; extra == 'xpu-2-6'
|
121
121
|
Requires-Dist: onednn-devel ==2025.0.1 ; extra == 'xpu-2-6'
|
122
122
|
Requires-Dist: onednn ==2025.0.1 ; extra == 'xpu-2-6'
|
123
123
|
Requires-Dist: dpcpp-cpp-rt ==2025.0.2 ; extra == 'xpu-2-6'
|
@@ -132,7 +132,7 @@ Requires-Dist: tokenizers ==0.15.2 ; extra == 'xpu-2-6-arl'
|
|
132
132
|
Requires-Dist: accelerate ==0.23.0 ; extra == 'xpu-2-6-arl'
|
133
133
|
Requires-Dist: tabulate ; extra == 'xpu-2-6-arl'
|
134
134
|
Requires-Dist: setuptools ; extra == 'xpu-2-6-arl'
|
135
|
-
Requires-Dist: bigdl-core-xe-all ==2.7.0b20250414 ; extra == 'xpu-2-6-arl'
|
135
|
+
Requires-Dist: bigdl-core-xe-all ==2.7.0b20250415 ; extra == 'xpu-2-6-arl'
|
136
136
|
Requires-Dist: onednn-devel ==2025.0.1 ; extra == 'xpu-2-6-arl'
|
137
137
|
Requires-Dist: onednn ==2025.0.1 ; extra == 'xpu-2-6-arl'
|
138
138
|
Requires-Dist: dpcpp-cpp-rt ==2025.0.2 ; extra == 'xpu-2-6-arl'
|
@@ -155,9 +155,9 @@ Requires-Dist: tokenizers ==0.15.2 ; extra == 'xpu-arc'
|
|
155
155
|
Requires-Dist: accelerate ==0.23.0 ; extra == 'xpu-arc'
|
156
156
|
Requires-Dist: tabulate ; extra == 'xpu-arc'
|
157
157
|
Requires-Dist: setuptools ; extra == 'xpu-arc'
|
158
|
-
Requires-Dist: bigdl-core-xe-23 ==2.7.0b20250414 ; extra == 'xpu-arc'
|
159
|
-
Requires-Dist: bigdl-core-xe-batch-23 ==2.7.0b20250414 ; extra == 'xpu-arc'
|
160
|
-
Requires-Dist: bigdl-core-xe-addons-23 ==2.7.0b20250414 ; extra == 'xpu-arc'
|
158
|
+
Requires-Dist: bigdl-core-xe-23 ==2.7.0b20250415 ; extra == 'xpu-arc'
|
159
|
+
Requires-Dist: bigdl-core-xe-batch-23 ==2.7.0b20250415 ; extra == 'xpu-arc'
|
160
|
+
Requires-Dist: bigdl-core-xe-addons-23 ==2.7.0b20250415 ; extra == 'xpu-arc'
|
161
161
|
Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'xpu-arc'
|
162
162
|
Requires-Dist: torch ==2.3.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-arc'
|
163
163
|
Requires-Dist: torchvision ==0.18.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-arc'
|
@@ -178,9 +178,9 @@ Requires-Dist: tokenizers ==0.15.2 ; extra == 'xpu-arl'
|
|
178
178
|
Requires-Dist: accelerate ==0.23.0 ; extra == 'xpu-arl'
|
179
179
|
Requires-Dist: tabulate ; extra == 'xpu-arl'
|
180
180
|
Requires-Dist: setuptools ; extra == 'xpu-arl'
|
181
|
-
Requires-Dist: bigdl-core-xe-23 ==2.7.0b20250414 ; extra == 'xpu-arl'
|
182
|
-
Requires-Dist: bigdl-core-xe-batch-23 ==2.7.0b20250414 ; extra == 'xpu-arl'
|
183
|
-
Requires-Dist: bigdl-core-xe-addons-23 ==2.7.0b20250414 ; extra == 'xpu-arl'
|
181
|
+
Requires-Dist: bigdl-core-xe-23 ==2.7.0b20250415 ; extra == 'xpu-arl'
|
182
|
+
Requires-Dist: bigdl-core-xe-batch-23 ==2.7.0b20250415 ; extra == 'xpu-arl'
|
183
|
+
Requires-Dist: bigdl-core-xe-addons-23 ==2.7.0b20250415 ; extra == 'xpu-arl'
|
184
184
|
Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'xpu-arl'
|
185
185
|
Requires-Dist: torch ==2.3.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-arl'
|
186
186
|
Requires-Dist: torchvision ==0.18.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-arl'
|
@@ -201,9 +201,9 @@ Requires-Dist: tokenizers ==0.15.2 ; extra == 'xpu-lnl'
|
|
201
201
|
Requires-Dist: accelerate ==0.23.0 ; extra == 'xpu-lnl'
|
202
202
|
Requires-Dist: tabulate ; extra == 'xpu-lnl'
|
203
203
|
Requires-Dist: setuptools ; extra == 'xpu-lnl'
|
204
|
-
Requires-Dist: bigdl-core-xe-23 ==2.7.0b20250414 ; extra == 'xpu-lnl'
|
205
|
-
Requires-Dist: bigdl-core-xe-batch-23 ==2.7.0b20250414 ; extra == 'xpu-lnl'
|
206
|
-
Requires-Dist: bigdl-core-xe-addons-23 ==2.7.0b20250414 ; extra == 'xpu-lnl'
|
204
|
+
Requires-Dist: bigdl-core-xe-23 ==2.7.0b20250415 ; extra == 'xpu-lnl'
|
205
|
+
Requires-Dist: bigdl-core-xe-batch-23 ==2.7.0b20250415 ; extra == 'xpu-lnl'
|
206
|
+
Requires-Dist: bigdl-core-xe-addons-23 ==2.7.0b20250415 ; extra == 'xpu-lnl'
|
207
207
|
Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'xpu-lnl'
|
208
208
|
Requires-Dist: torch ==2.3.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-lnl'
|
209
209
|
Requires-Dist: torchvision ==0.18.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-lnl'
|
@@ -145,11 +145,11 @@ ipex_llm/transformers/gguf/models/model_implement/yuan2/configuration_yuan.py,sh
|
|
145
145
|
ipex_llm/transformers/gguf/models/model_implement/yuan2/yuan_hf_model.py,sha256=_AOGMV65XHxgTxIib7lgs49InopcecTzRwgtYR8NTUg,51084
|
146
146
|
ipex_llm/transformers/models/__init__.py,sha256=tp2DcVkKg1-QvdYk7DY7rZvQWCDQ4ZjU8NAQ7Fclrpg,584
|
147
147
|
ipex_llm/transformers/models/aquila.py,sha256=VZb5Drpo_fTxwcExZ397LygnsNPX2sVbie9_JeFudZI,5252
|
148
|
-
ipex_llm/transformers/models/baichuan.py,sha256=
|
148
|
+
ipex_llm/transformers/models/baichuan.py,sha256=nRqg_ih8TCIAeSjoiQpaGNAXqXGpVvQmqj5_6gr-Rxg,18395
|
149
149
|
ipex_llm/transformers/models/baichuan_m1.py,sha256=l6BD9jbA8TQ5Q0fcngHNRw73SxqvC126ErENs7Zh-do,9513
|
150
150
|
ipex_llm/transformers/models/bert.py,sha256=U3JVnuY1z0ILlJgMvetOKuCAkH74ufGbg4whZ8GNtmQ,5620
|
151
151
|
ipex_llm/transformers/models/bloom.py,sha256=PxfzyYT-nFn3K5rZhTQjmcEjUUzAhUFzxIN4kzRlCuc,8103
|
152
|
-
ipex_llm/transformers/models/chatglm.py,sha256=
|
152
|
+
ipex_llm/transformers/models/chatglm.py,sha256=DQM63oPIVMMTBQN4O4hPF4WY1aSiTWq4Bt0BPmgrK0k,12687
|
153
153
|
ipex_llm/transformers/models/chatglm2.py,sha256=KyAIX7zGVQDQuwwM3QMBNWZbTeMHEzKUIgAryT0voHc,14933
|
154
154
|
ipex_llm/transformers/models/chatglm4.py,sha256=QvUehdaCePB3MNHyWg3dneDxmjtBdxYeKUyQUVcsgfM,16886
|
155
155
|
ipex_llm/transformers/models/chatglm4v.py,sha256=Ba9Xtzwtzk_rzg5khGqDrlHfJsDwc5YcM5_yPoord7o,13324
|
@@ -181,7 +181,7 @@ ipex_llm/transformers/models/qwen2.py,sha256=zK-FpUaxEhjD4gZa1ZvArodAilz29T_cpeA
|
|
181
181
|
ipex_llm/transformers/models/qwen2_5_omni.py,sha256=gNnWvGiPntn6GlyIUtCVYCSIMPU6FG9TCS7fhWbwerY,18779
|
182
182
|
ipex_llm/transformers/models/qwen2_moe.py,sha256=a0gYo-ngf8SxaEnBdZUJDnPS6Mkn_poDd8xqhx50icI,19516
|
183
183
|
ipex_llm/transformers/models/qwen2_vl.py,sha256=G-9e2oN4f5p5IWQ-zsBZuONxTura3BjlgyT2meigbHQ,13579
|
184
|
-
ipex_llm/transformers/models/qwen_vl.py,sha256=
|
184
|
+
ipex_llm/transformers/models/qwen_vl.py,sha256=lwNwCJNsBvOu1TGNDW_E2IlCjI7XZwHY8qIcZpuNDFc,17187
|
185
185
|
ipex_llm/transformers/models/rwkv4.py,sha256=H4KMtxN0JA2ZTXnonHpsUUJ5xULemo-D1Jzl0ri_UY8,6123
|
186
186
|
ipex_llm/transformers/models/rwkv5.py,sha256=OkRNj1pCAZg1z2Fw-I0DEnxLEdZyPeRSQ6msrkxLOCs,10710
|
187
187
|
ipex_llm/transformers/models/sd.py,sha256=VvHV5u-0k2MgHu3NL9113hPj7DgfxqctuKzEEeNfRDU,5981
|
@@ -263,11 +263,11 @@ ipex_llm/vllm/xpu/engine/__init__.py,sha256=pY_CpyuZd72fr6s32ejeKHKFW0K4vUU2rzZj
|
|
263
263
|
ipex_llm/vllm/xpu/engine/engine.py,sha256=NvCMbp0X8NVrOqbwm4FTvXOptTRLzu9jQsy37ZHnTk8,9493
|
264
264
|
ipex_llm/vllm/xpu/entrypoints/openai/api_server.py,sha256=IjiSze9vzBCAkLu_VwIcJwuO1jyFna7DLrj6aSL7RaQ,35220
|
265
265
|
ipex_llm/vllm/xpu/entrypoints/openai/cli_args.py,sha256=hB398yYtKauASRzevctScdbFIjiiSGMAe1bwEuIHrhY,10893
|
266
|
-
ipex_llm-2.3.0b20250414.data/scripts/ipex-llm-init,sha256=fLQsT2dRL6H5bThb4GuIWotAuqoLsIxFwA-0c2qmaO8,6672
|
267
|
-
ipex_llm-2.3.0b20250414.data/scripts/llm-chat,sha256=TdUnUmNapzuoe1c8IzrdVOQwWEg8IqsMSBRlOD3daZM,2249
|
268
|
-
ipex_llm-2.3.0b20250414.data/scripts/llm-cli,sha256=RXGPlLElHxcKzoUxljEMBIAXbzCDysXL-Nxw-xF-7LU,2457
|
269
|
-
ipex_llm-2.3.
|
270
|
-
ipex_llm-2.3.0b20250414.dist-info/WHEEL,sha256=PPJcBMAZibF_2GFE9NmOJGqiaSMPiNFbJd6QaJjdA6Y,109
|
271
|
-
ipex_llm-2.3.0b20250414.dist-info/entry_points.txt,sha256=TiUyBB2MRmfF3ko-pyAEzqeBCRnyhu27bNOAsWPp3e8,61
|
272
|
-
ipex_llm-2.3.0b20250414.dist-info/top_level.txt,sha256=CGCMHM-SyqUabU4h8RqJ2KTYckQUO3LvIWwmUQ6Qbzw,9
|
273
|
-
ipex_llm-2.3.0b20250414.dist-info/RECORD,,
|
266
|
+
ipex_llm-2.3.0b20250415.data/scripts/ipex-llm-init,sha256=fLQsT2dRL6H5bThb4GuIWotAuqoLsIxFwA-0c2qmaO8,6672
|
267
|
+
ipex_llm-2.3.0b20250415.data/scripts/llm-chat,sha256=TdUnUmNapzuoe1c8IzrdVOQwWEg8IqsMSBRlOD3daZM,2249
|
268
|
+
ipex_llm-2.3.0b20250415.data/scripts/llm-cli,sha256=RXGPlLElHxcKzoUxljEMBIAXbzCDysXL-Nxw-xF-7LU,2457
|
269
|
+
ipex_llm-2.3.0b20250415.dist-info/METADATA,sha256=AK6V5GUxadLFvaeVQf6Ym6bSCFwx4ChknK-6c21T2lo,13917
|
270
|
+
ipex_llm-2.3.0b20250415.dist-info/WHEEL,sha256=PPJcBMAZibF_2GFE9NmOJGqiaSMPiNFbJd6QaJjdA6Y,109
|
271
|
+
ipex_llm-2.3.0b20250415.dist-info/entry_points.txt,sha256=TiUyBB2MRmfF3ko-pyAEzqeBCRnyhu27bNOAsWPp3e8,61
|
272
|
+
ipex_llm-2.3.0b20250415.dist-info/top_level.txt,sha256=CGCMHM-SyqUabU4h8RqJ2KTYckQUO3LvIWwmUQ6Qbzw,9
|
273
|
+
ipex_llm-2.3.0b20250415.dist-info/RECORD,,
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|