ipex-llm 2.2.0b20250311__py3-none-manylinux2010_x86_64.whl → 2.2.0b20250311.post0__py3-none-manylinux2010_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -361,6 +361,33 @@ async def show_version():
361
361
  return JSONResponse(content=ver)
362
362
 
363
363
 
364
+ save_dict = {}
365
+ import os
366
+ flag = os.getenv("VLLM_LOG_OUTPUT", None)
367
+ async def stream_generator(generator, request, request_id):
368
+ async for chunk in generator:
369
+ if request_id not in save_dict:
370
+ save_dict[request_id] = ""
371
+ import json
372
+ try:
373
+ data = chunk.strip()
374
+ if data.startswith('data: '):
375
+ data = data[len('data: '):]
376
+ else:
377
+ yield chunk
378
+ json_data = json.loads(data)
379
+ if 'choices' in json_data and len(json_data['choices']) > 0:
380
+ choice = json_data['choices'][0]
381
+ if 'delta' in choice:
382
+ save_dict[request_id] += choice["delta"]["content"]
383
+ elif 'text' in choice:
384
+ save_dict[request_id] += choice["text"]
385
+ except json.JSONDecodeError:
386
+ print(f"Received request_id: {request_id}, request: {request} content: {save_dict[request_id]}")
387
+ pass # Done
388
+ yield chunk
389
+
390
+
364
391
  @router.post("/v1/chat/completions")
365
392
  @with_cancellation
366
393
  async def create_chat_completion(request: ChatCompletionRequest,
@@ -370,6 +397,11 @@ async def create_chat_completion(request: ChatCompletionRequest,
370
397
  return base(raw_request).create_error_response(
371
398
  message="The model does not support Chat Completions API")
372
399
 
400
+ if flag is not None:
401
+ request_id = "chatcmpl-" \
402
+ f"{handler._base_request_id(raw_request, request.request_id)}"
403
+ print(f"First received request_id: {request_id}, request: {request}")
404
+
373
405
  generator = await handler.create_chat_completion(request, raw_request)
374
406
 
375
407
  if isinstance(generator, ErrorResponse):
@@ -377,8 +409,12 @@ async def create_chat_completion(request: ChatCompletionRequest,
377
409
  status_code=generator.code)
378
410
 
379
411
  elif isinstance(generator, ChatCompletionResponse):
412
+ if flag is not None:
413
+ print(f"Received request-id:{request_id}, request:{request}, Output:{generator.model_dump()}")
380
414
  return JSONResponse(content=generator.model_dump())
381
415
 
416
+ if flag is not None:
417
+ return StreamingResponse(content=stream_generator(generator, request, request_id), media_type="text/event-stream")
382
418
  return StreamingResponse(content=generator, media_type="text/event-stream")
383
419
 
384
420
 
@@ -390,13 +426,21 @@ async def create_completion(request: CompletionRequest, raw_request: Request):
390
426
  return base(raw_request).create_error_response(
391
427
  message="The model does not support Completions API")
392
428
 
429
+ if flag is not None:
430
+ request_id = f"cmpl-{handler._base_request_id(raw_request)}"
431
+ print(f"First received request_id: {request_id}, request: {request}")
432
+
393
433
  generator = await handler.create_completion(request, raw_request)
394
434
  if isinstance(generator, ErrorResponse):
395
435
  return JSONResponse(content=generator.model_dump(),
396
436
  status_code=generator.code)
397
437
  elif isinstance(generator, CompletionResponse):
438
+ if flag is not None:
439
+ print(f"Received request-id:{request_id}, request:{request}, Output:{generator.model_dump()}")
398
440
  return JSONResponse(content=generator.model_dump())
399
-
441
+
442
+ if flag is not None:
443
+ return StreamingResponse(content=stream_generator(generator, request, request_id), media_type="text/event-stream")
400
444
  return StreamingResponse(content=generator, media_type="text/event-stream")
401
445
 
402
446
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: ipex-llm
3
- Version: 2.2.0b20250311
3
+ Version: 2.2.0b20250311.post0
4
4
  Summary: Large Language Model Develop Toolkit
5
5
  Home-page: https://github.com/intel-analytics/ipex-llm
6
6
  Author: BigDL Authors
@@ -27,7 +27,7 @@ Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine
27
27
  Requires-Dist: torch ==2.1.2+cpu ; (platform_system == "Linux") and extra == 'all'
28
28
  Requires-Dist: torch ==2.1.2 ; (platform_system == "Windows") and extra == 'all'
29
29
  Provides-Extra: cpp
30
- Requires-Dist: bigdl-core-cpp ==2.6.0b20250311 ; extra == 'cpp'
30
+ Requires-Dist: bigdl-core-cpp ==2.6.0b20250312 ; extra == 'cpp'
31
31
  Requires-Dist: setuptools ; extra == 'cpp'
32
32
  Requires-Dist: onednn-devel ==2025.0.1 ; (platform_system == "Windows") and extra == 'cpp'
33
33
  Requires-Dist: onednn ==2025.0.1 ; (platform_system == "Windows") and extra == 'cpp'
@@ -60,7 +60,7 @@ Requires-Dist: transformers ==4.40.0 ; extra == 'npu'
60
60
  Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'npu'
61
61
  Requires-Dist: torch ==2.1.2+cpu ; (platform_system == "Linux") and extra == 'npu'
62
62
  Requires-Dist: torch ==2.1.2 ; (platform_system == "Windows") and extra == 'npu'
63
- Requires-Dist: bigdl-core-npu ==2.6.0b20250311 ; (platform_system == "Windows") and extra == 'npu'
63
+ Requires-Dist: bigdl-core-npu ==2.6.0b20250312 ; (platform_system == "Windows") and extra == 'npu'
64
64
  Provides-Extra: serving
65
65
  Requires-Dist: py-cpuinfo ; extra == 'serving'
66
66
  Requires-Dist: fschat[model_worker,webui] ==0.2.36 ; extra == 'serving'
@@ -80,9 +80,9 @@ Requires-Dist: setuptools <70.0.0 ; extra == 'xpu'
80
80
  Requires-Dist: torch ==2.1.0a0 ; extra == 'xpu'
81
81
  Requires-Dist: torchvision ==0.16.0a0 ; extra == 'xpu'
82
82
  Requires-Dist: intel-extension-for-pytorch ==2.1.10+xpu ; extra == 'xpu'
83
- Requires-Dist: bigdl-core-xe-21 ==2.6.0b20250311 ; extra == 'xpu'
84
- Requires-Dist: bigdl-core-xe-batch-21 ==2.6.0b20250311 ; extra == 'xpu'
85
- Requires-Dist: bigdl-core-xe-addons-21 ==2.6.0b20250311 ; extra == 'xpu'
83
+ Requires-Dist: bigdl-core-xe-21 ==2.6.0b20250312 ; extra == 'xpu'
84
+ Requires-Dist: bigdl-core-xe-batch-21 ==2.6.0b20250312 ; extra == 'xpu'
85
+ Requires-Dist: bigdl-core-xe-addons-21 ==2.6.0b20250312 ; extra == 'xpu'
86
86
  Provides-Extra: xpu-2-1
87
87
  Requires-Dist: py-cpuinfo ; extra == 'xpu-2-1'
88
88
  Requires-Dist: protobuf ; extra == 'xpu-2-1'
@@ -97,9 +97,9 @@ Requires-Dist: setuptools <70.0.0 ; extra == 'xpu-2-1'
97
97
  Requires-Dist: torch ==2.1.0a0 ; extra == 'xpu-2-1'
98
98
  Requires-Dist: torchvision ==0.16.0a0 ; extra == 'xpu-2-1'
99
99
  Requires-Dist: intel-extension-for-pytorch ==2.1.10+xpu ; extra == 'xpu-2-1'
100
- Requires-Dist: bigdl-core-xe-21 ==2.6.0b20250311 ; extra == 'xpu-2-1'
101
- Requires-Dist: bigdl-core-xe-batch-21 ==2.6.0b20250311 ; extra == 'xpu-2-1'
102
- Requires-Dist: bigdl-core-xe-addons-21 ==2.6.0b20250311 ; extra == 'xpu-2-1'
100
+ Requires-Dist: bigdl-core-xe-21 ==2.6.0b20250312 ; extra == 'xpu-2-1'
101
+ Requires-Dist: bigdl-core-xe-batch-21 ==2.6.0b20250312 ; extra == 'xpu-2-1'
102
+ Requires-Dist: bigdl-core-xe-addons-21 ==2.6.0b20250312 ; extra == 'xpu-2-1'
103
103
  Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'xpu-2-1'
104
104
  Requires-Dist: dpcpp-cpp-rt ==2024.0.2 ; (platform_system == "Windows") and extra == 'xpu-2-1'
105
105
  Requires-Dist: mkl-dpcpp ==2024.0.0 ; (platform_system == "Windows") and extra == 'xpu-2-1'
@@ -117,10 +117,35 @@ Requires-Dist: setuptools ; extra == 'xpu-2-6'
117
117
  Requires-Dist: torch ==2.6.0+xpu ; extra == 'xpu-2-6'
118
118
  Requires-Dist: torchvision ==0.21.0+xpu ; extra == 'xpu-2-6'
119
119
  Requires-Dist: torchaudio ==2.6.0+xpu ; extra == 'xpu-2-6'
120
- Requires-Dist: bigdl-core-xe-all ==2.6.0b20250311 ; extra == 'xpu-2-6'
120
+ Requires-Dist: bigdl-core-xe-all ==2.6.0b20250312 ; extra == 'xpu-2-6'
121
121
  Requires-Dist: onednn-devel ==2025.0.1 ; extra == 'xpu-2-6'
122
122
  Requires-Dist: onednn ==2025.0.1 ; extra == 'xpu-2-6'
123
123
  Requires-Dist: dpcpp-cpp-rt ==2025.0.2 ; extra == 'xpu-2-6'
124
+ Provides-Extra: xpu-2-6-arl
125
+ Requires-Dist: py-cpuinfo ; extra == 'xpu-2-6-arl'
126
+ Requires-Dist: protobuf ; extra == 'xpu-2-6-arl'
127
+ Requires-Dist: mpmath ==1.3.0 ; extra == 'xpu-2-6-arl'
128
+ Requires-Dist: numpy ==1.26.4 ; extra == 'xpu-2-6-arl'
129
+ Requires-Dist: transformers ==4.37.0 ; extra == 'xpu-2-6-arl'
130
+ Requires-Dist: sentencepiece ; extra == 'xpu-2-6-arl'
131
+ Requires-Dist: tokenizers ==0.15.2 ; extra == 'xpu-2-6-arl'
132
+ Requires-Dist: accelerate ==0.23.0 ; extra == 'xpu-2-6-arl'
133
+ Requires-Dist: tabulate ; extra == 'xpu-2-6-arl'
134
+ Requires-Dist: setuptools ; extra == 'xpu-2-6-arl'
135
+ Requires-Dist: bigdl-core-xe-all ==2.6.0b20250312 ; extra == 'xpu-2-6-arl'
136
+ Requires-Dist: onednn-devel ==2025.0.1 ; extra == 'xpu-2-6-arl'
137
+ Requires-Dist: onednn ==2025.0.1 ; extra == 'xpu-2-6-arl'
138
+ Requires-Dist: dpcpp-cpp-rt ==2025.0.2 ; extra == 'xpu-2-6-arl'
139
+ Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'xpu-2-6-arl'
140
+ Requires-Dist: torch ==2.6.0+xpu ; (platform_system == "Linux") and extra == 'xpu-2-6-arl'
141
+ Requires-Dist: torchvision ==0.21.0+xpu ; (platform_system == "Linux") and extra == 'xpu-2-6-arl'
142
+ Requires-Dist: torchaudio ==2.6.0+xpu ; (platform_system == "Linux") and extra == 'xpu-2-6-arl'
143
+ Requires-Dist: intel-extension-for-pytorch ==2.6.10+xpu ; (platform_system == "Linux") and extra == 'xpu-2-6-arl'
144
+ Requires-Dist: oneccl-bind-pt ==2.6.0+xpu ; (platform_system == "Linux") and extra == 'xpu-2-6-arl'
145
+ Requires-Dist: torch ==2.6.0.post0+xpu ; (platform_system == "Windows") and extra == 'xpu-2-6-arl'
146
+ Requires-Dist: torchvision ==0.21.0.post0+xpu ; (platform_system == "Windows") and extra == 'xpu-2-6-arl'
147
+ Requires-Dist: torchaudio ==2.6.0.post0+xpu ; (platform_system == "Windows") and extra == 'xpu-2-6-arl'
148
+ Requires-Dist: intel-extension-for-pytorch ==2.6.10+xpu ; (platform_system == "Windows") and extra == 'xpu-2-6-arl'
124
149
  Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'xpu-2-6'
125
150
  Provides-Extra: xpu-arc
126
151
  Requires-Dist: py-cpuinfo ; extra == 'xpu-arc'
@@ -133,9 +158,9 @@ Requires-Dist: tokenizers ==0.15.2 ; extra == 'xpu-arc'
133
158
  Requires-Dist: accelerate ==0.23.0 ; extra == 'xpu-arc'
134
159
  Requires-Dist: tabulate ; extra == 'xpu-arc'
135
160
  Requires-Dist: setuptools ; extra == 'xpu-arc'
136
- Requires-Dist: bigdl-core-xe-23 ==2.6.0b20250311 ; extra == 'xpu-arc'
137
- Requires-Dist: bigdl-core-xe-batch-23 ==2.6.0b20250311 ; extra == 'xpu-arc'
138
- Requires-Dist: bigdl-core-xe-addons-23 ==2.6.0b20250311 ; extra == 'xpu-arc'
161
+ Requires-Dist: bigdl-core-xe-23 ==2.6.0b20250312 ; extra == 'xpu-arc'
162
+ Requires-Dist: bigdl-core-xe-batch-23 ==2.6.0b20250312 ; extra == 'xpu-arc'
163
+ Requires-Dist: bigdl-core-xe-addons-23 ==2.6.0b20250312 ; extra == 'xpu-arc'
139
164
  Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'xpu-arc'
140
165
  Requires-Dist: torch ==2.3.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-arc'
141
166
  Requires-Dist: torchvision ==0.18.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-arc'
@@ -156,9 +181,9 @@ Requires-Dist: tokenizers ==0.15.2 ; extra == 'xpu-arl'
156
181
  Requires-Dist: accelerate ==0.23.0 ; extra == 'xpu-arl'
157
182
  Requires-Dist: tabulate ; extra == 'xpu-arl'
158
183
  Requires-Dist: setuptools ; extra == 'xpu-arl'
159
- Requires-Dist: bigdl-core-xe-23 ==2.6.0b20250311 ; extra == 'xpu-arl'
160
- Requires-Dist: bigdl-core-xe-batch-23 ==2.6.0b20250311 ; extra == 'xpu-arl'
161
- Requires-Dist: bigdl-core-xe-addons-23 ==2.6.0b20250311 ; extra == 'xpu-arl'
184
+ Requires-Dist: bigdl-core-xe-23 ==2.6.0b20250312 ; extra == 'xpu-arl'
185
+ Requires-Dist: bigdl-core-xe-batch-23 ==2.6.0b20250312 ; extra == 'xpu-arl'
186
+ Requires-Dist: bigdl-core-xe-addons-23 ==2.6.0b20250312 ; extra == 'xpu-arl'
162
187
  Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'xpu-arl'
163
188
  Requires-Dist: torch ==2.3.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-arl'
164
189
  Requires-Dist: torchvision ==0.18.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-arl'
@@ -179,9 +204,9 @@ Requires-Dist: tokenizers ==0.15.2 ; extra == 'xpu-lnl'
179
204
  Requires-Dist: accelerate ==0.23.0 ; extra == 'xpu-lnl'
180
205
  Requires-Dist: tabulate ; extra == 'xpu-lnl'
181
206
  Requires-Dist: setuptools ; extra == 'xpu-lnl'
182
- Requires-Dist: bigdl-core-xe-23 ==2.6.0b20250311 ; extra == 'xpu-lnl'
183
- Requires-Dist: bigdl-core-xe-batch-23 ==2.6.0b20250311 ; extra == 'xpu-lnl'
184
- Requires-Dist: bigdl-core-xe-addons-23 ==2.6.0b20250311 ; extra == 'xpu-lnl'
207
+ Requires-Dist: bigdl-core-xe-23 ==2.6.0b20250312 ; extra == 'xpu-lnl'
208
+ Requires-Dist: bigdl-core-xe-batch-23 ==2.6.0b20250312 ; extra == 'xpu-lnl'
209
+ Requires-Dist: bigdl-core-xe-addons-23 ==2.6.0b20250312 ; extra == 'xpu-lnl'
185
210
  Requires-Dist: intel-openmp ; (platform_machine == "x86_64" or platform_machine == "AMD64") and extra == 'xpu-lnl'
186
211
  Requires-Dist: torch ==2.3.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-lnl'
187
212
  Requires-Dist: torchvision ==0.18.1+cxx11.abi ; (platform_system == "Linux") and extra == 'xpu-lnl'
@@ -260,13 +260,13 @@ ipex_llm/vllm/xpu/ipex_llm_wrapper.py,sha256=_CbhvBuf_KPnmLfngYKtJl5gPAHVsG2mWth
260
260
  ipex_llm/vllm/xpu/model_convert.py,sha256=pSiJlmoktCPQIGzBuDBMWiCyASqgSAQpEbqWkYe00JQ,9029
261
261
  ipex_llm/vllm/xpu/engine/__init__.py,sha256=pY_CpyuZd72fr6s32ejeKHKFW0K4vUU2rzZjWqm5YiA,783
262
262
  ipex_llm/vllm/xpu/engine/engine.py,sha256=NvCMbp0X8NVrOqbwm4FTvXOptTRLzu9jQsy37ZHnTk8,9493
263
- ipex_llm/vllm/xpu/entrypoints/openai/api_server.py,sha256=D577nxWlyoWaHXNXIEvS3ViKSSWL3XZq8D8t6izD7x4,33250
263
+ ipex_llm/vllm/xpu/entrypoints/openai/api_server.py,sha256=IjiSze9vzBCAkLu_VwIcJwuO1jyFna7DLrj6aSL7RaQ,35220
264
264
  ipex_llm/vllm/xpu/entrypoints/openai/cli_args.py,sha256=hB398yYtKauASRzevctScdbFIjiiSGMAe1bwEuIHrhY,10893
265
- ipex_llm-2.2.0b20250311.data/scripts/ipex-llm-init,sha256=fLQsT2dRL6H5bThb4GuIWotAuqoLsIxFwA-0c2qmaO8,6672
266
- ipex_llm-2.2.0b20250311.data/scripts/llm-chat,sha256=TdUnUmNapzuoe1c8IzrdVOQwWEg8IqsMSBRlOD3daZM,2249
267
- ipex_llm-2.2.0b20250311.data/scripts/llm-cli,sha256=RXGPlLElHxcKzoUxljEMBIAXbzCDysXL-Nxw-xF-7LU,2457
268
- ipex_llm-2.2.0b20250311.dist-info/METADATA,sha256=SQ5ZQxq7ojdFfBnzWfvYBfhjcCAftLdoe5x6qJg4-cI,12369
269
- ipex_llm-2.2.0b20250311.dist-info/WHEEL,sha256=PPJcBMAZibF_2GFE9NmOJGqiaSMPiNFbJd6QaJjdA6Y,109
270
- ipex_llm-2.2.0b20250311.dist-info/entry_points.txt,sha256=TiUyBB2MRmfF3ko-pyAEzqeBCRnyhu27bNOAsWPp3e8,61
271
- ipex_llm-2.2.0b20250311.dist-info/top_level.txt,sha256=CGCMHM-SyqUabU4h8RqJ2KTYckQUO3LvIWwmUQ6Qbzw,9
272
- ipex_llm-2.2.0b20250311.dist-info/RECORD,,
265
+ ipex_llm-2.2.0b20250311.post0.data/scripts/ipex-llm-init,sha256=fLQsT2dRL6H5bThb4GuIWotAuqoLsIxFwA-0c2qmaO8,6672
266
+ ipex_llm-2.2.0b20250311.post0.data/scripts/llm-chat,sha256=TdUnUmNapzuoe1c8IzrdVOQwWEg8IqsMSBRlOD3daZM,2249
267
+ ipex_llm-2.2.0b20250311.post0.data/scripts/llm-cli,sha256=RXGPlLElHxcKzoUxljEMBIAXbzCDysXL-Nxw-xF-7LU,2457
268
+ ipex_llm-2.2.0b20250311.post0.dist-info/METADATA,sha256=faWohJUzBBnTfgSd31oO-CofJpPUzQ8wxKalLA53S6s,14253
269
+ ipex_llm-2.2.0b20250311.post0.dist-info/WHEEL,sha256=PPJcBMAZibF_2GFE9NmOJGqiaSMPiNFbJd6QaJjdA6Y,109
270
+ ipex_llm-2.2.0b20250311.post0.dist-info/entry_points.txt,sha256=TiUyBB2MRmfF3ko-pyAEzqeBCRnyhu27bNOAsWPp3e8,61
271
+ ipex_llm-2.2.0b20250311.post0.dist-info/top_level.txt,sha256=CGCMHM-SyqUabU4h8RqJ2KTYckQUO3LvIWwmUQ6Qbzw,9
272
+ ipex_llm-2.2.0b20250311.post0.dist-info/RECORD,,