bigdl-core-npu 2.6.0b20241211__cp311-cp311-win_amd64.whl → 2.6.0b20241212__cp311-cp311-win_amd64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- bigdl-core-npu/include/common.h +6 -0
- bigdl-core-npu/include/npu_llm.h +4 -2
- bigdl-core-npu/npu_llm.dll +0 -0
- bigdl-core-npu/npu_llm.lib +0 -0
- {bigdl_core_npu-2.6.0b20241211.dist-info → bigdl_core_npu-2.6.0b20241212.dist-info}/METADATA +1 -1
- {bigdl_core_npu-2.6.0b20241211.dist-info → bigdl_core_npu-2.6.0b20241212.dist-info}/RECORD +10 -10
- intel_npu_acceleration_library/_version.py +1 -1
- intel_npu_acceleration_library/lib/Release/intel_npu_acceleration_library.dll +0 -0
- {bigdl_core_npu-2.6.0b20241211.dist-info → bigdl_core_npu-2.6.0b20241212.dist-info}/WHEEL +0 -0
- {bigdl_core_npu-2.6.0b20241211.dist-info → bigdl_core_npu-2.6.0b20241212.dist-info}/top_level.txt +0 -0
bigdl-core-npu/include/common.h
CHANGED
@@ -80,6 +80,12 @@ struct tokenizer_params {
|
|
80
80
|
std::vector<int32_t> eos_token_id;
|
81
81
|
};
|
82
82
|
|
83
|
+
struct npu_generation_params {
|
84
|
+
// may add more later when dealing with more cases
|
85
|
+
float repetition_penalty;
|
86
|
+
int32_t max_new_token;
|
87
|
+
};
|
88
|
+
|
83
89
|
|
84
90
|
#ifdef __cplusplus
|
85
91
|
extern "C" {
|
bigdl-core-npu/include/npu_llm.h
CHANGED
@@ -51,11 +51,13 @@ extern "C" {
|
|
51
51
|
|
52
52
|
EXPORT_API void load_config_from_file(npu_model_params &model_params, const char* model_path);
|
53
53
|
|
54
|
+
EXPORT_API void load_generation_config_from_file(npu_generation_params &generation_params, const char* model_path);
|
55
|
+
|
54
56
|
EXPORT_API std::string add_chat_template(npu_model_params model_params, std::string input_prompt);
|
55
57
|
|
56
|
-
EXPORT_API float* run_prefill(void* void_model, int32_t* embd_inp_ptr, int32_t embd_inp_size);
|
58
|
+
EXPORT_API float* run_prefill(void* void_model, int32_t* embd_inp_ptr, int32_t embd_inp_size, float repetition_penalty);
|
57
59
|
|
58
|
-
EXPORT_API float* run_decode(void* void_model, int32_t input_token);
|
60
|
+
EXPORT_API float* run_decode(void* void_model, int32_t input_token, float repetition_penalty);
|
59
61
|
|
60
62
|
EXPORT_API void run_prefill_with_logits(void* void_model, int32_t* embd_inp_ptr, int32_t embd_inp_size, float* logits, int32_t vocab_size);
|
61
63
|
|
bigdl-core-npu/npu_llm.dll
CHANGED
Binary file
|
bigdl-core-npu/npu_llm.lib
CHANGED
Binary file
|
@@ -1,10 +1,10 @@
|
|
1
1
|
bigdl-core-npu/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
2
|
-
bigdl-core-npu/npu_llm.dll,sha256=
|
3
|
-
bigdl-core-npu/npu_llm.lib,sha256=
|
4
|
-
bigdl-core-npu/include/common.h,sha256=
|
5
|
-
bigdl-core-npu/include/npu_llm.h,sha256=
|
2
|
+
bigdl-core-npu/npu_llm.dll,sha256=zGMMkS74GyzCeDMjtWGD-MVMmGkOlwns85P9SF85W4U,3923456
|
3
|
+
bigdl-core-npu/npu_llm.lib,sha256=uG0enTHg0GNdEYMN36DPEKQXuYoioueKYpKXCKR3wyk,44328
|
4
|
+
bigdl-core-npu/include/common.h,sha256=AWpPmCEAz6-oGUtq_ONHlELtOzSMqy4CBTMIppJeOII,2819
|
5
|
+
bigdl-core-npu/include/npu_llm.h,sha256=Ar35OKx1qVbT3Q8TGTx_TQa6IlwIYBpn6oSo9q-t9YM,2509
|
6
6
|
intel_npu_acceleration_library/__init__.py,sha256=ZKTIhGMDjF7P6pF-yX8KWcSXbeHWRk24AO_orsa18f8,536
|
7
|
-
intel_npu_acceleration_library/_version.py,sha256=
|
7
|
+
intel_npu_acceleration_library/_version.py,sha256=SAbcsL8DKJ2CKOwNc76MqXwyYql3QHQhTPW2Hs3xW5c,112
|
8
8
|
intel_npu_acceleration_library/compiler.py,sha256=3IdgqjamSC8MLexDBJypIeZRiWIcTFnvQSU1LPXUr7Y,6225
|
9
9
|
intel_npu_acceleration_library/device.py,sha256=9bn8eVXJa5cXIqgfLsQAdkMVtVUQABb8z0-mQik5jRg,7424
|
10
10
|
intel_npu_acceleration_library/dtypes.py,sha256=gdd06Wsc9zIZFHlauUEx4xcK9WGTn1Mu6GkuYDJeA-E,4683
|
@@ -198,7 +198,7 @@ intel_npu_acceleration_library/external/openvino/torch/__init__.py,sha256=RXLzsf
|
|
198
198
|
intel_npu_acceleration_library/functional/__init__.py,sha256=WWKwKOh6Sgovv7mKctA872TbLP98Pg5m5-MREvUmlAA,204
|
199
199
|
intel_npu_acceleration_library/functional/scaled_dot_product_attention.py,sha256=yGUcg4tDQOLuUnP1g74cl-ec8TRr2SuAMcNLlN6qLvE,1620
|
200
200
|
intel_npu_acceleration_library/lib/Release/cache.json,sha256=CyrSqZUWo0Ec4_7ydOiuKIC0Gm8AybrGdozUqUuHxBw,8840377
|
201
|
-
intel_npu_acceleration_library/lib/Release/intel_npu_acceleration_library.dll,sha256
|
201
|
+
intel_npu_acceleration_library/lib/Release/intel_npu_acceleration_library.dll,sha256=-0QqIpcxa4igeEqLkhKAUuS8kaKpr1trp7EPDjI1h0Y,339968
|
202
202
|
intel_npu_acceleration_library/lib/Release/openvino.dll,sha256=m7M119p3JBq2YYJJ2zzCaBDz6XivKK3nNykb8L1cvDU,13244768
|
203
203
|
intel_npu_acceleration_library/lib/Release/openvino_auto_batch_plugin.dll,sha256=2v_I9P3Qo0St1bQZMEZscnFOUVvgZQQ0HvQlG3HtTd0,203104
|
204
204
|
intel_npu_acceleration_library/lib/Release/openvino_auto_plugin.dll,sha256=e3Aj9CDRHN30dBEdPSk7OCWe52tWfhI4xeXgyFjuDHg,475488
|
@@ -228,7 +228,7 @@ intel_npu_acceleration_library/nn/functional.py,sha256=UfAKBc0u6RtyaMo14ldH2GpEn
|
|
228
228
|
intel_npu_acceleration_library/nn/linear.py,sha256=Q06SoGQeLaI86nA_ky2GnFC6H2Fw1zyMDILKnpYC2eo,5739
|
229
229
|
intel_npu_acceleration_library/nn/llm.py,sha256=P6dz36Yf6BHtzWcftaghC6QaMI_WeRfQwrCbO7fD6hk,15002
|
230
230
|
intel_npu_acceleration_library/nn/module.py,sha256=EYxoTq6I_YgBDgTF76GPDxHrT8SupOTDGMzQaomBeq8,12667
|
231
|
-
bigdl_core_npu-2.6.
|
232
|
-
bigdl_core_npu-2.6.
|
233
|
-
bigdl_core_npu-2.6.
|
234
|
-
bigdl_core_npu-2.6.
|
231
|
+
bigdl_core_npu-2.6.0b20241212.dist-info/METADATA,sha256=WjfT1msnAHDOr21DLxWpjCi6jS-ujbY4Q1F-yI-10pA,1541
|
232
|
+
bigdl_core_npu-2.6.0b20241212.dist-info/WHEEL,sha256=nkBcd8Ko0v5sEcSagm2-x_RVrb8gBSkTa8VFFZ0Mr1o,101
|
233
|
+
bigdl_core_npu-2.6.0b20241212.dist-info/top_level.txt,sha256=iMQZlTsFPJjlD-Y0MqZEP_9ifI0LlbNCJIOTaMoGMjk,46
|
234
|
+
bigdl_core_npu-2.6.0b20241212.dist-info/RECORD,,
|
Binary file
|
File without changes
|
{bigdl_core_npu-2.6.0b20241211.dist-info → bigdl_core_npu-2.6.0b20241212.dist-info}/top_level.txt
RENAMED
File without changes
|