bigdl-core-npu 2.6.0b20241127__cp310-cp310-win_amd64.whl → 2.6.0b20241129__cp310-cp310-win_amd64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- bigdl-core-npu/include/common.h +1 -1
- bigdl-core-npu/include/npu_llm.h +8 -4
- bigdl-core-npu/npu_llm.dll +0 -0
- bigdl-core-npu/npu_llm.lib +0 -0
- {bigdl_core_npu-2.6.0b20241127.dist-info → bigdl_core_npu-2.6.0b20241129.dist-info}/METADATA +1 -1
- {bigdl_core_npu-2.6.0b20241127.dist-info → bigdl_core_npu-2.6.0b20241129.dist-info}/RECORD +10 -10
- intel_npu_acceleration_library/_version.py +1 -1
- intel_npu_acceleration_library/lib/Release/intel_npu_acceleration_library.dll +0 -0
- {bigdl_core_npu-2.6.0b20241127.dist-info → bigdl_core_npu-2.6.0b20241129.dist-info}/WHEEL +0 -0
- {bigdl_core_npu-2.6.0b20241127.dist-info → bigdl_core_npu-2.6.0b20241129.dist-info}/top_level.txt +0 -0
bigdl-core-npu/include/common.h
CHANGED
@@ -29,7 +29,7 @@
|
|
29
29
|
|
30
30
|
struct common_params {
|
31
31
|
int32_t n_predict = -1; // new tokens to predict
|
32
|
-
|
32
|
+
char* model = ""; // model path // NOLINT
|
33
33
|
std::string prompt = ""; // NOLINT
|
34
34
|
std::string prompt_file = ""; // store the external prompt file name // NOLINT
|
35
35
|
|
bigdl-core-npu/include/npu_llm.h
CHANGED
@@ -47,15 +47,19 @@ extern "C" {
|
|
47
47
|
|
48
48
|
EXPORT_API std::string llm_decode(vector<int32_t> tokens);
|
49
49
|
|
50
|
-
EXPORT_API
|
50
|
+
EXPORT_API void* load_model_from_file(const char* model_path);
|
51
|
+
|
52
|
+
EXPORT_API void load_config_from_file(npu_model_params &model_params, const char* model_path);
|
51
53
|
|
52
54
|
EXPORT_API std::string add_chat_template(npu_model_params model_params, std::string input_prompt);
|
53
55
|
|
54
|
-
EXPORT_API float* run_prefill(
|
56
|
+
EXPORT_API float* run_prefill(void* void_model, int32_t* embd_inp_ptr, int32_t embd_inp_size);
|
57
|
+
|
58
|
+
EXPORT_API float* run_decode(void* void_model, int32_t input_token);
|
55
59
|
|
56
|
-
EXPORT_API
|
60
|
+
EXPORT_API int32_t llm_sample_token(float* logits, bool greedy_search, int32_t vocab_size);
|
57
61
|
|
58
|
-
EXPORT_API
|
62
|
+
EXPORT_API void reset(void* void_model);
|
59
63
|
|
60
64
|
#ifdef __cplusplus
|
61
65
|
}
|
bigdl-core-npu/npu_llm.dll
CHANGED
Binary file
|
bigdl-core-npu/npu_llm.lib
CHANGED
Binary file
|
@@ -1,10 +1,10 @@
|
|
1
1
|
bigdl-core-npu/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
2
|
-
bigdl-core-npu/npu_llm.dll,sha256=
|
3
|
-
bigdl-core-npu/npu_llm.lib,sha256=
|
4
|
-
bigdl-core-npu/include/common.h,sha256=
|
5
|
-
bigdl-core-npu/include/npu_llm.h,sha256=
|
2
|
+
bigdl-core-npu/npu_llm.dll,sha256=s5_86uZkuvx96pXFWDcmdmARdaKgnLz3K-O-_xjAz-g,3902464
|
3
|
+
bigdl-core-npu/npu_llm.lib,sha256=VuvMfKbbAM7BTiDyFBCK8PGqmfdEOVJVtNQOtdTJI_k,43370
|
4
|
+
bigdl-core-npu/include/common.h,sha256=2qMhyPMYet0BzIQ5m_wRXye_A8ileRpnsxp55TvcThE,2632
|
5
|
+
bigdl-core-npu/include/npu_llm.h,sha256=aYJxEHcrNsHZdgjtom7pILZtB0eBONB9H-azgQDmo38,1903
|
6
6
|
intel_npu_acceleration_library/__init__.py,sha256=ZKTIhGMDjF7P6pF-yX8KWcSXbeHWRk24AO_orsa18f8,536
|
7
|
-
intel_npu_acceleration_library/_version.py,sha256=
|
7
|
+
intel_npu_acceleration_library/_version.py,sha256=0JBHmQg23E48IvzuouLicFI6jfbU4iioNTqm_rvIxx4,112
|
8
8
|
intel_npu_acceleration_library/compiler.py,sha256=3IdgqjamSC8MLexDBJypIeZRiWIcTFnvQSU1LPXUr7Y,6225
|
9
9
|
intel_npu_acceleration_library/device.py,sha256=9bn8eVXJa5cXIqgfLsQAdkMVtVUQABb8z0-mQik5jRg,7424
|
10
10
|
intel_npu_acceleration_library/dtypes.py,sha256=gdd06Wsc9zIZFHlauUEx4xcK9WGTn1Mu6GkuYDJeA-E,4683
|
@@ -198,7 +198,7 @@ intel_npu_acceleration_library/external/openvino/torch/__init__.py,sha256=RXLzsf
|
|
198
198
|
intel_npu_acceleration_library/functional/__init__.py,sha256=WWKwKOh6Sgovv7mKctA872TbLP98Pg5m5-MREvUmlAA,204
|
199
199
|
intel_npu_acceleration_library/functional/scaled_dot_product_attention.py,sha256=yGUcg4tDQOLuUnP1g74cl-ec8TRr2SuAMcNLlN6qLvE,1620
|
200
200
|
intel_npu_acceleration_library/lib/Release/cache.json,sha256=CyrSqZUWo0Ec4_7ydOiuKIC0Gm8AybrGdozUqUuHxBw,8840377
|
201
|
-
intel_npu_acceleration_library/lib/Release/intel_npu_acceleration_library.dll,sha256=
|
201
|
+
intel_npu_acceleration_library/lib/Release/intel_npu_acceleration_library.dll,sha256=8wLWfRLZbjsSTUrqy8_h40NPzvz9BS-_GrX1zMMs-UQ,333312
|
202
202
|
intel_npu_acceleration_library/lib/Release/openvino.dll,sha256=m7M119p3JBq2YYJJ2zzCaBDz6XivKK3nNykb8L1cvDU,13244768
|
203
203
|
intel_npu_acceleration_library/lib/Release/openvino_auto_batch_plugin.dll,sha256=2v_I9P3Qo0St1bQZMEZscnFOUVvgZQQ0HvQlG3HtTd0,203104
|
204
204
|
intel_npu_acceleration_library/lib/Release/openvino_auto_plugin.dll,sha256=e3Aj9CDRHN30dBEdPSk7OCWe52tWfhI4xeXgyFjuDHg,475488
|
@@ -228,7 +228,7 @@ intel_npu_acceleration_library/nn/functional.py,sha256=UfAKBc0u6RtyaMo14ldH2GpEn
|
|
228
228
|
intel_npu_acceleration_library/nn/linear.py,sha256=Q06SoGQeLaI86nA_ky2GnFC6H2Fw1zyMDILKnpYC2eo,5739
|
229
229
|
intel_npu_acceleration_library/nn/llm.py,sha256=P6dz36Yf6BHtzWcftaghC6QaMI_WeRfQwrCbO7fD6hk,15002
|
230
230
|
intel_npu_acceleration_library/nn/module.py,sha256=EYxoTq6I_YgBDgTF76GPDxHrT8SupOTDGMzQaomBeq8,12667
|
231
|
-
bigdl_core_npu-2.6.
|
232
|
-
bigdl_core_npu-2.6.
|
233
|
-
bigdl_core_npu-2.6.
|
234
|
-
bigdl_core_npu-2.6.
|
231
|
+
bigdl_core_npu-2.6.0b20241129.dist-info/METADATA,sha256=aZJgC5QEtfWfCP6WxG_MFUTSPkOs60A6zF6ayPGdThs,1541
|
232
|
+
bigdl_core_npu-2.6.0b20241129.dist-info/WHEEL,sha256=tcd-HDpskugT8GYYKyyid0lOlzoZtZdWwcrj5ormtfo,101
|
233
|
+
bigdl_core_npu-2.6.0b20241129.dist-info/top_level.txt,sha256=iMQZlTsFPJjlD-Y0MqZEP_9ifI0LlbNCJIOTaMoGMjk,46
|
234
|
+
bigdl_core_npu-2.6.0b20241129.dist-info/RECORD,,
|
Binary file
|
File without changes
|
{bigdl_core_npu-2.6.0b20241127.dist-info → bigdl_core_npu-2.6.0b20241129.dist-info}/top_level.txt
RENAMED
File without changes
|