bigdl-core-npu 2.6.0b20250206__cp310-cp310-win_amd64.whl → 2.6.0b20250208__cp310-cp310-win_amd64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- bigdl-core-npu/common.lib +0 -0
- bigdl-core-npu/ggml.dll +0 -0
- bigdl-core-npu/ggml.lib +0 -0
- bigdl-core-npu/include/common.h +1 -1
- bigdl-core-npu/include/llamacpp/common.h +1 -1
- bigdl-core-npu/include/llamacpp/ggml.h +11 -1
- bigdl-core-npu/include/llamacpp/llama.h +5 -0
- bigdl-core-npu/llama-cli-npu.exe +0 -0
- bigdl-core-npu/llama.dll +0 -0
- bigdl-core-npu/llama.lib +0 -0
- bigdl-core-npu/llm-cli.exe +0 -0
- bigdl-core-npu/npu_llm.dll +0 -0
- {bigdl_core_npu-2.6.0b20250206.dist-info → bigdl_core_npu-2.6.0b20250208.dist-info}/METADATA +1 -1
- {bigdl_core_npu-2.6.0b20250206.dist-info → bigdl_core_npu-2.6.0b20250208.dist-info}/RECORD +18 -17
- intel_npu_acceleration_library/_version.py +1 -1
- intel_npu_acceleration_library/lib/Release/intel_npu_acceleration_library.dll +0 -0
- {bigdl_core_npu-2.6.0b20250206.dist-info → bigdl_core_npu-2.6.0b20250208.dist-info}/WHEEL +0 -0
- {bigdl_core_npu-2.6.0b20250206.dist-info → bigdl_core_npu-2.6.0b20250208.dist-info}/top_level.txt +0 -0
bigdl-core-npu/common.lib
CHANGED
Binary file
|
bigdl-core-npu/ggml.dll
CHANGED
Binary file
|
bigdl-core-npu/ggml.lib
CHANGED
Binary file
|
bigdl-core-npu/include/common.h
CHANGED
@@ -344,7 +344,7 @@ struct gpt_params {
|
|
344
344
|
bool batched_bench_output_jsonl = false;
|
345
345
|
|
346
346
|
// npu convert
|
347
|
-
std::string low_bit = "
|
347
|
+
std::string low_bit = "Q4_0";
|
348
348
|
int32_t quantization_group_size = 0;
|
349
349
|
int32_t max_context_len = 1024;
|
350
350
|
int32_t max_prompt_len = 512;
|
@@ -2661,9 +2661,19 @@ extern "C" {
|
|
2661
2661
|
|
2662
2662
|
GGML_API void ggml_dequantize_to_fp32(struct ggml_tensor * tensor, float *y, size_t n);
|
2663
2663
|
|
2664
|
-
GGML_API void ggml_requantize_to_npu(struct ggml_tensor * tensor, float* y, const char* layer, const int weight_idx, enum gguf_npu_qtype npu_type, const char* dir_path);
|
2664
|
+
GGML_API void ggml_requantize_to_npu(struct ggml_tensor * tensor, float* y, const char* layer, const int weight_idx, enum gguf_npu_qtype npu_type, const char* dir_path, int n_splits);
|
2665
2665
|
|
2666
2666
|
GGML_API void ggml_convert_to_fp16(struct ggml_tensor * tensor, const char* layer, const int weight_idx, const char* dir_path);
|
2667
|
+
|
2668
|
+
GGML_API size_t ggml_quantize_chunk_with_splits(
|
2669
|
+
enum ggml_type type,
|
2670
|
+
const float * src,
|
2671
|
+
void * dst,
|
2672
|
+
int64_t start,
|
2673
|
+
int64_t nrows,
|
2674
|
+
int64_t n_per_row,
|
2675
|
+
const float * imatrix,
|
2676
|
+
int n_splits);
|
2667
2677
|
#ifdef __cplusplus
|
2668
2678
|
}
|
2669
2679
|
#endif
|
@@ -8,6 +8,7 @@
|
|
8
8
|
#include <stdint.h>
|
9
9
|
#include <stdio.h>
|
10
10
|
#include <stdbool.h>
|
11
|
+
#include <string>
|
11
12
|
|
12
13
|
#ifdef LLAMA_SHARED
|
13
14
|
# if defined(_WIN32) && !defined(__MINGW32__)
|
@@ -310,6 +311,8 @@ extern "C" {
|
|
310
311
|
bool use_mmap; // use mmap if possible
|
311
312
|
bool use_mlock; // force system to keep model in RAM
|
312
313
|
bool check_tensors; // validate model tensor data
|
314
|
+
std::string npu_model;
|
315
|
+
std::string qtype;
|
313
316
|
};
|
314
317
|
|
315
318
|
// NOTE: changing the default values of parameters marked as [EXPERIMENTAL] may cause crashes or incorrect results in certain configurations
|
@@ -1217,6 +1220,8 @@ extern "C" {
|
|
1217
1220
|
|
1218
1221
|
LLAMA_API void convert_gguf_to_npu_weight(llama_model* model, const char* weight_path, enum gguf_npu_qtype npu_type);
|
1219
1222
|
|
1223
|
+
LLAMA_API std::string get_npu_model_dir(llama_model * model, std::string qtype);
|
1224
|
+
|
1220
1225
|
#ifdef __cplusplus
|
1221
1226
|
}
|
1222
1227
|
#endif
|
bigdl-core-npu/llama-cli-npu.exe
CHANGED
Binary file
|
bigdl-core-npu/llama.dll
CHANGED
Binary file
|
bigdl-core-npu/llama.lib
CHANGED
Binary file
|
Binary file
|
bigdl-core-npu/npu_llm.dll
CHANGED
Binary file
|
@@ -1,23 +1,24 @@
|
|
1
1
|
bigdl-core-npu/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
2
|
-
bigdl-core-npu/common.lib,sha256=
|
3
|
-
bigdl-core-npu/ggml.dll,sha256=
|
4
|
-
bigdl-core-npu/ggml.lib,sha256=
|
5
|
-
bigdl-core-npu/llama-cli-npu.exe,sha256=
|
6
|
-
bigdl-core-npu/llama.dll,sha256=
|
7
|
-
bigdl-core-npu/llama.lib,sha256=
|
8
|
-
bigdl-core-npu/
|
2
|
+
bigdl-core-npu/common.lib,sha256=MeeiDWPtA8cw-rdDsxPDdEqOV5ZdYNwNcP6jzS8Yc5M,6645900
|
3
|
+
bigdl-core-npu/ggml.dll,sha256=qoyuaP5i1Gp0yyivaOf5DrdheOa4Lc86VvY3imSzVho,705024
|
4
|
+
bigdl-core-npu/ggml.lib,sha256=YiA6rQgJZwvwdM0bXqMHNgAigoEPozcLs7jP3dYz1nk,139880
|
5
|
+
bigdl-core-npu/llama-cli-npu.exe,sha256=8oPaOUWSlZzh54bttKjA5qRR9RivC8w5-gwRg-FjyBY,556032
|
6
|
+
bigdl-core-npu/llama.dll,sha256=ERfdyRLtgCp7QWl1mcZw2rd08NS8hL71XuWK3Syc5qI,1591808
|
7
|
+
bigdl-core-npu/llama.lib,sha256=G-H-iFwvni5O4_Lwjx2GteAE7B9kTC9pMVbM23dndC0,1515984
|
8
|
+
bigdl-core-npu/llm-cli.exe,sha256=3lNbGbrjnAAobmq8YtZj_zp4-IwF7LJMyII-Y5J_iRw,44544
|
9
|
+
bigdl-core-npu/npu_llm.dll,sha256=JihsqX2Y8QjcAyn77K_oHj2jlrligxveFddX5KO9nek,3962368
|
9
10
|
bigdl-core-npu/npu_llm.lib,sha256=nNYF-btjrT9Pzcd31kQV5BsLBSNdA_DSeyK5RnmOc9s,44524
|
10
|
-
bigdl-core-npu/include/common.h,sha256=
|
11
|
+
bigdl-core-npu/include/common.h,sha256=p5PTHTHiJlOA9lXXWH12eHf5JTvGi-mmf9GgFY7kv7E,3206
|
11
12
|
bigdl-core-npu/include/npu_llm.h,sha256=siEFqkKnZlzR9cvq7qXiAy5Z65-X14QyWEw__wsLLpA,2605
|
12
13
|
bigdl-core-npu/include/llamacpp/arg.h,sha256=XOLwSDqJsCJJgGCkOGSWcA9yGZ0eiiY7GffHdAxFYYY,3110
|
13
|
-
bigdl-core-npu/include/llamacpp/common.h,sha256=
|
14
|
+
bigdl-core-npu/include/llamacpp/common.h,sha256=pZ1DuXPcaIFui7juV0kB4-c5CW2I9BRI3Tlz8OT_bsk,25837
|
14
15
|
bigdl-core-npu/include/llamacpp/ggml-alloc.h,sha256=kiWITcUF9Q7kvGSBeCfouV59YyGDNy56VE_0fXXnWHE,3088
|
15
16
|
bigdl-core-npu/include/llamacpp/ggml-backend.h,sha256=cUJR-AC7hUbIxukKixR9vUSV38gmp-9eoViaBG8lyio,14347
|
16
|
-
bigdl-core-npu/include/llamacpp/ggml.h,sha256=
|
17
|
-
bigdl-core-npu/include/llamacpp/llama.h,sha256=
|
17
|
+
bigdl-core-npu/include/llamacpp/ggml.h,sha256=liFnnzpemuVWZ3lg7oTCoRIPCo2taBdA8cwMY6OV9FM,106000
|
18
|
+
bigdl-core-npu/include/llamacpp/llama.h,sha256=OCMREKob7-NDw3ia9INyJ13bVKUT00gSp9JIayY5FnM,61134
|
18
19
|
bigdl-core-npu/include/llamacpp/log.h,sha256=D6UiundA26yZOh3ci828u5U4ZaBxWb9CwSNu_3dt6CA,4295
|
19
20
|
intel_npu_acceleration_library/__init__.py,sha256=ZKTIhGMDjF7P6pF-yX8KWcSXbeHWRk24AO_orsa18f8,536
|
20
|
-
intel_npu_acceleration_library/_version.py,sha256=
|
21
|
+
intel_npu_acceleration_library/_version.py,sha256=4pFkd6f20XRFeIEE7uRcKsrNSMU_fJedu5xEWYA3v6k,112
|
21
22
|
intel_npu_acceleration_library/compiler.py,sha256=3IdgqjamSC8MLexDBJypIeZRiWIcTFnvQSU1LPXUr7Y,6225
|
22
23
|
intel_npu_acceleration_library/device.py,sha256=9bn8eVXJa5cXIqgfLsQAdkMVtVUQABb8z0-mQik5jRg,7424
|
23
24
|
intel_npu_acceleration_library/dtypes.py,sha256=gdd06Wsc9zIZFHlauUEx4xcK9WGTn1Mu6GkuYDJeA-E,4683
|
@@ -234,7 +235,7 @@ intel_npu_acceleration_library/external/openvino/torch/__init__.py,sha256=RXLzsf
|
|
234
235
|
intel_npu_acceleration_library/functional/__init__.py,sha256=WWKwKOh6Sgovv7mKctA872TbLP98Pg5m5-MREvUmlAA,204
|
235
236
|
intel_npu_acceleration_library/functional/scaled_dot_product_attention.py,sha256=yGUcg4tDQOLuUnP1g74cl-ec8TRr2SuAMcNLlN6qLvE,1620
|
236
237
|
intel_npu_acceleration_library/lib/Release/cache.json,sha256=CyrSqZUWo0Ec4_7ydOiuKIC0Gm8AybrGdozUqUuHxBw,8840377
|
237
|
-
intel_npu_acceleration_library/lib/Release/intel_npu_acceleration_library.dll,sha256=
|
238
|
+
intel_npu_acceleration_library/lib/Release/intel_npu_acceleration_library.dll,sha256=eXhnETU-SufRnGBOfeMnYX4tEYSMiNA7uvXDGczHeZc,341504
|
238
239
|
intel_npu_acceleration_library/lib/Release/openvino.dll,sha256=m7M119p3JBq2YYJJ2zzCaBDz6XivKK3nNykb8L1cvDU,13244768
|
239
240
|
intel_npu_acceleration_library/lib/Release/openvino_auto_batch_plugin.dll,sha256=2v_I9P3Qo0St1bQZMEZscnFOUVvgZQQ0HvQlG3HtTd0,203104
|
240
241
|
intel_npu_acceleration_library/lib/Release/openvino_auto_plugin.dll,sha256=e3Aj9CDRHN30dBEdPSk7OCWe52tWfhI4xeXgyFjuDHg,475488
|
@@ -264,7 +265,7 @@ intel_npu_acceleration_library/nn/functional.py,sha256=UfAKBc0u6RtyaMo14ldH2GpEn
|
|
264
265
|
intel_npu_acceleration_library/nn/linear.py,sha256=Q06SoGQeLaI86nA_ky2GnFC6H2Fw1zyMDILKnpYC2eo,5739
|
265
266
|
intel_npu_acceleration_library/nn/llm.py,sha256=P6dz36Yf6BHtzWcftaghC6QaMI_WeRfQwrCbO7fD6hk,15002
|
266
267
|
intel_npu_acceleration_library/nn/module.py,sha256=EYxoTq6I_YgBDgTF76GPDxHrT8SupOTDGMzQaomBeq8,12667
|
267
|
-
bigdl_core_npu-2.6.
|
268
|
-
bigdl_core_npu-2.6.
|
269
|
-
bigdl_core_npu-2.6.
|
270
|
-
bigdl_core_npu-2.6.
|
268
|
+
bigdl_core_npu-2.6.0b20250208.dist-info/METADATA,sha256=0eKBbcpupCbACu_wuUmjO8kgF0Uj0-C39YnxzYKopAI,1762
|
269
|
+
bigdl_core_npu-2.6.0b20250208.dist-info/WHEEL,sha256=rzGfZgUcGeKSgIHGYMuqg4xE4VPHxnaldXH6BG0zjVk,101
|
270
|
+
bigdl_core_npu-2.6.0b20250208.dist-info/top_level.txt,sha256=iMQZlTsFPJjlD-Y0MqZEP_9ifI0LlbNCJIOTaMoGMjk,46
|
271
|
+
bigdl_core_npu-2.6.0b20250208.dist-info/RECORD,,
|
Binary file
|
File without changes
|
{bigdl_core_npu-2.6.0b20250206.dist-info → bigdl_core_npu-2.6.0b20250208.dist-info}/top_level.txt
RENAMED
File without changes
|