bigdl-core-cpp 2.5.0b20240818__py3-none-manylinux2010_x86_64.whl → 2.5.0b20240820__py3-none-manylinux2010_x86_64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- bigdl/cpp/convert-hf-to-gguf.py +28 -1
- bigdl/cpp/libs/baby-llama +0 -0
- bigdl/cpp/libs/batched +0 -0
- bigdl/cpp/libs/batched-bench +0 -0
- bigdl/cpp/libs/benchmark +0 -0
- bigdl/cpp/libs/embedding +0 -0
- bigdl/cpp/libs/gguf +0 -0
- bigdl/cpp/libs/imatrix +0 -0
- bigdl/cpp/libs/llama-bench +0 -0
- bigdl/cpp/libs/llava-cli +0 -0
- bigdl/cpp/libs/lookahead +0 -0
- bigdl/cpp/libs/lookup +0 -0
- bigdl/cpp/libs/ls-sycl-device +0 -0
- bigdl/cpp/libs/main +0 -0
- bigdl/cpp/libs/ollama +0 -0
- bigdl/cpp/libs/perplexity +0 -0
- bigdl/cpp/libs/quantize +0 -0
- bigdl/cpp/libs/quantize-stats +0 -0
- bigdl/cpp/libs/save-load-state +0 -0
- bigdl/cpp/libs/server +0 -0
- bigdl/cpp/libs/speculative +0 -0
- bigdl/cpp/libs/tokenize +0 -0
- {bigdl_core_cpp-2.5.0b20240818.dist-info → bigdl_core_cpp-2.5.0b20240820.dist-info}/METADATA +1 -1
- bigdl_core_cpp-2.5.0b20240820.dist-info/RECORD +45 -0
- bigdl_core_cpp-2.5.0b20240818.dist-info/RECORD +0 -45
- {bigdl_core_cpp-2.5.0b20240818.data → bigdl_core_cpp-2.5.0b20240820.data}/scripts/init-llama-cpp +0 -0
- {bigdl_core_cpp-2.5.0b20240818.data → bigdl_core_cpp-2.5.0b20240820.data}/scripts/init-ollama +0 -0
- {bigdl_core_cpp-2.5.0b20240818.dist-info → bigdl_core_cpp-2.5.0b20240820.dist-info}/WHEEL +0 -0
- {bigdl_core_cpp-2.5.0b20240818.dist-info → bigdl_core_cpp-2.5.0b20240820.dist-info}/top_level.txt +0 -0
bigdl/cpp/convert-hf-to-gguf.py
CHANGED
@@ -1570,6 +1570,33 @@ class LlamaModel(Model):
|
|
1570
1570
|
return [(self.map_tensor_name(name), data_torch)]
|
1571
1571
|
|
1572
1572
|
def prepare_tensors(self):
|
1573
|
+
if rope_scaling := self.find_hparam(["rope_scaling"], optional=True):
|
1574
|
+
if rope_scaling.get("rope_type", '').lower() == "llama3":
|
1575
|
+
base = self.hparams.get("rope_theta", 10000.0)
|
1576
|
+
dim = self.hparams["hidden_size"] // self.hparams["num_attention_heads"]
|
1577
|
+
freqs = 1.0 / (base ** (torch.arange(0, dim, 2, dtype=torch.float32) / dim))
|
1578
|
+
factor = rope_scaling.get("factor", 8.0)
|
1579
|
+
low_freq_factor = rope_scaling.get("low_freq_factor", 1.0)
|
1580
|
+
high_freq_factor = rope_scaling.get("high_freq_factor", 4.0)
|
1581
|
+
old_context_len = self.hparams.get("original_max_position_embeddings", 8192)
|
1582
|
+
|
1583
|
+
low_freq_wavelen = old_context_len / low_freq_factor
|
1584
|
+
high_freq_wavelen = old_context_len / high_freq_factor
|
1585
|
+
assert low_freq_wavelen != high_freq_wavelen
|
1586
|
+
|
1587
|
+
rope_factors = []
|
1588
|
+
for freq in freqs:
|
1589
|
+
wavelen = 2 * math.pi / freq
|
1590
|
+
if wavelen < high_freq_wavelen:
|
1591
|
+
rope_factors.append(1)
|
1592
|
+
elif wavelen > low_freq_wavelen:
|
1593
|
+
rope_factors.append(factor)
|
1594
|
+
else:
|
1595
|
+
smooth = (old_context_len / wavelen - low_freq_factor) / (high_freq_factor - low_freq_factor)
|
1596
|
+
rope_factors.append(1 / ((1 - smooth) / factor + smooth))
|
1597
|
+
|
1598
|
+
self.gguf_writer.add_tensor(self.format_tensor_name(gguf.MODEL_TENSOR.ROPE_FREQS), np.array(rope_factors, dtype=np.float32))
|
1599
|
+
|
1573
1600
|
super().prepare_tensors()
|
1574
1601
|
|
1575
1602
|
if self._experts is not None:
|
@@ -3686,4 +3713,4 @@ def main() -> None:
|
|
3686
3713
|
|
3687
3714
|
|
3688
3715
|
if __name__ == '__main__':
|
3689
|
-
main()
|
3716
|
+
main()
|
bigdl/cpp/libs/baby-llama
CHANGED
Binary file
|
bigdl/cpp/libs/batched
CHANGED
Binary file
|
bigdl/cpp/libs/batched-bench
CHANGED
Binary file
|
bigdl/cpp/libs/benchmark
CHANGED
Binary file
|
bigdl/cpp/libs/embedding
CHANGED
Binary file
|
bigdl/cpp/libs/gguf
CHANGED
Binary file
|
bigdl/cpp/libs/imatrix
CHANGED
Binary file
|
bigdl/cpp/libs/llama-bench
CHANGED
Binary file
|
bigdl/cpp/libs/llava-cli
CHANGED
Binary file
|
bigdl/cpp/libs/lookahead
CHANGED
Binary file
|
bigdl/cpp/libs/lookup
CHANGED
Binary file
|
bigdl/cpp/libs/ls-sycl-device
CHANGED
Binary file
|
bigdl/cpp/libs/main
CHANGED
Binary file
|
bigdl/cpp/libs/ollama
CHANGED
Binary file
|
bigdl/cpp/libs/perplexity
CHANGED
Binary file
|
bigdl/cpp/libs/quantize
CHANGED
Binary file
|
bigdl/cpp/libs/quantize-stats
CHANGED
Binary file
|
bigdl/cpp/libs/save-load-state
CHANGED
Binary file
|
bigdl/cpp/libs/server
CHANGED
Binary file
|
bigdl/cpp/libs/speculative
CHANGED
Binary file
|
bigdl/cpp/libs/tokenize
CHANGED
Binary file
|
@@ -0,0 +1,45 @@
|
|
1
|
+
bigdl/cpp/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
2
|
+
bigdl/cpp/convert-hf-to-gguf.py,sha256=ci596u_GY7MDZrPeUGJ3TnYYzdZ2_1e0JT-nLeNpps8,168262
|
3
|
+
bigdl/cpp/convert.py,sha256=XMMcpfWHwEAAWzwLXe9mmJTU7cMvcyw8g2BFctfZnvI,69417
|
4
|
+
bigdl/cpp/cli/init-llama-cpp,sha256=qpIwMQc2Vb11fmovXFJKefp5iD1tQMfL8Ma7Y3Ebguk,400
|
5
|
+
bigdl/cpp/cli/init-ollama,sha256=5eg4DsWg87iysFRh7leawr6H47F_sHydwL5we6fUG6o,193
|
6
|
+
bigdl/cpp/gguf-py/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
7
|
+
bigdl/cpp/gguf-py/gguf/__init__.py,sha256=LUfJeRbrLY6TgwI0rLw_qo8klu7GgYB8Ycu8H4V0eb8,218
|
8
|
+
bigdl/cpp/gguf-py/gguf/constants.py,sha256=WRloarpYU4sc0tIi8aDgIh6xb6Ox0CPLCiPa9Yzzm2Q,46902
|
9
|
+
bigdl/cpp/gguf-py/gguf/gguf.py,sha256=MzR6GNwyrWBN3w-o995FY0qX8U3J9Mbinu9HAMEjx8g,477
|
10
|
+
bigdl/cpp/gguf-py/gguf/gguf_reader.py,sha256=5yv15RSKLfz9ViQd2e-vQxzXEdCGqgJfGfoBbzPYTHw,12364
|
11
|
+
bigdl/cpp/gguf-py/gguf/gguf_writer.py,sha256=HqxGAplbhGDgn9bELLFFh3Nf15Gg16BOTVvhOMKe6GM,34612
|
12
|
+
bigdl/cpp/gguf-py/gguf/lazy.py,sha256=yMcMTIrlwpQrX9m8YSRdvyHsNupHZMSj1RsjAAPrxqE,8527
|
13
|
+
bigdl/cpp/gguf-py/gguf/metadata.py,sha256=HNu6fzuLLSzQ_K_xJkKqtT5Tni3kGESj67BZ2uPNajg,24851
|
14
|
+
bigdl/cpp/gguf-py/gguf/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
15
|
+
bigdl/cpp/gguf-py/gguf/quants.py,sha256=dI6JsSpaSzfdz7OwfqH1kvK98M_Ax8d6NMNYY5pyoQM,4354
|
16
|
+
bigdl/cpp/gguf-py/gguf/tensor_mapping.py,sha256=1tNoM-XXvD8JaStxt39HBRe_obCWawHfTFVCWXRe9Zk,30147
|
17
|
+
bigdl/cpp/gguf-py/gguf/utility.py,sha256=xEIfT3CphqAyI56A5XZQDMti2XGG5k6kxm5bjf_Vn-E,2933
|
18
|
+
bigdl/cpp/gguf-py/gguf/vocab.py,sha256=vsRrPQ6RafirhBmMp9h3YGZh_tqEjeg7S2hiLvMv7Ys,6847
|
19
|
+
bigdl/cpp/libs/baby-llama,sha256=u5ibSMXHCYc2uIqsPtTFL_JKOFmTBXRxY2yCWkbp4Ic,14319136
|
20
|
+
bigdl/cpp/libs/batched,sha256=OugBdAdLzSLhbzMnltk3xZqsDM8xnkQU5dvix3pBPcA,14243704
|
21
|
+
bigdl/cpp/libs/batched-bench,sha256=Z0z-USL1rvw1iKDGMnFdetYCTmZvk-T_8g386b_bpLA,14243864
|
22
|
+
bigdl/cpp/libs/benchmark,sha256=GEtYJQCxe8aniNOzxFP8RXdENg5VRkJvpFJ8s_jhoJU,1452712
|
23
|
+
bigdl/cpp/libs/embedding,sha256=VBP6-wea7RRNMgIoferFs08aKiyjbBV31h95EswkePk,14239752
|
24
|
+
bigdl/cpp/libs/gguf,sha256=TfHkBvibkVzp6IVjHeyINMr9FJkDMbx-kc_jHRSOoLI,12483008
|
25
|
+
bigdl/cpp/libs/imatrix,sha256=Werf4flSXxriskdr-rZp95PINBsC_8OUumacIDHSMhs,14267608
|
26
|
+
bigdl/cpp/libs/llama-bench,sha256=6rCmJO7ddWjdOu59LAGTzmdAMePgAleU9V6LncV0o-E,14333248
|
27
|
+
bigdl/cpp/libs/llava-cli,sha256=g5TIcfjV0tX7OwMJm1bTEQQVmqKyv872m4t-SHmojiY,14557832
|
28
|
+
bigdl/cpp/libs/lookahead,sha256=0pRIwO9QLbDZiryzljR6AwvHs320wS6n6_Z5NvfphSE,14252072
|
29
|
+
bigdl/cpp/libs/lookup,sha256=2nwJhdR0ej86-m1tcWIm1aJL8wuVx55IlidEzg5xEBQ,14271856
|
30
|
+
bigdl/cpp/libs/ls-sycl-device,sha256=o5dVh3SI1dEgaU_L9euiEMqmkt51RNQ6nk2inKSOJmI,12478752
|
31
|
+
bigdl/cpp/libs/main,sha256=oQJPS60tjFuxdY_hrseOpVGO_tnWhJFrTqyVSn4cLlE,14299192
|
32
|
+
bigdl/cpp/libs/ollama,sha256=7hw1hFmbRCLDJReMFybHE5OXoqRHwqpJgflKFl3-RH8,47374520
|
33
|
+
bigdl/cpp/libs/perplexity,sha256=Tb6AP9w1K-bBmZDQl7jTo1p8HbBTElMWv6oWasWqlxs,14340696
|
34
|
+
bigdl/cpp/libs/quantize,sha256=Vuk-3RYNvVt7FKqhx8OVtErQEH2wOLhXJlMbBpkabkI,14265984
|
35
|
+
bigdl/cpp/libs/quantize-stats,sha256=P5bGwOKJlLD2fWHU6VM5F9xMDuGVaNvja3JZAIXYRqk,13780224
|
36
|
+
bigdl/cpp/libs/save-load-state,sha256=zBR2iKN28tQyd038Qj-NotfAn0BZAWhQqgjfgNa8UK4,14239880
|
37
|
+
bigdl/cpp/libs/server,sha256=4d5gERJu7qIrb8kONTKLGAnLeN9NptL4MUjdVQpzlJo,15097272
|
38
|
+
bigdl/cpp/libs/speculative,sha256=2OZezaJeae0__HTXf6oy8ep3hFycpImRfxgYOneYS9g,14278112
|
39
|
+
bigdl/cpp/libs/tokenize,sha256=KDYXYerowPEau6QXkTy8gOFs7O21Cnbvjs6s8-f1n4c,14239800
|
40
|
+
bigdl_core_cpp-2.5.0b20240820.data/scripts/init-llama-cpp,sha256=qpIwMQc2Vb11fmovXFJKefp5iD1tQMfL8Ma7Y3Ebguk,400
|
41
|
+
bigdl_core_cpp-2.5.0b20240820.data/scripts/init-ollama,sha256=5eg4DsWg87iysFRh7leawr6H47F_sHydwL5we6fUG6o,193
|
42
|
+
bigdl_core_cpp-2.5.0b20240820.dist-info/METADATA,sha256=bSz40OvUMWpyVy-RJbbzAjIv7qZm0VnDNaxx5eSZ8Eg,643
|
43
|
+
bigdl_core_cpp-2.5.0b20240820.dist-info/WHEEL,sha256=LP9LuSkp9EkkS3GaxGDqD2GVQk9RkMkUIxzcmUzigkU,108
|
44
|
+
bigdl_core_cpp-2.5.0b20240820.dist-info/top_level.txt,sha256=iGuLfZARD_qANcIMfy0tbbrC3EtCg6BSiH8icc3dLWs,6
|
45
|
+
bigdl_core_cpp-2.5.0b20240820.dist-info/RECORD,,
|
@@ -1,45 +0,0 @@
|
|
1
|
-
bigdl/cpp/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
2
|
-
bigdl/cpp/convert-hf-to-gguf.py,sha256=1wAaTiqtAsnA_4k10TCzDSp4KTZ_mldv6pY47z5gg7M,166672
|
3
|
-
bigdl/cpp/convert.py,sha256=XMMcpfWHwEAAWzwLXe9mmJTU7cMvcyw8g2BFctfZnvI,69417
|
4
|
-
bigdl/cpp/cli/init-llama-cpp,sha256=qpIwMQc2Vb11fmovXFJKefp5iD1tQMfL8Ma7Y3Ebguk,400
|
5
|
-
bigdl/cpp/cli/init-ollama,sha256=5eg4DsWg87iysFRh7leawr6H47F_sHydwL5we6fUG6o,193
|
6
|
-
bigdl/cpp/gguf-py/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
7
|
-
bigdl/cpp/gguf-py/gguf/__init__.py,sha256=LUfJeRbrLY6TgwI0rLw_qo8klu7GgYB8Ycu8H4V0eb8,218
|
8
|
-
bigdl/cpp/gguf-py/gguf/constants.py,sha256=WRloarpYU4sc0tIi8aDgIh6xb6Ox0CPLCiPa9Yzzm2Q,46902
|
9
|
-
bigdl/cpp/gguf-py/gguf/gguf.py,sha256=MzR6GNwyrWBN3w-o995FY0qX8U3J9Mbinu9HAMEjx8g,477
|
10
|
-
bigdl/cpp/gguf-py/gguf/gguf_reader.py,sha256=5yv15RSKLfz9ViQd2e-vQxzXEdCGqgJfGfoBbzPYTHw,12364
|
11
|
-
bigdl/cpp/gguf-py/gguf/gguf_writer.py,sha256=HqxGAplbhGDgn9bELLFFh3Nf15Gg16BOTVvhOMKe6GM,34612
|
12
|
-
bigdl/cpp/gguf-py/gguf/lazy.py,sha256=yMcMTIrlwpQrX9m8YSRdvyHsNupHZMSj1RsjAAPrxqE,8527
|
13
|
-
bigdl/cpp/gguf-py/gguf/metadata.py,sha256=HNu6fzuLLSzQ_K_xJkKqtT5Tni3kGESj67BZ2uPNajg,24851
|
14
|
-
bigdl/cpp/gguf-py/gguf/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
15
|
-
bigdl/cpp/gguf-py/gguf/quants.py,sha256=dI6JsSpaSzfdz7OwfqH1kvK98M_Ax8d6NMNYY5pyoQM,4354
|
16
|
-
bigdl/cpp/gguf-py/gguf/tensor_mapping.py,sha256=1tNoM-XXvD8JaStxt39HBRe_obCWawHfTFVCWXRe9Zk,30147
|
17
|
-
bigdl/cpp/gguf-py/gguf/utility.py,sha256=xEIfT3CphqAyI56A5XZQDMti2XGG5k6kxm5bjf_Vn-E,2933
|
18
|
-
bigdl/cpp/gguf-py/gguf/vocab.py,sha256=vsRrPQ6RafirhBmMp9h3YGZh_tqEjeg7S2hiLvMv7Ys,6847
|
19
|
-
bigdl/cpp/libs/baby-llama,sha256=QmIJJJGP4U67Wv53jCoYZ9K5g8274o1xGnVRcEVv-J8,14319136
|
20
|
-
bigdl/cpp/libs/batched,sha256=CKSDgeHKKPOW4XL-FaUZ4mwfeC1yxs7UH7OtdL3ppB0,14239608
|
21
|
-
bigdl/cpp/libs/batched-bench,sha256=w5v59iFWf7oXGSV8BxkhgnFFpp0xTQOUe0u5GcwNq_4,14243864
|
22
|
-
bigdl/cpp/libs/benchmark,sha256=xPE6tU_r0tntVYLIYWlR4BNyrmC7bqiulRNLX4ICl-0,1452712
|
23
|
-
bigdl/cpp/libs/embedding,sha256=iQcvBMHBhJN00YCmEvUsU3lF3as4SEIYP8H6DapaG9g,14239752
|
24
|
-
bigdl/cpp/libs/gguf,sha256=MyC23QGbnIPHNL1YRNqKlRw3KXiyWheq-xsrsmss2Ew,12483008
|
25
|
-
bigdl/cpp/libs/imatrix,sha256=XK46doyLDeYNodB2R2wUmyumXDCELebGcqWZLXPr7Fg,14267608
|
26
|
-
bigdl/cpp/libs/llama-bench,sha256=jDc6f1ydLVr3gj9DT9dOeYC3LkSZoEOpp_3tu2LH7sw,14333248
|
27
|
-
bigdl/cpp/libs/llava-cli,sha256=2oDDOXd50FyhoFyZtfEt8lV25KI0D6vptMMLVNN8z5Q,14557832
|
28
|
-
bigdl/cpp/libs/lookahead,sha256=KK9PJ_81kq76j_yNqdgCgtNcLVSVouF6onRrslT4Arg,14252072
|
29
|
-
bigdl/cpp/libs/lookup,sha256=igthfHlx4cUXQuIWCMaeUolcV9ilWWuTr3y0M2RHyiI,14271856
|
30
|
-
bigdl/cpp/libs/ls-sycl-device,sha256=UtoLLkcRSXWZMDIZs77PAz80_nn19JjSpOZDfMpWZj0,12478752
|
31
|
-
bigdl/cpp/libs/main,sha256=h8e9VBzysX0EWA0OQ9Z3rB5Zu6rjaX5GAaoAgj1nAFc,14299192
|
32
|
-
bigdl/cpp/libs/ollama,sha256=6CKRaRDw6g9uzO6l5oJKBBsrccqFugw3eJQY20PwdtQ,47375392
|
33
|
-
bigdl/cpp/libs/perplexity,sha256=a8eRfIMVI0inrZDWDhxVGfM3L3Yj4ebMlhDbnAbQ4ZI,14340696
|
34
|
-
bigdl/cpp/libs/quantize,sha256=RQHpkY72tcZTuvMwOXwEC8fCivnN4ClbUGruj5cKx-g,14265984
|
35
|
-
bigdl/cpp/libs/quantize-stats,sha256=YcQ-X5kP8nEPnE0mxZ9Sy1vl_HkjVH_sSiqWJW7YMJc,13780224
|
36
|
-
bigdl/cpp/libs/save-load-state,sha256=xekWUPF-IhoNmgxUXSzKMPfadqLNae7iAh1YPQDT9Bc,14239880
|
37
|
-
bigdl/cpp/libs/server,sha256=KfI2-m5lAUcxYb6KHVZkXIOy4Kk1VnZ8rLneF5MCCNw,15097272
|
38
|
-
bigdl/cpp/libs/speculative,sha256=nCKmu33RQdCwkb5WHaPqfEFvy9RoYnPJHzXi_gLkxT0,14278112
|
39
|
-
bigdl/cpp/libs/tokenize,sha256=m9zbFNldBToN00fuM2lQTq1_THx28-HQdFSftw4VNhM,14239800
|
40
|
-
bigdl_core_cpp-2.5.0b20240818.data/scripts/init-llama-cpp,sha256=qpIwMQc2Vb11fmovXFJKefp5iD1tQMfL8Ma7Y3Ebguk,400
|
41
|
-
bigdl_core_cpp-2.5.0b20240818.data/scripts/init-ollama,sha256=5eg4DsWg87iysFRh7leawr6H47F_sHydwL5we6fUG6o,193
|
42
|
-
bigdl_core_cpp-2.5.0b20240818.dist-info/METADATA,sha256=9ccXui2OMJgXwEzx4fJytb_Gi0CCyiiFp6X81l31G14,643
|
43
|
-
bigdl_core_cpp-2.5.0b20240818.dist-info/WHEEL,sha256=LP9LuSkp9EkkS3GaxGDqD2GVQk9RkMkUIxzcmUzigkU,108
|
44
|
-
bigdl_core_cpp-2.5.0b20240818.dist-info/top_level.txt,sha256=iGuLfZARD_qANcIMfy0tbbrC3EtCg6BSiH8icc3dLWs,6
|
45
|
-
bigdl_core_cpp-2.5.0b20240818.dist-info/RECORD,,
|
{bigdl_core_cpp-2.5.0b20240818.data → bigdl_core_cpp-2.5.0b20240820.data}/scripts/init-llama-cpp
RENAMED
File without changes
|
{bigdl_core_cpp-2.5.0b20240818.data → bigdl_core_cpp-2.5.0b20240820.data}/scripts/init-ollama
RENAMED
File without changes
|
File without changes
|
{bigdl_core_cpp-2.5.0b20240818.dist-info → bigdl_core_cpp-2.5.0b20240820.dist-info}/top_level.txt
RENAMED
File without changes
|