lalamo 0.5.11__py3-none-any.whl → 0.5.12__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
lalamo/__init__.py CHANGED
@@ -15,7 +15,7 @@ from lalamo.speculator import (
15
15
  SpeculatorTrainingEvent,
16
16
  )
17
17
 
18
- __version__ = "0.5.11"
18
+ __version__ = "0.5.12"
19
19
 
20
20
  __all__ = [
21
21
  "AssistantMessage",
@@ -46,7 +46,6 @@ class HFGemma3TextConfigRaw:
46
46
  model_type: Literal["gemma3_text"]
47
47
  num_hidden_layers: int
48
48
  sliding_window: int
49
- sliding_window_pattern: int
50
49
  rms_norm_eps: float = 1e-06
51
50
  query_pre_attn_scalar: float = 256.0
52
51
  attention_bias: bool = False
@@ -55,6 +54,7 @@ class HFGemma3TextConfigRaw:
55
54
  attn_logit_softcapping: float | None = None
56
55
  head_dim: int = 256
57
56
  max_position_embeddings: int = 131072
57
+ sliding_window_pattern: int = 6
58
58
  rope_theta: float = 1000000.0
59
59
  rope_local_base_freq: float = 10000.0
60
60
  rope_scaling: GemmaRoPEScalingConfig | YarnRopeScalingConfig | None = None
@@ -350,9 +350,9 @@ def load_attention(
350
350
  weights_dict: Mapping[str, Array],
351
351
  path: ParameterPath,
352
352
  ) -> Attention:
353
- if (path / "o_proj.weight") in weights_dict:
353
+ if (path / "o_proj.weight") in weights_dict or (path / "o_proj.qweight") in weights_dict:
354
354
  o_proj_name = "o_proj"
355
- elif (path / "out_proj.weight") in weights_dict:
355
+ elif (path / "out_proj.weight") in weights_dict or (path / "out_proj.qweight") in weights_dict:
356
356
  o_proj_name = "out_proj"
357
357
  else:
358
358
  raise NotImplementedError("Can't determine attention output projection name")
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: lalamo
3
- Version: 0.5.11
3
+ Version: 0.5.12
4
4
  Summary: JAX library for optimization and export of models for use with the UZU inference engine.
5
5
  Requires-Python: <4,>=3.12
6
6
  Description-Content-Type: text/markdown
@@ -1,4 +1,4 @@
1
- lalamo/__init__.py,sha256=YYirmrwul4QLFCnBJpYyq8Os5sFQNn-9OxTjd0CbSd8,815
1
+ lalamo/__init__.py,sha256=Q9W7Wur0iL4StzN99Y70CLGeiCHriTxjg50OLzXIDLw,815
2
2
  lalamo/common.py,sha256=5NUFD26yQgOnEEk3LaQnce8n-VwJxILkEpFesHZhtQU,3820
3
3
  lalamo/main.py,sha256=GgUT7lT48-XQuAEH7qzsDKG8Lx9iBf-sYBIRhZL9q7E,23978
4
4
  lalamo/message_processor.py,sha256=bSUAQg7CemLTnBV4LtPxJBicAalruDCA-JXjkTYPZ8U,5797
@@ -20,7 +20,7 @@ lalamo/model_import/decoder_configs/executorch.py,sha256=fTEG_j-7d8riR3Fu_H5tHDj
20
20
  lalamo/model_import/decoder_configs/huggingface/__init__.py,sha256=AboZJgZxOuIigPShskj-FqBkBqwlJZoKHP0RDqx-MyY,696
21
21
  lalamo/model_import/decoder_configs/huggingface/common.py,sha256=YYIDEQy8x7lqL2qtxUHrNqfjZEiizBZ_26sTqOzjRtQ,3792
22
22
  lalamo/model_import/decoder_configs/huggingface/gemma2.py,sha256=g8LH_GlSNyL04WWi596zI0rWsD3ahnfNjDk-9zZNcDE,4759
23
- lalamo/model_import/decoder_configs/huggingface/gemma3.py,sha256=aSZ0TtpgDYA10rHi8eD0C_Jsn48siM_HXqfZ4O7nh94,8372
23
+ lalamo/model_import/decoder_configs/huggingface/gemma3.py,sha256=EYkcsRUKVQqPFyL8dZuocDVAUaM8d9dr_aMh5-jTvTM,8376
24
24
  lalamo/model_import/decoder_configs/huggingface/gpt_oss.py,sha256=MBCoPbuWyzbJiBRtHOtpaPHJjQ1UVCAYcVrfIejTnlQ,7446
25
25
  lalamo/model_import/decoder_configs/huggingface/lfm2.py,sha256=vrBMxtiKEg0eHNDL_bWM9odlrsab7jlMXEY8vjEB7-c,7595
26
26
  lalamo/model_import/decoder_configs/huggingface/llama.py,sha256=UPeQiz2Dix8YaZYRxn9z44OZJ6c4xBQmcUZcM0Ymvh4,6934
@@ -32,7 +32,7 @@ lalamo/model_import/decoder_configs/huggingface/qwen3.py,sha256=lySVO-TvusAYUjDn
32
32
  lalamo/model_import/loaders/__init__.py,sha256=3THc1wQ4EPBzQkL_4EaKCa7Ev5Z7oczcvc4AHy9v5EI,228
33
33
  lalamo/model_import/loaders/common.py,sha256=kkugV-bMQlN1zvGHoj3uc7z0FbXKoMtXEBTvyu4KxK4,1844
34
34
  lalamo/model_import/loaders/executorch.py,sha256=t2Ey_mBMNC8bTSTdYWjuGXdPTRoohFlYrqtWyNkBU_8,9219
35
- lalamo/model_import/loaders/huggingface.py,sha256=_vFAgz6ZR8386VIuhWAY88nJ8qoTDawCREBsRHQQmGo,32753
35
+ lalamo/model_import/loaders/huggingface.py,sha256=nGaJDAB-2uK5z7XNYEpVDZcAoAZF-w3zs6xWOK7nzac,32845
36
36
  lalamo/model_import/loaders/utils.py,sha256=eiX3WKFRrAfBY-dugodscNInl5o5w3KmVcgma4atpGY,2456
37
37
  lalamo/model_import/model_specs/__init__.py,sha256=JISqwJkloQkGD2jvi1MakNEWapIwlNXXVi5giZyXB74,1275
38
38
  lalamo/model_import/model_specs/common.py,sha256=RLySCIkmGiA1IVZgLeemssMBMo4hMYMpmBjV0cRwBb4,6586
@@ -85,9 +85,9 @@ lalamo/speculator/estimator.py,sha256=4D8dPZCWsrpORb7y8pQ6VsiIg1Cblvvxe6gXCoYtcD
85
85
  lalamo/speculator/inference.py,sha256=5GntUgj0HQLeLn3HIHnVX8EEO0EBzmKeP5-_U7kdFAM,3670
86
86
  lalamo/speculator/ngram.py,sha256=95mdfAWhx4d5XOnOwhyhElnvcy6nlUjYhcbJzqDs414,5875
87
87
  lalamo/speculator/utils.py,sha256=0wZoMMIzzk0Q-3zq5H5f-JBplePNHxywndkrNtOJOyo,1697
88
- lalamo-0.5.11.dist-info/licenses/LICENSE,sha256=diHRfjSEJHD1nnEeMIfMRCjR3UERf8bT3eseD6b1ayA,1072
89
- lalamo-0.5.11.dist-info/METADATA,sha256=0uICfw4NXxiDgA8JIPaYiUnOlFcGxYe7NKbNP2ZejHE,3147
90
- lalamo-0.5.11.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
91
- lalamo-0.5.11.dist-info/entry_points.txt,sha256=qli7qTfnBk5WP10rOGXXEckHMtt-atJMDWd8jN89Uks,43
92
- lalamo-0.5.11.dist-info/top_level.txt,sha256=VHvWL5JN5XRG36NsN_MieJ7EwRihEOrEjyDaTdFJ-aI,7
93
- lalamo-0.5.11.dist-info/RECORD,,
88
+ lalamo-0.5.12.dist-info/licenses/LICENSE,sha256=diHRfjSEJHD1nnEeMIfMRCjR3UERf8bT3eseD6b1ayA,1072
89
+ lalamo-0.5.12.dist-info/METADATA,sha256=dRj887UMuZ5JBHgriCILQxCKklC-ZNyAcsOLAwbbyrU,3147
90
+ lalamo-0.5.12.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
91
+ lalamo-0.5.12.dist-info/entry_points.txt,sha256=qli7qTfnBk5WP10rOGXXEckHMtt-atJMDWd8jN89Uks,43
92
+ lalamo-0.5.12.dist-info/top_level.txt,sha256=VHvWL5JN5XRG36NsN_MieJ7EwRihEOrEjyDaTdFJ-aI,7
93
+ lalamo-0.5.12.dist-info/RECORD,,