lalamo 0.5.11__tar.gz → 0.5.12__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (110) hide show
  1. {lalamo-0.5.11 → lalamo-0.5.12}/PKG-INFO +1 -1
  2. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/__init__.py +1 -1
  3. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/decoder_configs/huggingface/gemma3.py +1 -1
  4. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/loaders/huggingface.py +2 -2
  5. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo.egg-info/PKG-INFO +1 -1
  6. {lalamo-0.5.11 → lalamo-0.5.12}/tests/test_huggingface_model_conversion.py +2 -0
  7. {lalamo-0.5.11 → lalamo-0.5.12}/LICENSE +0 -0
  8. {lalamo-0.5.11 → lalamo-0.5.12}/README.md +0 -0
  9. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/common.py +0 -0
  10. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/data/__init__.py +0 -0
  11. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/data/huggingface_message.py +0 -0
  12. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/data/lalamo_completions.py +0 -0
  13. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/data/utils.py +0 -0
  14. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/main.py +0 -0
  15. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/message_processor.py +0 -0
  16. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/__init__.py +0 -0
  17. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/common.py +0 -0
  18. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/decoder_configs/__init__.py +0 -0
  19. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/decoder_configs/common.py +0 -0
  20. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/decoder_configs/executorch.py +0 -0
  21. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/decoder_configs/huggingface/__init__.py +0 -0
  22. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/decoder_configs/huggingface/common.py +0 -0
  23. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/decoder_configs/huggingface/gemma2.py +0 -0
  24. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/decoder_configs/huggingface/gpt_oss.py +0 -0
  25. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/decoder_configs/huggingface/lfm2.py +0 -0
  26. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/decoder_configs/huggingface/llama.py +0 -0
  27. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/decoder_configs/huggingface/llamba.py +0 -0
  28. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/decoder_configs/huggingface/mistral.py +0 -0
  29. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/decoder_configs/huggingface/modern_bert.py +0 -0
  30. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/decoder_configs/huggingface/qwen2.py +0 -0
  31. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/decoder_configs/huggingface/qwen3.py +0 -0
  32. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/huggingface_generation_config.py +0 -0
  33. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/huggingface_tokenizer_config.py +0 -0
  34. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/loaders/__init__.py +0 -0
  35. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/loaders/common.py +0 -0
  36. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/loaders/executorch.py +0 -0
  37. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/loaders/utils.py +0 -0
  38. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/model_specs/__init__.py +0 -0
  39. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/model_specs/common.py +0 -0
  40. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/model_specs/deepseek.py +0 -0
  41. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/model_specs/essential_ai.py +0 -0
  42. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/model_specs/gemma.py +0 -0
  43. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/model_specs/gpt_oss.py +0 -0
  44. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/model_specs/huggingface.py +0 -0
  45. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/model_specs/lfm2.py +0 -0
  46. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/model_specs/llama.py +0 -0
  47. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/model_specs/llamba.py +0 -0
  48. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/model_specs/mirai.py +0 -0
  49. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/model_specs/mistral.py +0 -0
  50. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/model_specs/pleias.py +0 -0
  51. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/model_specs/polaris.py +0 -0
  52. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/model_specs/qwen.py +0 -0
  53. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/model_import/model_specs/reka.py +0 -0
  54. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/models/__init__.py +0 -0
  55. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/models/classifier.py +0 -0
  56. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/models/common.py +0 -0
  57. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/models/language_model.py +0 -0
  58. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/__init__.py +0 -0
  59. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/activations.py +0 -0
  60. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/classifier.py +0 -0
  61. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/common.py +0 -0
  62. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/decoder.py +0 -0
  63. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/embedding.py +0 -0
  64. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/linear.py +0 -0
  65. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/mlp.py +0 -0
  66. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/mlx_interop.py +0 -0
  67. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/normalization.py +0 -0
  68. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/rope.py +0 -0
  69. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/token_mixers/__init__.py +0 -0
  70. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/token_mixers/attention.py +0 -0
  71. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/token_mixers/common.py +0 -0
  72. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/token_mixers/mamba.py +0 -0
  73. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/token_mixers/short_conv.py +0 -0
  74. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/token_mixers/state/__init__.py +0 -0
  75. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/token_mixers/state/common.py +0 -0
  76. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/token_mixers/state/kv_cache.py +0 -0
  77. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/token_mixers/state/mamba_state.py +0 -0
  78. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/token_mixers/state/short_conv_state.py +0 -0
  79. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/torch_interop.py +0 -0
  80. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/transformer.py +0 -0
  81. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/transformer_layer.py +0 -0
  82. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/modules/utils.py +0 -0
  83. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/quantization.py +0 -0
  84. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/registry_abc.py +0 -0
  85. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/sampling.py +0 -0
  86. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/speculator/__init__.py +0 -0
  87. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/speculator/common.py +0 -0
  88. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/speculator/estimator.py +0 -0
  89. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/speculator/inference.py +0 -0
  90. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/speculator/ngram.py +0 -0
  91. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/speculator/utils.py +0 -0
  92. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo/utils.py +0 -0
  93. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo.egg-info/SOURCES.txt +0 -0
  94. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo.egg-info/dependency_links.txt +0 -0
  95. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo.egg-info/entry_points.txt +0 -0
  96. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo.egg-info/requires.txt +0 -0
  97. {lalamo-0.5.11 → lalamo-0.5.12}/lalamo.egg-info/top_level.txt +0 -0
  98. {lalamo-0.5.11 → lalamo-0.5.12}/pyproject.toml +0 -0
  99. {lalamo-0.5.11 → lalamo-0.5.12}/setup.cfg +0 -0
  100. {lalamo-0.5.11 → lalamo-0.5.12}/tests/test_cartesia_mlx_models.py +0 -0
  101. {lalamo-0.5.11 → lalamo-0.5.12}/tests/test_chat_template.py +0 -0
  102. {lalamo-0.5.11 → lalamo-0.5.12}/tests/test_generation.py +0 -0
  103. {lalamo-0.5.11 → lalamo-0.5.12}/tests/test_huggingface_models.py +0 -0
  104. {lalamo-0.5.11 → lalamo-0.5.12}/tests/test_lfm2_models.py +0 -0
  105. {lalamo-0.5.11 → lalamo-0.5.12}/tests/test_mlx_models.py +0 -0
  106. {lalamo-0.5.11 → lalamo-0.5.12}/tests/test_model_spec.py +0 -0
  107. {lalamo-0.5.11 → lalamo-0.5.12}/tests/test_models.py +0 -0
  108. {lalamo-0.5.11 → lalamo-0.5.12}/tests/test_moe.py +0 -0
  109. {lalamo-0.5.11 → lalamo-0.5.12}/tests/test_parameter_tree.py +0 -0
  110. {lalamo-0.5.11 → lalamo-0.5.12}/tests/test_registry_abc.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: lalamo
3
- Version: 0.5.11
3
+ Version: 0.5.12
4
4
  Summary: JAX library for optimization and export of models for use with the UZU inference engine.
5
5
  Requires-Python: <4,>=3.12
6
6
  Description-Content-Type: text/markdown
@@ -15,7 +15,7 @@ from lalamo.speculator import (
15
15
  SpeculatorTrainingEvent,
16
16
  )
17
17
 
18
- __version__ = "0.5.11"
18
+ __version__ = "0.5.12"
19
19
 
20
20
  __all__ = [
21
21
  "AssistantMessage",
@@ -46,7 +46,6 @@ class HFGemma3TextConfigRaw:
46
46
  model_type: Literal["gemma3_text"]
47
47
  num_hidden_layers: int
48
48
  sliding_window: int
49
- sliding_window_pattern: int
50
49
  rms_norm_eps: float = 1e-06
51
50
  query_pre_attn_scalar: float = 256.0
52
51
  attention_bias: bool = False
@@ -55,6 +54,7 @@ class HFGemma3TextConfigRaw:
55
54
  attn_logit_softcapping: float | None = None
56
55
  head_dim: int = 256
57
56
  max_position_embeddings: int = 131072
57
+ sliding_window_pattern: int = 6
58
58
  rope_theta: float = 1000000.0
59
59
  rope_local_base_freq: float = 10000.0
60
60
  rope_scaling: GemmaRoPEScalingConfig | YarnRopeScalingConfig | None = None
@@ -350,9 +350,9 @@ def load_attention(
350
350
  weights_dict: Mapping[str, Array],
351
351
  path: ParameterPath,
352
352
  ) -> Attention:
353
- if (path / "o_proj.weight") in weights_dict:
353
+ if (path / "o_proj.weight") in weights_dict or (path / "o_proj.qweight") in weights_dict:
354
354
  o_proj_name = "o_proj"
355
- elif (path / "out_proj.weight") in weights_dict:
355
+ elif (path / "out_proj.weight") in weights_dict or (path / "out_proj.qweight") in weights_dict:
356
356
  o_proj_name = "out_proj"
357
357
  else:
358
358
  raise NotImplementedError("Can't determine attention output projection name")
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: lalamo
3
- Version: 0.5.11
3
+ Version: 0.5.12
4
4
  Summary: JAX library for optimization and export of models for use with the UZU inference engine.
5
5
  Requires-Python: <4,>=3.12
6
6
  Description-Content-Type: text/markdown
@@ -22,8 +22,10 @@ from tests.test_models import DType, ModelTestSpec
22
22
  MODEL_LIST: list[ModelTestSpec] = [
23
23
  ModelTestSpec("trymirai/chat-moderation-router", DType.FLOAT32),
24
24
  ModelTestSpec("Qwen/Qwen3-0.6B", DType.FLOAT32),
25
+ ModelTestSpec("Qwen/Qwen3-4B-AWQ", DType.FLOAT32),
25
26
  ModelTestSpec("Qwen/Qwen2.5-0.5B-Instruct", DType.FLOAT32),
26
27
  ModelTestSpec("google/gemma-3-1b-it", DType.FLOAT32),
28
+ ModelTestSpec("google/gemma-3-4b-it", DType.FLOAT32),
27
29
  ModelTestSpec("deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B", DType.FLOAT32),
28
30
  ModelTestSpec("meta-llama/Llama-3.2-1B-Instruct", DType.FLOAT32),
29
31
  ModelTestSpec("cartesia-ai/Llamba-1B", DType.FLOAT32),
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes