lalamo 0.5.15__tar.gz → 0.5.16__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (110)
  1. {lalamo-0.5.15 → lalamo-0.5.16}/PKG-INFO +1 -1
  2. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/__init__.py +1 -1
  3. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/decoder_configs/huggingface/llama.py +32 -21
  4. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo.egg-info/PKG-INFO +1 -1
  5. {lalamo-0.5.15 → lalamo-0.5.16}/LICENSE +0 -0
  6. {lalamo-0.5.15 → lalamo-0.5.16}/README.md +0 -0
  7. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/common.py +0 -0
  8. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/data/__init__.py +0 -0
  9. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/data/huggingface_message.py +0 -0
  10. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/data/lalamo_completions.py +0 -0
  11. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/data/utils.py +0 -0
  12. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/main.py +0 -0
  13. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/message_processor.py +0 -0
  14. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/__init__.py +0 -0
  15. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/common.py +0 -0
  16. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/decoder_configs/__init__.py +0 -0
  17. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/decoder_configs/common.py +0 -0
  18. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/decoder_configs/executorch.py +0 -0
  19. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/decoder_configs/huggingface/__init__.py +0 -0
  20. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/decoder_configs/huggingface/common.py +0 -0
  21. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/decoder_configs/huggingface/gemma2.py +0 -0
  22. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/decoder_configs/huggingface/gemma3.py +0 -0
  23. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/decoder_configs/huggingface/gpt_oss.py +0 -0
  24. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/decoder_configs/huggingface/lfm2.py +0 -0
  25. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/decoder_configs/huggingface/llamba.py +0 -0
  26. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/decoder_configs/huggingface/mistral.py +0 -0
  27. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/decoder_configs/huggingface/modern_bert.py +0 -0
  28. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/decoder_configs/huggingface/qwen2.py +0 -0
  29. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/decoder_configs/huggingface/qwen3.py +0 -0
  30. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/huggingface_generation_config.py +0 -0
  31. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/huggingface_tokenizer_config.py +0 -0
  32. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/loaders/__init__.py +0 -0
  33. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/loaders/common.py +0 -0
  34. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/loaders/executorch.py +0 -0
  35. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/loaders/huggingface.py +0 -0
  36. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/loaders/utils.py +0 -0
  37. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/model_specs/__init__.py +0 -0
  38. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/model_specs/common.py +0 -0
  39. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/model_specs/deepseek.py +0 -0
  40. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/model_specs/essential_ai.py +0 -0
  41. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/model_specs/gemma.py +0 -0
  42. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/model_specs/gpt_oss.py +0 -0
  43. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/model_specs/huggingface.py +0 -0
  44. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/model_specs/lfm2.py +0 -0
  45. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/model_specs/llama.py +0 -0
  46. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/model_specs/llamba.py +0 -0
  47. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/model_specs/mirai.py +0 -0
  48. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/model_specs/mistral.py +0 -0
  49. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/model_specs/pleias.py +0 -0
  50. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/model_specs/polaris.py +0 -0
  51. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/model_specs/qwen.py +0 -0
  52. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/model_import/model_specs/reka.py +0 -0
  53. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/models/__init__.py +0 -0
  54. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/models/classifier.py +0 -0
  55. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/models/common.py +0 -0
  56. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/models/language_model.py +0 -0
  57. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/__init__.py +0 -0
  58. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/activations.py +0 -0
  59. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/classifier.py +0 -0
  60. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/common.py +0 -0
  61. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/decoder.py +0 -0
  62. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/embedding.py +0 -0
  63. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/linear.py +0 -0
  64. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/mlp.py +0 -0
  65. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/mlx_interop.py +0 -0
  66. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/normalization.py +0 -0
  67. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/rope.py +0 -0
  68. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/token_mixers/__init__.py +0 -0
  69. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/token_mixers/attention.py +0 -0
  70. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/token_mixers/common.py +0 -0
  71. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/token_mixers/mamba.py +0 -0
  72. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/token_mixers/short_conv.py +0 -0
  73. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/token_mixers/state/__init__.py +0 -0
  74. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/token_mixers/state/common.py +0 -0
  75. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/token_mixers/state/kv_cache.py +0 -0
  76. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/token_mixers/state/mamba_state.py +0 -0
  77. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/token_mixers/state/short_conv_state.py +0 -0
  78. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/torch_interop.py +0 -0
  79. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/transformer.py +0 -0
  80. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/transformer_layer.py +0 -0
  81. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/modules/utils.py +0 -0
  82. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/quantization.py +0 -0
  83. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/registry_abc.py +0 -0
  84. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/sampling.py +0 -0
  85. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/speculator/__init__.py +0 -0
  86. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/speculator/common.py +0 -0
  87. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/speculator/estimator.py +0 -0
  88. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/speculator/inference.py +0 -0
  89. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/speculator/ngram.py +0 -0
  90. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/speculator/utils.py +0 -0
  91. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo/utils.py +0 -0
  92. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo.egg-info/SOURCES.txt +0 -0
  93. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo.egg-info/dependency_links.txt +0 -0
  94. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo.egg-info/entry_points.txt +0 -0
  95. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo.egg-info/requires.txt +0 -0
  96. {lalamo-0.5.15 → lalamo-0.5.16}/lalamo.egg-info/top_level.txt +0 -0
  97. {lalamo-0.5.15 → lalamo-0.5.16}/pyproject.toml +0 -0
  98. {lalamo-0.5.15 → lalamo-0.5.16}/setup.cfg +0 -0
  99. {lalamo-0.5.15 → lalamo-0.5.16}/tests/test_cartesia_mlx_models.py +0 -0
  100. {lalamo-0.5.15 → lalamo-0.5.16}/tests/test_chat_template.py +0 -0
  101. {lalamo-0.5.15 → lalamo-0.5.16}/tests/test_generation.py +0 -0
  102. {lalamo-0.5.15 → lalamo-0.5.16}/tests/test_huggingface_model_conversion.py +0 -0
  103. {lalamo-0.5.15 → lalamo-0.5.16}/tests/test_huggingface_models.py +0 -0
  104. {lalamo-0.5.15 → lalamo-0.5.16}/tests/test_lfm2_models.py +0 -0
  105. {lalamo-0.5.15 → lalamo-0.5.16}/tests/test_mlx_models.py +0 -0
  106. {lalamo-0.5.15 → lalamo-0.5.16}/tests/test_model_spec.py +0 -0
  107. {lalamo-0.5.15 → lalamo-0.5.16}/tests/test_models.py +0 -0
  108. {lalamo-0.5.15 → lalamo-0.5.16}/tests/test_moe.py +0 -0
  109. {lalamo-0.5.15 → lalamo-0.5.16}/tests/test_parameter_tree.py +0 -0
  110. {lalamo-0.5.15 → lalamo-0.5.16}/tests/test_registry_abc.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: lalamo
3
- Version: 0.5.15
3
+ Version: 0.5.16
4
4
  Summary: JAX library for optimization and export of models for use with the UZU inference engine.
5
5
  Requires-Python: <4,>=3.12
6
6
  Description-Content-Type: text/markdown
@@ -15,7 +15,7 @@ from lalamo.speculator import (
15
15
  SpeculatorTrainingEvent,
16
16
  )
17
17
 
18
- __version__ = "0.5.15"
18
+ __version__ = "0.5.16"
19
19
 
20
20
  __all__ = [
21
21
  "AssistantMessage",
@@ -13,6 +13,7 @@ from lalamo.modules import (
13
13
  LlamaRoPEConfig,
14
14
  MLXQuantizedLinearConfig,
15
15
  MLXQuantizedTiedEmbeddingConfig,
16
+ MLXQuantizedUntiedEmbeddingConfig,
16
17
  NormalizationConfig,
17
18
  SiLU,
18
19
  TiedEmbeddingConfig,
@@ -89,27 +90,37 @@ class HFLlamaConfig(HuggingFaceLMConfig):
89
90
  ) -> DecoderConfig:
90
91
  quantization = self.quantization or self.quantization_config
91
92
  if isinstance(quantization, MLXQuantizationConfig):
92
- assert self.tie_word_embeddings, "only tied embeddings are supported"
93
- embedding_config = MLXQuantizedTiedEmbeddingConfig(
94
- input_scale=None,
95
- logit_soft_cap=None,
96
- group_size=quantization.group_size,
97
- embedding_quantization_mode=QuantizationMode.from_num_bits(quantization.bits),
98
- activation_quantization_mode=None,
99
- activation_precision=activation_precision,
100
- )
101
- elif self.tie_word_embeddings:
102
- embedding_config = TiedEmbeddingConfig(
103
- input_scale=None,
104
- logit_soft_cap=None,
105
- precision=activation_precision,
106
- )
107
- else:
108
- embedding_config = UntiedEmbeddingConfig(
109
- input_scale=None,
110
- logit_soft_cap=None,
111
- precision=activation_precision,
112
- )
93
+ if self.tie_word_embeddings:
94
+ embedding_config = MLXQuantizedTiedEmbeddingConfig(
95
+ input_scale=None,
96
+ logit_soft_cap=None,
97
+ group_size=quantization.group_size,
98
+ embedding_quantization_mode=QuantizationMode.from_num_bits(quantization.bits),
99
+ activation_quantization_mode=None,
100
+ activation_precision=activation_precision,
101
+ )
102
+ else:
103
+ embedding_config = MLXQuantizedUntiedEmbeddingConfig(
104
+ input_scale=None,
105
+ logit_soft_cap=None,
106
+ group_size=quantization.group_size,
107
+ embedding_quantization_mode=QuantizationMode.from_num_bits(quantization.bits),
108
+ activation_quantization_mode=None,
109
+ activation_precision=activation_precision,
110
+ )
111
+ else: # noqa: PLR5501
112
+ if self.tie_word_embeddings:
113
+ embedding_config = TiedEmbeddingConfig(
114
+ input_scale=None,
115
+ logit_soft_cap=None,
116
+ precision=activation_precision,
117
+ )
118
+ else:
119
+ embedding_config = UntiedEmbeddingConfig(
120
+ input_scale=None,
121
+ logit_soft_cap=None,
122
+ precision=activation_precision,
123
+ )
113
124
  if self.rope_scaling is None:
114
125
  rope_config = UnscaledRoPEConfig(
115
126
  precision=activation_precision,
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: lalamo
3
- Version: 0.5.15
3
+ Version: 0.5.16
4
4
  Summary: JAX library for optimization and export of models for use with the UZU inference engine.
5
5
  Requires-Python: <4,>=3.12
6
6
  Description-Content-Type: text/markdown
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes