lalamo 0.2.2__tar.gz → 0.2.3__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {lalamo-0.2.2 → lalamo-0.2.3}/PKG-INFO +1 -1
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/__init__.py +1 -1
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/configs/__init__.py +3 -2
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/configs/executorch.py +1 -1
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/loaders/__init__.py +2 -2
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/model_specs/llama.py +29 -30
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo.egg-info/PKG-INFO +1 -1
- {lalamo-0.2.2 → lalamo-0.2.3}/LICENSE +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/README.md +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/common.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/language_model.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/main.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/__init__.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/common.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/configs/common.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/configs/huggingface/__init__.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/configs/huggingface/common.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/configs/huggingface/gemma2.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/configs/huggingface/gemma3.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/configs/huggingface/llama.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/configs/huggingface/mistral.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/configs/huggingface/qwen2.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/configs/huggingface/qwen3.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/loaders/common.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/loaders/executorch.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/loaders/huggingface.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/model_specs/__init__.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/model_specs/common.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/model_specs/deepseek.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/model_specs/gemma.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/model_specs/huggingface.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/model_specs/mistral.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/model_specs/pleias.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/model_specs/polaris.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/model_specs/qwen.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/model_import/model_specs/reka.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/modules/__init__.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/modules/activations.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/modules/attention.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/modules/common.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/modules/decoder.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/modules/decoder_layer.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/modules/embedding.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/modules/kv_cache.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/modules/linear.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/modules/mlp.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/modules/normalization.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/modules/rope.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/modules/utils.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/quantization.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo/utils.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo.egg-info/SOURCES.txt +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo.egg-info/dependency_links.txt +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo.egg-info/entry_points.txt +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo.egg-info/requires.txt +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/lalamo.egg-info/top_level.txt +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/pyproject.toml +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/setup.cfg +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/tests/test_generation.py +0 -0
- {lalamo-0.2.2 → lalamo-0.2.3}/tests/test_huggingface_models.py +0 -0
|
@@ -1,5 +1,6 @@
|
|
|
1
1
|
from .common import ForeignConfig
|
|
2
|
-
|
|
2
|
+
|
|
3
|
+
# from .executorch import ETLlamaConfig
|
|
3
4
|
from .huggingface import (
|
|
4
5
|
HFGemma2Config,
|
|
5
6
|
HFGemma3Config,
|
|
@@ -11,7 +12,7 @@ from .huggingface import (
|
|
|
11
12
|
)
|
|
12
13
|
|
|
13
14
|
__all__ = [
|
|
14
|
-
"ETLlamaConfig",
|
|
15
|
+
# "ETLlamaConfig",
|
|
15
16
|
"ForeignConfig",
|
|
16
17
|
"HFGemma2Config",
|
|
17
18
|
"HFGemma3Config",
|
|
@@ -3,7 +3,7 @@ from dataclasses import dataclass
|
|
|
3
3
|
import jax.numpy as jnp
|
|
4
4
|
from jaxtyping import Array, DTypeLike
|
|
5
5
|
|
|
6
|
-
from lalamo.model_import.loaders import load_executorch
|
|
6
|
+
from lalamo.model_import.loaders.executorch import load_executorch
|
|
7
7
|
from lalamo.modules import (
|
|
8
8
|
Activation,
|
|
9
9
|
AttentionConfig,
|
|
@@ -1,7 +1,6 @@
|
|
|
1
1
|
from dataclasses import replace
|
|
2
2
|
|
|
3
|
-
from lalamo.model_import.configs import ETLlamaConfig, HFLlamaConfig
|
|
4
|
-
from lalamo.quantization import QuantizationMode
|
|
3
|
+
from lalamo.model_import.configs import HFLlamaConfig
|
|
5
4
|
|
|
6
5
|
from .common import (
|
|
7
6
|
HUGGINFACE_GENERATION_CONFIG_FILE,
|
|
@@ -54,20 +53,20 @@ LLAMA32 = [
|
|
|
54
53
|
tokenizer_files=(*HUGGINGFACE_TOKENIZER_FILES, HUGGINFACE_GENERATION_CONFIG_FILE),
|
|
55
54
|
use_cases=tuple(),
|
|
56
55
|
),
|
|
57
|
-
ModelSpec(
|
|
58
|
-
|
|
59
|
-
|
|
60
|
-
|
|
61
|
-
|
|
62
|
-
|
|
63
|
-
|
|
64
|
-
|
|
65
|
-
|
|
66
|
-
|
|
67
|
-
|
|
68
|
-
|
|
69
|
-
|
|
70
|
-
),
|
|
56
|
+
# ModelSpec(
|
|
57
|
+
# vendor="Meta",
|
|
58
|
+
# family="Llama-3.2",
|
|
59
|
+
# name="Llama-3.2-1B-Instruct-QLoRA",
|
|
60
|
+
# size="1B",
|
|
61
|
+
# quantization=QuantizationMode.UINT4,
|
|
62
|
+
# repo="meta-llama/Llama-3.2-1B-Instruct-QLORA_INT4_EO8",
|
|
63
|
+
# config_type=ETLlamaConfig,
|
|
64
|
+
# config_file_name="params.json",
|
|
65
|
+
# weights_file_names=("consolidated.00.pth",),
|
|
66
|
+
# weights_type=WeightsType.TORCH,
|
|
67
|
+
# tokenizer_files=_tokenizer_files_from_another_repo("meta-llama/Llama-3.2-1B-Instruct"),
|
|
68
|
+
# use_cases=tuple(),
|
|
69
|
+
# ),
|
|
71
70
|
ModelSpec(
|
|
72
71
|
vendor="Meta",
|
|
73
72
|
family="Llama-3.2",
|
|
@@ -82,20 +81,20 @@ LLAMA32 = [
|
|
|
82
81
|
tokenizer_files=(*HUGGINGFACE_TOKENIZER_FILES, HUGGINFACE_GENERATION_CONFIG_FILE),
|
|
83
82
|
use_cases=tuple(),
|
|
84
83
|
),
|
|
85
|
-
ModelSpec(
|
|
86
|
-
|
|
87
|
-
|
|
88
|
-
|
|
89
|
-
|
|
90
|
-
|
|
91
|
-
|
|
92
|
-
|
|
93
|
-
|
|
94
|
-
|
|
95
|
-
|
|
96
|
-
|
|
97
|
-
|
|
98
|
-
),
|
|
84
|
+
# ModelSpec(
|
|
85
|
+
# vendor="Meta",
|
|
86
|
+
# family="Llama-3.2",
|
|
87
|
+
# name="Llama-3.2-3B-Instruct-QLoRA",
|
|
88
|
+
# size="3B",
|
|
89
|
+
# quantization=QuantizationMode.UINT4,
|
|
90
|
+
# repo="meta-llama/Llama-3.2-3B-Instruct-QLORA_INT4_EO8",
|
|
91
|
+
# config_type=ETLlamaConfig,
|
|
92
|
+
# config_file_name="params.json",
|
|
93
|
+
# weights_file_names=("consolidated.00.pth",),
|
|
94
|
+
# tokenizer_files=_tokenizer_files_from_another_repo("meta-llama/Llama-3.2-3B-Instruct"),
|
|
95
|
+
# weights_type=WeightsType.TORCH,
|
|
96
|
+
# use_cases=tuple(),
|
|
97
|
+
# ),
|
|
99
98
|
]
|
|
100
99
|
|
|
101
100
|
LLAMA_MODELS = LLAMA31 + LLAMA32
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|