aimnet 0.0.1__py3-none-any.whl → 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
aimnet/models/base.py CHANGED
@@ -1,12 +1,151 @@
1
- from typing import ClassVar, Dict, Final
1
+ from __future__ import annotations
2
+
3
+ import contextlib
4
+ import warnings
5
+ from typing import ClassVar, Final, NotRequired, TypedDict
2
6
 
3
7
  import torch
4
8
  from torch import Tensor, nn
5
9
 
6
10
  from aimnet import nbops
11
+ from aimnet.config import build_module
12
+ from aimnet.models.utils import (
13
+ extract_d3_params,
14
+ extract_species,
15
+ has_externalizable_dftd3,
16
+ validate_state_dict_keys,
17
+ )
18
+
19
+
20
+ class ModelMetadata(TypedDict):
21
+ """Metadata returned by load_model().
22
+
23
+ This TypedDict documents the structure of the metadata dictionary.
24
+ """
25
+
26
+ format_version: int # 1 = legacy .jpt, 2 = new .pt
27
+ cutoff: float # Model cutoff radius
28
+
29
+ # Action flags - what calculator should add externally
30
+ needs_coulomb: bool # Add external Coulomb?
31
+ needs_dispersion: bool # Add external DFTD3?
32
+
33
+ # Coulomb mode descriptor - what's in the model
34
+ # "sr_embedded": Model has SRCoulomb, add FULL externally
35
+ # "full_embedded": Full Coulomb in model (legacy JIT)
36
+ # "none": No Coulomb anywhere
37
+ coulomb_mode: str
38
+ coulomb_sr_rc: NotRequired[float | None] # Only if coulomb_mode="sr_embedded"
39
+ coulomb_sr_envelope: NotRequired[str | None] # "exp" | "cosine", only if sr_embedded
40
+
41
+ # Dispersion parameters (optional)
42
+ d3_params: NotRequired[dict | None] # {s8, a1, a2, s6} if needs_dispersion=True
43
+
44
+ implemented_species: list[int] # Supported atomic numbers
45
+
46
+
47
+ def load_model(path: str, device: str = "cpu") -> tuple[nn.Module, ModelMetadata]:
48
+ """Load model from file, supporting both new and legacy formats.
49
+
50
+ Automatically detects format:
51
+ - New format: state dict with embedded YAML config and metadata
52
+ - Legacy format: JIT-compiled TorchScript model
53
+
54
+ Parameters
55
+ ----------
56
+ path : str
57
+ Path to the model file (.pt or .jpt).
58
+ device : str
59
+ Device to load the model on. Default is "cpu".
60
+
61
+ Returns
62
+ -------
63
+ model : nn.Module
64
+ The loaded model with weights.
65
+ metadata : ModelMetadata
66
+ Dictionary containing model metadata. See ModelMetadata TypedDict for fields.
67
+
68
+ Notes
69
+ -----
70
+ For legacy JIT models (format_version=1), `needs_coulomb` and `needs_dispersion`
71
+ are False because LR modules are already embedded in the TorchScript model.
72
+ """
73
+ import yaml
74
+
75
+ # torch.load auto-detects TorchScript and dispatches to torch.jit.load
76
+ with warnings.catch_warnings():
77
+ warnings.filterwarnings("ignore", ".*looks like a TorchScript archive.*")
78
+ data = torch.load(path, map_location=device, weights_only=False)
79
+
80
+ # Check result type to determine format
81
+ if isinstance(data, dict) and "model_yaml" in data:
82
+ # New state dict format
83
+ model_config = yaml.safe_load(data["model_yaml"])
84
+ model = build_module(model_config)
85
+
86
+ # Use strict=False because modules may differ between formats
87
+ load_result = model.load_state_dict(data["state_dict"], strict=False)
88
+
89
+ # Check for unexpected missing/extra keys
90
+ real_missing, real_unexpected = validate_state_dict_keys(load_result.missing_keys, load_result.unexpected_keys)
91
+ if real_missing or real_unexpected:
92
+ msg_parts = []
93
+ if real_missing:
94
+ msg_parts.append(f"Missing keys: {real_missing}")
95
+ if real_unexpected:
96
+ msg_parts.append(f"Unexpected keys: {real_unexpected}")
97
+ warnings.warn(f"State dict mismatch during model loading. {'; '.join(msg_parts)}", stacklevel=2)
98
+
99
+ model = model.to(device)
100
+
101
+ # Preserve float64 precision for atomic shifts (SAE values) after device transfer
102
+ if hasattr(model, "outputs") and hasattr(model.outputs, "atomic_shift"):
103
+ model.outputs.atomic_shift.shifts = model.outputs.atomic_shift.shifts.double()
104
+
105
+ metadata: ModelMetadata = {
106
+ "format_version": data.get("format_version", 2), # Default 2 for early v2 files without version
107
+ "cutoff": data["cutoff"],
108
+ "needs_coulomb": data.get("needs_coulomb", False),
109
+ "needs_dispersion": data.get("needs_dispersion", False),
110
+ "coulomb_mode": data.get("coulomb_mode", "none"),
111
+ "coulomb_sr_rc": data.get("coulomb_sr_rc"),
112
+ "coulomb_sr_envelope": data.get("coulomb_sr_envelope"),
113
+ "d3_params": data.get("d3_params"),
114
+ "has_embedded_lr": data.get("has_embedded_lr", False),
115
+ "implemented_species": data.get("implemented_species", []),
116
+ }
7
117
 
118
+ # Attach metadata to model for easy access
119
+ model._metadata = metadata
8
120
 
9
- class AIMNet2Base(nn.Module): # pylint: disable=abstract-method
121
+ return model, metadata
122
+
123
+ elif isinstance(data, torch.jit.ScriptModule):
124
+ # Legacy JIT format - LR modules are already embedded in the TorchScript model
125
+ model = data
126
+ metadata: ModelMetadata = {
127
+ "format_version": 1, # Legacy .jpt format is v1
128
+ "cutoff": float(model.cutoff),
129
+ # Legacy models have LR modules embedded - don't add external ones
130
+ "needs_coulomb": False,
131
+ "needs_dispersion": False,
132
+ "coulomb_mode": "full_embedded",
133
+ # No coulomb_sr_rc/envelope for legacy (full Coulomb is embedded)
134
+ "d3_params": extract_d3_params(model) if has_externalizable_dftd3(model) else None,
135
+ "implemented_species": extract_species(model),
136
+ }
137
+
138
+ # Attempt metadata assignment; silently fails for JIT models
139
+ with contextlib.suppress(AttributeError, RuntimeError):
140
+ model._metadata = metadata # type: ignore[attr-defined]
141
+
142
+ return model, metadata
143
+
144
+ else:
145
+ raise ValueError(f"Unknown model format: {type(data)}")
146
+
147
+
148
+ class AIMNet2Base(nn.Module):
10
149
  """Base class for AIMNet2 models. Implements pre-processing data:
11
150
  converting to right dtype and device, setting nb mode, calculating masks.
12
151
  """
@@ -15,32 +154,61 @@ class AIMNet2Base(nn.Module): # pylint: disable=abstract-method
    # Keys that every input dict must contain, and the dtype each is cast to.
    # NOTE: __default_dtype is a name-mangled class attribute defined just
    # above this span (outside the visible hunk) — presumably the model's
    # working float dtype; confirm against the full file.
    _required_keys: Final = ["coord", "numbers", "charge"]
    _required_keys_dtype: Final = [__default_dtype, torch.int64, __default_dtype]
    # Optional input keys; positionally paired with _optional_keys_dtype below.
    _optional_keys: Final = [
        "mult",
        "nbmat",
        "nbmat_lr",
        "mol_idx",
        "shifts",
        "shifts_lr",
        "cell",
        "nbmat_dftd3",
        "shifts_dftd3",
        "cutoff_dftd3",
        "nbmat_coulomb",
        "shifts_coulomb",
        "cutoff_coulomb",
    ]
    _optional_keys_dtype: Final = [
        __default_dtype,  # mult
        torch.int64,  # nbmat
        torch.int64,  # nbmat_lr
        torch.int64,  # mol_idx
        __default_dtype,  # shifts
        __default_dtype,  # shifts_lr
        __default_dtype,  # cell
        torch.int64,  # nbmat_dftd3
        __default_dtype,  # shifts_dftd3
        __default_dtype,  # cutoff_dftd3
        torch.int64,  # nbmat_coulomb
        __default_dtype,  # shifts_coulomb
        __default_dtype,  # cutoff_coulomb
    ]
    # Mark the key tables as TorchScript compile-time constants.
    __constants__: ClassVar = ["_required_keys", "_required_keys_dtype", "_optional_keys", "_optional_keys_dtype"]
    # TypedDict not supported in TorchScript; exclude from serialization
    __jit_unused_properties__: ClassVar = ["metadata"]
29
190
 
30
191
  def __init__(self):
31
192
  super().__init__()
193
+ # Use object.__setattr__ to avoid TorchScript tracing this attribute
194
+ object.__setattr__(self, "_metadata", None)
195
+
196
+ @property
197
+ def metadata(self) -> ModelMetadata | None:
198
+ """Return model metadata if available."""
199
+ return getattr(self, "_metadata", None)
32
200
 
33
- def _prepare_dtype(self, data: Dict[str, Tensor]) -> Dict[str, Tensor]:
34
- for k, d in zip(self._required_keys, self._required_keys_dtype):
201
+ def _prepare_dtype(self, data: dict[str, Tensor]) -> dict[str, Tensor]:
202
+ for k, d in zip(self._required_keys, self._required_keys_dtype, strict=False):
35
203
  assert k in data, f"Key {k} is required"
36
204
  data[k] = data[k].to(d)
37
- for k, d in zip(self._optional_keys, self._optional_keys_dtype):
205
+ for k, d in zip(self._optional_keys, self._optional_keys_dtype, strict=False):
38
206
  if k in data:
39
207
  data[k] = data[k].to(d)
40
208
  return data
41
209
 
42
- def prepare_input(self, data: Dict[str, Tensor]) -> Dict[str, Tensor]:
43
- """Some sommon operations"""
210
+ def prepare_input(self, data: dict[str, Tensor]) -> dict[str, Tensor]:
211
+ """Common operations for input preparation."""
44
212
  data = self._prepare_dtype(data)
45
213
  data = nbops.set_nb_mode(data)
46
214
  data = nbops.calc_masks(data)
@@ -0,0 +1,30 @@
1
+ """Convert legacy JIT-compiled models to new state dict format.
2
+
3
+ This module provides CLI interface for converting legacy .jpt TorchScript
4
+ models to the new .pt format with metadata.
5
+
6
+ For programmatic use, import load_v1_model from aimnet.models.utils:
7
+ from aimnet.models.utils import load_v1_model
8
+ model, metadata = load_v1_model("model.jpt", "config.yaml", "model_new.pt")
9
+ """
10
+
11
+ import click
12
+
13
+ from aimnet.models.utils import load_v1_model
14
+
15
+
16
+ @click.command()
17
+ @click.argument("jpt", type=click.Path(exists=True))
18
+ @click.argument("yaml_config", type=click.Path(exists=True))
19
+ @click.argument("output", type=str)
20
+ def convert_legacy_jpt(jpt: str, yaml_config: str, output: str):
21
+ """Convert legacy JIT model to new state dict format.
22
+
23
+ JPT: Path to the input JIT-compiled model file.
24
+ YAML_CONFIG: Path to the model YAML configuration file.
25
+ OUTPUT: Path to the output .pt file.
26
+
27
+ Example:
28
+ aimnet convert model.jpt config.yaml model_new.pt
29
+ """
30
+ load_v1_model(jpt, yaml_config, output)