aimnet-0.0.1-py3-none-any.whl → aimnet-0.1.0-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- aimnet/__init__.py +7 -0
- aimnet/base.py +24 -8
- aimnet/calculators/__init__.py +4 -4
- aimnet/calculators/aimnet2ase.py +19 -6
- aimnet/calculators/calculator.py +868 -108
- aimnet/calculators/model_registry.py +2 -5
- aimnet/calculators/model_registry.yaml +55 -17
- aimnet/cli.py +62 -6
- aimnet/config.py +8 -9
- aimnet/data/sgdataset.py +23 -22
- aimnet/kernels/__init__.py +66 -0
- aimnet/kernels/conv_sv_2d_sp_wp.py +478 -0
- aimnet/models/__init__.py +13 -1
- aimnet/models/aimnet2.py +19 -22
- aimnet/models/base.py +183 -15
- aimnet/models/convert.py +30 -0
- aimnet/models/utils.py +735 -0
- aimnet/modules/__init__.py +1 -1
- aimnet/modules/aev.py +49 -48
- aimnet/modules/core.py +14 -13
- aimnet/modules/lr.py +520 -115
- aimnet/modules/ops.py +537 -0
- aimnet/nbops.py +105 -15
- aimnet/ops.py +90 -18
- aimnet/train/export_model.py +226 -0
- aimnet/train/loss.py +7 -7
- aimnet/train/metrics.py +5 -6
- aimnet/train/train.py +4 -1
- aimnet/train/utils.py +42 -13
- aimnet-0.1.0.dist-info/METADATA +308 -0
- aimnet-0.1.0.dist-info/RECORD +43 -0
- {aimnet-0.0.1.dist-info → aimnet-0.1.0.dist-info}/WHEEL +1 -1
- aimnet-0.1.0.dist-info/entry_points.txt +3 -0
- aimnet/calculators/nb_kernel_cpu.py +0 -222
- aimnet/calculators/nb_kernel_cuda.py +0 -217
- aimnet/calculators/nbmat.py +0 -220
- aimnet/train/pt2jpt.py +0 -81
- aimnet-0.0.1.dist-info/METADATA +0 -78
- aimnet-0.0.1.dist-info/RECORD +0 -41
- aimnet-0.0.1.dist-info/entry_points.txt +0 -5
- {aimnet-0.0.1.dist-info → aimnet-0.1.0.dist-info/licenses}/LICENSE +0 -0
aimnet/kernels/conv_sv_2d_sp_wp.py
ADDED
@@ -0,0 +1,478 @@
+# SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: MIT
+#
+# Permission is hereby granted, free of charge, to any person obtaining a
+# copy of this software and associated documentation files (the "Software"),
+# to deal in the Software without restriction, including without limitation
+# the rights to use, copy, modify, merge, publish, distribute, sublicense,
+# and/or sell copies of the Software, and to permit persons to whom the
+# Software is furnished to do so, subject to the following conditions:
+#
+# The above copyright notice and this permission notice shall be included in
+# all copies or substantial portions of the Software.
+#
+# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
+# THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+# FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+# DEALINGS IN THE SOFTWARE.
+
+# type: ignore
+
+import torch
+import warp as wp
+from torch import Tensor
+
+wp.init()
+
+
+def _get_stream(device: torch.device):
+    """Get the Warp stream for the given device."""
+    if device.type == "cuda":
+        return wp.stream_from_torch(torch.cuda.current_stream(device))
+    return None
+
+
+# =============================================================================
+# Warp Kernels
+# =============================================================================
+
+
+@wp.kernel(enable_backward=False)
+def _conv_sv_2d_sp_kernel(
+    a: wp.array3d(dtype=wp.float32),  # (B, A, G)
+    idx: wp.array2d(dtype=wp.int32),  # (B, M)
+    g: wp.array3d(dtype=wp.vec4f),  # (B, M, G, D)
+    output: wp.array3d(dtype=wp.vec4f),  # (B, A, G, D)
+):
+    """Forward: output[b,a,g] = sum_m a[idx[b,m],a,g] * g[b,m,g]"""
+    B, M = idx.shape[0], idx.shape[1]
+    padding_value = B - 1  # last row is padding
+
+    _b, _a, _g = wp.tid()
+
+    acc = wp.vec4f()
+    for _m in range(M):
+        _idx = idx[_b, _m]
+        if _idx >= padding_value:
+            break
+        a_val = a[_idx, _a, _g]
+        g_val = g[_b, _m, _g]
+        acc += a_val * g_val
+    output[_b, _a, _g] = acc
+
+
+@wp.kernel(enable_backward=False)
+def _conv_sv_2d_sp_backward_a_kernel(
+    grad_output: wp.array3d(dtype=wp.vec4f),  # (B, A, G, D)
+    idx: wp.array2d(dtype=wp.int32),  # (B, M)
+    g: wp.array3d(dtype=wp.vec4f),  # (B, M, G, D)
+    grad_a: wp.array3d(dtype=wp.float32),  # (B, A, G)
+):
+    """Backward w.r.t. a: grad_a[idx[b,m],a,g] += dot(grad_output[b,a,g], g[b,m,g])"""
+    B, M = idx.shape[0], idx.shape[1]
+    padding_value = B - 1  # last row is padding
+
+    _b, _a, _g = wp.tid()
+
+    grad_out = grad_output[_b, _a, _g]
+    for _m in range(M):
+        _idx = idx[_b, _m]
+        if _idx >= padding_value:
+            break
+        g_val = g[_b, _m, _g]
+        val = wp.dot(grad_out, g_val)
+        wp.atomic_add(grad_a, _idx, _a, _g, val)
+
+
+@wp.kernel(enable_backward=False)
+def _conv_sv_2d_sp_backward_g_kernel(
+    grad_output: wp.array3d(dtype=wp.vec4f),  # (B, A, G, D)
+    a: wp.array3d(dtype=wp.float32),  # (B, A, G)
+    idx: wp.array2d(dtype=wp.int32),  # (B, M)
+    grad_g: wp.array3d(dtype=wp.vec4f),  # (B, M, G, D)
+):
+    """Backward w.r.t. g: grad_g[b,m,g] = sum_a a[idx[b,m],a,g] * grad_output[b,a,g]"""
+    B = idx.shape[0]
+    A = a.shape[1]
+    padding_value = B - 1  # last row is padding
+
+    _b, _m, _g = wp.tid()
+
+    _idx = idx[_b, _m]
+    if _idx >= padding_value:
+        return
+
+    acc = wp.vec4f()
+
+    for _a in range(A):
+        grad_out = grad_output[_b, _a, _g]
+        a_val = a[_idx, _a, _g]
+        acc += a_val * grad_out
+
+    grad_g[_b, _m, _g] = acc
+
+
+@wp.kernel(enable_backward=False)
+def _conv_sv_2d_sp_double_backward_a_g_kernel(
+    grad_grad_a: wp.array3d(dtype=wp.float32),  # (B, A, G)
+    idx: wp.array2d(dtype=wp.int32),  # (B, M)
+    grad_output: wp.array3d(dtype=wp.vec4f),  # (B, A, G, D)
+    grad_g: wp.array3d(dtype=wp.vec4f),  # (B, M, G, D)
+):
+    """Double backward: d(grad_a)/dg -> grad_g"""
+    B = idx.shape[0]
+    A = grad_grad_a.shape[1]
+    padding_value = B - 1  # last row is padding
+
+    _b, _m, _g = wp.tid()
+
+    _idx = idx[_b, _m]
+    if _idx >= padding_value:
+        return
+
+    acc = wp.vec4f()
+
+    for _a in range(A):
+        grad_grad_a_val = grad_grad_a[_idx, _a, _g]
+        grad_out = grad_output[_b, _a, _g]
+        acc += grad_grad_a_val * grad_out
+
+    grad_g[_b, _m, _g] = acc
+
+
+@wp.kernel(enable_backward=False)
+def _conv_sv_2d_sp_double_backward_g_contrib_kernel(
+    grad2_g: wp.array3d(dtype=wp.vec4f),  # (B, M, G, D)
+    a: wp.array3d(dtype=wp.float32),  # (B, A, G)
+    idx: wp.array2d(dtype=wp.int32),  # (B, M)
+    grad_output_double: wp.array3d(dtype=wp.vec4f),  # (B, A, G, D) - OUTPUT
+):
+    """Double backward from grad2_g: einsum('bmgd,bmag->bagd', grad2_g, a_selected)"""
+    B, M = idx.shape[0], idx.shape[1]
+    padding_value = B - 1  # last row is padding
+
+    _b, _a, _g = wp.tid()
+
+    acc = wp.vec4f()
+    for _m in range(M):
+        _idx = idx[_b, _m]
+        if _idx >= padding_value:
+            break
+        a_val = a[_idx, _a, _g]
+        grad2_g_val = grad2_g[_b, _m, _g]
+        acc += a_val * grad2_g_val
+
+    grad_output_double[_b, _a, _g] = acc
+
+
+@wp.kernel(enable_backward=False)
+def _conv_sv_2d_sp_double_backward_a_contrib_kernel(
+    grad2_a: wp.array3d(dtype=wp.float32),  # (B, A, G)
+    idx: wp.array2d(dtype=wp.int32),  # (B, M)
+    g: wp.array3d(dtype=wp.vec4f),  # (B, M, G, D)
+    grad_output_double: wp.array3d(dtype=wp.vec4f),  # (B, A, G, D) - OUTPUT
+):
+    """Double backward from grad2_a: einsum('bmag,bmgd->bagd', grad2_a_selected, g)"""
+    B, M = idx.shape[0], idx.shape[1]
+    padding_value = B - 1  # last row is padding
+
+    _b, _a, _g = wp.tid()
+
+    acc = wp.vec4f()
+    for _m in range(M):
+        _idx = idx[_b, _m]
+        if _idx >= padding_value:
+            break
+        grad2_a_val = grad2_a[_idx, _a, _g]
+        g_val = g[_b, _m, _g]
+        acc += grad2_a_val * g_val
+
+    grad_output_double[_b, _a, _g] = acc
+
+
+# =============================================================================
+# PyTorch Custom Op Primitives
+# =============================================================================
+
+
+@torch.library.custom_op(
+    "aimnet::conv_sv_2d_sp_fwd",
+    mutates_args=(),
+    device_types=["cuda"],
+)
+def _(a: Tensor, idx: Tensor, g: Tensor) -> Tensor:
+    """Forward primitive for conv_sv_2d_sp."""
+    stream = _get_stream(a.device)
+    device = wp.device_from_torch(a.device)
+    B, A, G = a.shape
+    output = torch.zeros(B, A, G, 4, dtype=a.dtype, device=a.device)
+
+    wp.launch(
+        _conv_sv_2d_sp_kernel,
+        dim=(B - 1, A, G),  # B-1: exclude padding row
+        stream=stream,
+        device=device,
+        inputs=(
+            wp.from_torch(a.detach(), return_ctype=True),
+            wp.from_torch(idx.to(torch.int32), return_ctype=True),
+            wp.from_torch(g.detach(), return_ctype=True, dtype=wp.vec4f),
+            wp.from_torch(output, return_ctype=True, dtype=wp.vec4f),
+        ),
+    )
+    return output
+
+
+@torch.library.register_fake("aimnet::conv_sv_2d_sp_fwd")
+def _(a: Tensor, idx: Tensor, g: Tensor) -> Tensor:
+    B, A, G = a.shape
+    return torch.empty(B, A, G, 4, dtype=a.dtype, device=a.device)
+
+
+@torch.library.custom_op(
+    "aimnet::conv_sv_2d_sp_bwd",
+    mutates_args=(),
+    device_types=["cuda"],
+)
+def _(grad_output: Tensor, a: Tensor, idx: Tensor, g: Tensor) -> list[Tensor]:
+    """Backward primitive for conv_sv_2d_sp."""
+    stream = _get_stream(a.device)
+    device = wp.device_from_torch(a.device)
+    B, A, G = a.shape
+    B_out, M = idx.shape
+
+    grad_a = torch.zeros_like(a)
+    grad_g = torch.zeros(B_out, M, G, 4, dtype=g.dtype, device=g.device)
+
+    grad_output_contig = grad_output.detach().contiguous()
+
+    # Launch backward w.r.t. a
+    wp.launch(
+        _conv_sv_2d_sp_backward_a_kernel,
+        dim=(B - 1, A, G),  # B-1: exclude padding row
+        stream=stream,
+        device=device,
+        inputs=(
+            wp.from_torch(grad_output_contig, return_ctype=True, dtype=wp.vec4f),
+            wp.from_torch(idx.to(torch.int32), return_ctype=True),
+            wp.from_torch(g.detach(), return_ctype=True, dtype=wp.vec4f),
+            wp.from_torch(grad_a, return_ctype=True),
+        ),
+    )
+
+    # Launch backward w.r.t. g
+    wp.launch(
+        _conv_sv_2d_sp_backward_g_kernel,
+        dim=(B_out - 1, M, G),  # B_out-1: exclude padding row
+        stream=stream,
+        device=device,
+        inputs=(
+            wp.from_torch(grad_output_contig, return_ctype=True, dtype=wp.vec4f),
+            wp.from_torch(a.detach(), return_ctype=True),
+            wp.from_torch(idx.to(torch.int32), return_ctype=True),
+            wp.from_torch(grad_g, return_ctype=True, dtype=wp.vec4f),
+        ),
+    )
+
+    return [grad_a, grad_g]
+
+
+@torch.library.register_fake("aimnet::conv_sv_2d_sp_bwd")
+def _(grad_output: Tensor, a: Tensor, idx: Tensor, g: Tensor) -> list[Tensor]:
+    B_out, M = idx.shape
+    G = a.shape[2]
+    return [
+        torch.empty_like(a),
+        torch.empty(B_out, M, G, 4, dtype=g.dtype, device=g.device),
+    ]
+
+
+@torch.library.custom_op(
+    "aimnet::conv_sv_2d_sp_bwd_bwd",
+    mutates_args=(),
+    device_types=["cuda"],
+)
+def _(
+    grad_output: Tensor,
+    grad2_a: Tensor,
+    grad2_g: Tensor,
+    a: Tensor,
+    idx: Tensor,
+    g: Tensor,
+) -> list[Tensor]:
+    """Double backward primitive for conv_sv_2d_sp."""
+    stream = _get_stream(a.device)
+    device = wp.device_from_torch(a.device)
+    B, A, G = a.shape
+    B_out, M = idx.shape
+
+    grad_grad_output = torch.zeros(B, A, G, 4, dtype=a.dtype, device=a.device)
+    grad_a_double = torch.zeros_like(a)
+    grad_g_double = torch.zeros(B_out, M, G, 4, dtype=a.dtype, device=a.device)
+
+    grad_output_contig = grad_output.detach().contiguous()
+    grad2_a_contig = grad2_a.detach().contiguous()
+    grad2_g_contig = grad2_g.detach().contiguous()
+
+    # Contribution from grad2_g to grad_grad_output
+    wp.launch(
+        _conv_sv_2d_sp_double_backward_g_contrib_kernel,
+        dim=(B - 1, A, G),  # B-1: exclude padding row
+        stream=stream,
+        device=device,
+        inputs=(
+            wp.from_torch(grad2_g_contig, return_ctype=True, dtype=wp.vec4f),
+            wp.from_torch(a.detach(), return_ctype=True),
+            wp.from_torch(idx.to(torch.int32), return_ctype=True),
+            wp.from_torch(grad_grad_output, return_ctype=True, dtype=wp.vec4f),
+        ),
+    )
+
+    # Contribution from grad2_a to grad_grad_output
+    grad_output_2_a = torch.zeros(B, A, G, 4, dtype=a.dtype, device=a.device)
+    wp.launch(
+        _conv_sv_2d_sp_double_backward_a_contrib_kernel,
+        dim=(B - 1, A, G),  # B-1: exclude padding row
+        stream=stream,
+        device=device,
+        inputs=(
+            wp.from_torch(grad2_a_contig, return_ctype=True),
+            wp.from_torch(idx.to(torch.int32), return_ctype=True),
+            wp.from_torch(g.detach(), return_ctype=True, dtype=wp.vec4f),
+            wp.from_torch(grad_output_2_a, return_ctype=True, dtype=wp.vec4f),
+        ),
+    )
+    grad_grad_output = grad_grad_output + grad_output_2_a
+
+    # Mixed partial: d(grad_a)/dg -> grad_g_double
+    wp.launch(
+        _conv_sv_2d_sp_double_backward_a_g_kernel,
+        dim=(B_out - 1, M, G),  # B_out-1: exclude padding row
+        stream=stream,
+        device=device,
+        inputs=(
+            wp.from_torch(grad2_a_contig, return_ctype=True),
+            wp.from_torch(idx.to(torch.int32), return_ctype=True),
+            wp.from_torch(grad_output_contig, return_ctype=True, dtype=wp.vec4f),
+            wp.from_torch(grad_g_double, return_ctype=True, dtype=wp.vec4f),
+        ),
+    )
+
+    # Mixed partial: d(grad_g)/da -> grad_a_double
+    wp.launch(
+        _conv_sv_2d_sp_backward_a_kernel,
+        dim=(B - 1, A, G),  # B-1: exclude padding row
+        stream=stream,
+        device=device,
+        inputs=(
+            wp.from_torch(grad_output_contig, return_ctype=True, dtype=wp.vec4f),
+            wp.from_torch(idx.to(torch.int32), return_ctype=True),
+            wp.from_torch(grad2_g_contig, return_ctype=True, dtype=wp.vec4f),
+            wp.from_torch(grad_a_double, return_ctype=True),
+        ),
+    )
+
+    return [grad_grad_output, grad_a_double, grad_g_double]
+
+
+@torch.library.register_fake("aimnet::conv_sv_2d_sp_bwd_bwd")
+def _(
+    grad_output: Tensor,
+    grad2_a: Tensor,
+    grad2_g: Tensor,
+    a: Tensor,
+    idx: Tensor,
+    g: Tensor,
+) -> list[Tensor]:
+    B, A, G = a.shape
+    B_out, M = idx.shape
+    return [
+        torch.empty(B, A, G, 4, dtype=a.dtype, device=a.device),
+        torch.empty_like(a),
+        torch.empty(B_out, M, G, 4, dtype=a.dtype, device=a.device),
+    ]
+
+
+# =============================================================================
+# Autograd Registration
+# =============================================================================
+
+
+def _conv_sv_2d_sp_setup_fwd_context(ctx, inputs, output):
+    """Setup context for forward pass."""
+    a, idx, g = inputs
+    ctx.save_for_backward(a, idx, g)
+
+
+def _conv_sv_2d_sp_setup_bwd_context(ctx, inputs, output):
+    """Setup context for backward pass."""
+    grad_output, a, idx, g = inputs
+    ctx.save_for_backward(grad_output, a, idx, g)
+
+
+@torch.compiler.allow_in_graph
+def _conv_sv_2d_sp_bwd(ctx, grad_output):
+    """Backward pass for conv_sv_2d_sp."""
+    a, idx, g = ctx.saved_tensors
+    grad_a, grad_g = torch.ops.aimnet.conv_sv_2d_sp_bwd(grad_output.contiguous(), a, idx, g)
+    return grad_a, None, grad_g
+
+
+@torch.compiler.allow_in_graph
+def _conv_sv_2d_sp_bwd_bwd(ctx, *grad_outputs):
+    """Double backward pass for conv_sv_2d_sp."""
+    grad2_a = grad_outputs[0][0]
+    grad2_g = grad_outputs[0][1]
+
+    grad_output_saved, a, idx, g = ctx.saved_tensors
+
+    if grad2_a is None:
+        grad2_a = torch.zeros_like(a)
+    if grad2_g is None:
+        B_out, M = idx.shape
+        G = a.shape[2]
+        grad2_g = torch.zeros(B_out, M, G, 4, dtype=g.dtype, device=g.device)
+
+    outputs = torch.ops.aimnet.conv_sv_2d_sp_bwd_bwd(grad_output_saved, grad2_a, grad2_g, a, idx, g)
+
+    return outputs[0], outputs[1], None, outputs[2]
+
+
+torch.library.register_autograd(
+    "aimnet::conv_sv_2d_sp_fwd",
+    _conv_sv_2d_sp_bwd,
+    setup_context=_conv_sv_2d_sp_setup_fwd_context,
+)
+
+torch.library.register_autograd(
+    "aimnet::conv_sv_2d_sp_bwd",
+    _conv_sv_2d_sp_bwd_bwd,
+    setup_context=_conv_sv_2d_sp_setup_bwd_context,
+)
+
+
+# =============================================================================
+# Public API
+# =============================================================================
+
+
+def conv_sv_2d_sp(a: Tensor, idx: Tensor, g: Tensor) -> Tensor:
+    """Compute conv_sv_2d_sp with support for 1st and 2nd order derivatives.
+
+    Parameters
+    ----------
+    a : Tensor
+        Input tensor of shape (B, A, G).
+    idx : Tensor
+        Index tensor of shape (B, M).
+    g : Tensor
+        Gate tensor of shape (B, M, G, 4).
+
+    Returns
+    -------
+    Tensor
+        Output tensor of shape (B, A, G, 4).
+    """
+    return torch.ops.aimnet.conv_sv_2d_sp_fwd(a, idx, g)
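The kernels above implement a batched gather-and-gate contraction: for every atom `a` and shift channel `g`, neighbor features `a[idx[b,m]]` are weighted by the four-component gate `g[b,m,g]` and summed over the neighbor dimension `m`, with batch row `B - 1` reserved as padding. As a reading aid, here is a minimal pure-PyTorch sketch of the same forward semantics; the helper `conv_sv_2d_sp_ref` is hypothetical and not part of the wheel:

```python
import torch

def conv_sv_2d_sp_ref(a: torch.Tensor, idx: torch.Tensor, g: torch.Tensor) -> torch.Tensor:
    """Reference for the forward docstring: output[b,a,g] = sum_m a[idx[b,m],a,g] * g[b,m,g]."""
    B = a.shape[0]
    mask = idx < B - 1                      # entries >= B-1 mark padded neighbors
    idx_safe = idx.clamp(max=B - 1).long()  # keep padded indices in range for the gather
    a_sel = a[idx_safe]                     # (B, M, A, G): neighbor features gathered per m
    g_masked = g * mask[..., None, None].to(g.dtype)
    out = torch.einsum("bmag,bmgd->bagd", a_sel, g_masked)
    out[-1] = 0.0                           # kernels launch over B-1 rows, so the padding row stays zero
    return out
```

Since the Warp kernels `break` at the first padding index, this masked reference agrees with them when padding entries are trailing in `idx`, which the launch comments imply. Registering both `conv_sv_2d_sp_bwd` and `conv_sv_2d_sp_bwd_bwd` means a quantity differentiated twice through the op (for example forces inside a force-matching loss) stays on the fused CUDA path.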
aimnet/models/__init__.py
CHANGED
@@ -1,2 +1,14 @@
 from .aimnet2 import AIMNet2  # noqa: F401
-from .base import AIMNet2Base  # noqa: F401
+from .base import AIMNet2Base, load_model  # noqa: F401
+from .utils import (  # noqa: F401
+    extract_coulomb_rc,
+    extract_d3_params,
+    extract_species,
+    has_d3ts,
+    has_d3ts_in_config,
+    has_dftd3_in_config,
+    has_dispersion,
+    has_externalizable_dftd3,
+    has_lrcoulomb,
+    iter_lrcoulomb_mods,
+)
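Version 0.1.0 widens the `aimnet.models` namespace: `load_model` is re-exported from `aimnet.models.base`, alongside introspection helpers from the new `aimnet/models/utils.py`. Their signatures are outside this diff, so the snippet below only illustrates the import surface; the argument passed to `load_model` is an assumption:

```python
# Illustrative only: load_model and the has_*/extract_* helpers are defined in
# aimnet/models/base.py and aimnet/models/utils.py, which this diff does not show.
from aimnet.models import has_dispersion, has_lrcoulomb, load_model

model = load_model("aimnet2")  # assumed: a registry name or checkpoint path
print(has_dispersion(model), has_lrcoulomb(model))  # query dispersion / long-range Coulomb blocks
```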
aimnet/models/aimnet2.py
CHANGED
@@ -1,4 +1,4 @@
-from …
+from collections.abc import Mapping, Sequence
 
 import torch
 from torch import Tensor, nn
@@ -8,17 +8,16 @@ from aimnet.models.base import AIMNet2Base
 from aimnet.modules import AEVSV, MLP, ConvSV, Embedding
 
 
-# pylint: disable=too-many-arguments, too-many-instance-attributes
 class AIMNet2(AIMNet2Base):
     def __init__(
         self,
-        aev: …
+        aev: dict,
         nfeature: int,
         d2features: bool,
         ncomb_v: int,
-        hidden: …
+        hidden: tuple[list[int]],
         aim_size: int,
-        outputs: …
+        outputs: list[nn.Module] | dict[str, nn.Module],
         num_charge_channels: int = 1,
     ):
         super().__init__()
@@ -29,7 +28,7 @@ class AIMNet2(AIMNet2Base):
 
         self.aev = AEVSV(**aev)
         nshifts_s = aev["nshifts_s"]
-        nshifts_v = aev.get("…
+        nshifts_v = aev.get("nshifts_v") or nshifts_s
         if d2features:
             if nshifts_s != nshifts_v:
                 raise ValueError("nshifts_s must be equal to nshifts_v for d2features")
@@ -49,7 +48,7 @@ class AIMNet2(AIMNet2Base):
             self.afv.weight.clone().unsqueeze(-1).expand(64, nfeature, nshifts_s).flatten(-2, -1)
         )
 
-        conv_param = {"nshifts_s": nshifts_s, "nshifts_v": nshifts_v, "ncomb_v": ncomb_v…
+        conv_param = {"nshifts_s": nshifts_s, "nshifts_v": nshifts_v, "ncomb_v": ncomb_v}
         self.conv_a = ConvSV(nchannel=nfeature, d2features=d2features, **conv_param)
         self.conv_q = ConvSV(nchannel=num_charge_channels, d2features=False, **conv_param)
 
@@ -90,7 +89,7 @@ class AIMNet2(AIMNet2Base):
         else:
             raise TypeError("`outputs` is not either list or dict")
 
-    def _preprocess_spin_polarized_charge(self, data: …
+    def _preprocess_spin_polarized_charge(self, data: dict[str, Tensor]) -> dict[str, Tensor]:
         if "mult" not in data:
             raise ValueError("mult key is required for NSE if two channels for charge are not provided")
         _half_spin = 0.5 * (data["mult"] - 1.0)
@@ -98,27 +97,27 @@ class AIMNet2(AIMNet2Base):
         data["charge"] = torch.stack([_half_q + _half_spin, _half_q - _half_spin], dim=-1)
         return data
 
-    def _postprocess_spin_polarized_charge(self, data: …
+    def _postprocess_spin_polarized_charge(self, data: dict[str, Tensor]) -> dict[str, Tensor]:
         data["spin_charges"] = data["charges"][..., 0] - data["charges"][..., 1]
         data["charges"] = data["charges"].sum(dim=-1)
         data["charge"] = data["charge"].sum(dim=-1)
         return data
 
-    def _prepare_in_a(self, data: …
-        a_i …
-        avf_a = self.conv_a(…
+    def _prepare_in_a(self, data: dict[str, Tensor]) -> Tensor:
+        a_i = nbops.get_i(data["a"], data)
+        avf_a = self.conv_a(data, data["a"])
         if self.d2features:
             a_i = a_i.flatten(-2, -1)
         _in = torch.cat([a_i.squeeze(-2), avf_a], dim=-1)
         return _in
 
-    def _prepare_in_q(self, data: …
-        q_i …
-        avf_q = self.conv_q(…
+    def _prepare_in_q(self, data: dict[str, Tensor]) -> Tensor:
+        q_i = nbops.get_i(data["charges"], data)
+        avf_q = self.conv_q(data, data["charges"])
         _in = torch.cat([q_i.squeeze(-2), avf_q], dim=-1)
         return _in
 
-    def _update_q(self, data: …
+    def _update_q(self, data: dict[str, Tensor], x: Tensor, delta_q: bool = True) -> dict[str, Tensor]:
         _q, _f, delta_a = x.split(
             [
                 self.num_charge_channels,
@@ -127,16 +126,17 @@ class AIMNet2(AIMNet2Base):
             ],
             dim=-1,
         )
-        # for loss
+        # Charge conservation violation penalty for training loss
         data["_delta_Q"] = data["charge"] - nbops.mol_sum(_q, data)
         q = data["charges"] + _q if delta_q else _q
+        data["charges_pre"] = q if self.num_charge_channels == 2 else q.squeeze(-1)
         f = _f.pow(2)
         q = ops.nse(data["charge"], q, f, data, epsilon=1.0e-6)
         data["charges"] = q
         data["a"] = data["a"] + delta_a.view_as(data["a"])
         return data
 
-    def forward(self, data: …
+    def forward(self, data: dict[str, Tensor]) -> dict[str, Tensor]:
         data = self.prepare_input(data)
 
         # initial features
@@ -149,13 +149,11 @@ class AIMNet2(AIMNet2Base):
         if self.num_charge_channels == 2:
             data = self._preprocess_spin_polarized_charge(data)
         else:
-            # …
+            # Ensure charge tensor has channel dimension for consistency with features
            data["charge"] = data["charge"].unsqueeze(-1)
 
-        # AEV
         data = self.aev(data)
 
-        # MP iterations
         _npass = len(self.mlps)
         for ipass, mlp in enumerate(self.mlps):
             if ipass == 0:
@@ -181,7 +179,6 @@ class AIMNet2(AIMNet2Base):
         data["charges"] = data["charges"].squeeze(-1)
         data["charge"] = data["charge"].squeeze(-1)
 
-        # readout
         for m in self.outputs.children():
             data = m(data)
 
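When `num_charge_channels == 2`, `_preprocess_spin_polarized_charge` splits the scalar molecular charge into two channels whose sum reproduces the total charge and whose difference equals `mult - 1`, the number of unpaired electrons; `_postprocess_spin_polarized_charge` inverts this into `charges` and `spin_charges`. A small numeric sketch of that arithmetic (assuming `_half_q = 0.5 * data["charge"]`, whose defining line falls outside the hunk shown):

```python
import torch

charge = torch.tensor(0.0)  # neutral molecule
mult = torch.tensor(2.0)    # doublet: one unpaired electron

half_q = 0.5 * charge
half_spin = 0.5 * (mult - 1.0)
charge_2ch = torch.stack([half_q + half_spin, half_q - half_spin], dim=-1)

print(charge_2ch)                               # tensor([ 0.5000, -0.5000])
print(charge_2ch.sum(-1))                       # total charge preserved: tensor(0.)
print(charge_2ch[..., 0] - charge_2ch[..., 1])  # mult - 1 unpaired electrons: tensor(1.)
```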