PyPI - foscat - Versions diffs - 2025.9.4__py3-none-any.whl → 2025.10.2__py3-none-any.whl - Mend

foscat 2025.9.4__py3-none-any.whl → 2025.10.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13) hide show

foscat/FoCUS.py +14 -9
foscat/Plot.py +59 -17
foscat/healpix_unet_torch.py +17 -1
foscat/healpix_vit_skip.py +445 -0
foscat/healpix_vit_torch-old.py +658 -0
foscat/healpix_vit_torch.py +521 -0
foscat/planar_vit.py +206 -0
foscat/unet_2_d_from_healpix_params.py +421 -0
{foscat-2025.9.4.dist-info → foscat-2025.10.2.dist-info}/METADATA +1 -1
{foscat-2025.9.4.dist-info → foscat-2025.10.2.dist-info}/RECORD +13 -8
{foscat-2025.9.4.dist-info → foscat-2025.10.2.dist-info}/WHEEL +0 -0
{foscat-2025.9.4.dist-info → foscat-2025.10.2.dist-info}/licenses/LICENSE +0 -0
{foscat-2025.9.4.dist-info → foscat-2025.10.2.dist-info}/top_level.txt +0 -0

foscat/FoCUS.py CHANGED Viewed

@@ -6,7 +6,7 @@ import numpy as np
 import foscat.HealSpline as HS
 from scipy.interpolate import griddata
-TMPFILE_VERSION = "V9_0"
+TMPFILE_VERSION = "V10_0"
 class FoCUS:
@@ -36,7 +36,7 @@ class FoCUS:
             mpi_rank=0
     ):
-        self.__version__ = "2025.09.4"
+        self.__version__ = "2025.10.2"
         # P00 coeff for normalization for scat_cov
         self.TMPFILE_VERSION = TMPFILE_VERSION
         self.P1_dic = None
@@ -1488,7 +1488,7 @@ class FoCUS:
                     if l_kernel == 5:
                         pw = 0.5
                         pw2 = 0.5
-                        threshold = 2e-4
+                        threshold = 2e-5
                     elif l_kernel == 3:
                         pw = 1.0 / np.sqrt(2)
@@ -1498,7 +1498,7 @@ class FoCUS:
                     elif l_kernel == 7:
                         pw = 0.5
                         pw2 = 0.25
-                        threshold = 4e-5
+                        threshold = 2e-5
                     import foscat.SphericalStencil as hs
                     import torch
@@ -1517,14 +1517,19 @@ class FoCUS:
                                                 n_gauges=self.NORIENT,
                                                 gauge_type='cosmo')
-                    xx=np.tile(np.arange(self.KERNELSZ)-self.KERNELSZ//2,self.KERNELSZ).reshape(self.KERNELSZ*self.KERNELSZ)
+                    xx=np.tile(np.arange(self.KERNELSZ)-self.KERNELSZ//2,self.KERNELSZ).reshape(self.KERNELSZ,self.KERNELSZ)
-                    wwr=hconvol.to_tensor((np.exp(-pw2*(xx**2+(xx.T)**2))*np.cos(pw*xx*np.pi)).reshape(1,1,self.KERNELSZ*self.KERNELSZ))
+                    wwr=(np.exp(-pw2*(xx**2+(xx.T)**2))*np.cos(pw*xx*np.pi)).reshape(1,1,self.KERNELSZ*self.KERNELSZ)
                     wwr-=wwr.mean()
-                    wwi=hconvol.to_tensor((np.exp(-pw2*(xx**2+(xx.T)**2))*np.sin(pw*xx*np.pi)).reshape(1,1,self.KERNELSZ*self.KERNELSZ))
+                    wwi=(np.exp(-pw2*(xx**2+(xx.T)**2))*np.sin(pw*xx*np.pi)).reshape(1,1,self.KERNELSZ*self.KERNELSZ)
                     wwi-=wwi.mean()
-                    wwr/=(abs(wwr+1J*wwi)).sum()
-                    wwi/=(abs(wwr+1J*wwi)).sum()
+                    amp=np.sum(abs(wwr+1J*wwi))
+                    wwr/=amp
+                    wwi/=amp
+                    wwr=hconvol.to_tensor(wwr)
+                    wwi=hconvol.to_tensor(wwi)
                     wavr,indice,mshape=hconvol.make_matrix(wwr)
                     wavi,indice,mshape=hconvol.make_matrix(wwi)

foscat/Plot.py CHANGED Viewed

@@ -959,8 +959,9 @@ def conjugate_gradient_normal_equation(data, x0, www, all_idx,
         rs_new = np.dot(r, r)
-        if verbose and i % 50 == 0:
-            print(f"Iter {i:03d}: residual = {np.sqrt(rs_new):.3e}")
+        if verbose and i % 10 == 0:
+            v=np.mean((LP(p, www, all_idx)-data)**2)
+            print(f"Iter {i:03d}: residual = {np.sqrt(rs_new):.3e},{np.sqrt(v):.3e}")
         if np.sqrt(rs_new) < tol:
             if verbose:
@@ -1065,28 +1066,69 @@ def _spectrum_polar_to_cartesian_core(
     valid = np.isfinite(radial_index)
     try:
         from scipy.ndimage import map_coordinates
-        order = 3 if method.lower() == "bicubic" else 1
-        coords = np.vstack([radial_index.ravel(), angular_index.ravel()])
-        eps = 1e-6
-        coords[0, :] = np.where(np.isfinite(coords[0, :]),
-                                np.clip(coords[0, :], 0.0+eps, (ns-1)-eps), 0.0)
-        sampled = map_coordinates(
-            w, coords, order=order, mode="wrap", cval=fill_value, prefilter=True
-        ).reshape(n_pixels, n_pixels)
-        img = np.where(valid, sampled, fill_value)
+        if method.lower() == "bicubic":
+            # ===== Bicubic with circular angular wrap =====
+            # Pad the angular axis by K columns on both sides so that the cubic kernel
+            # has valid neighbors across the 0°/360° seam. K=2 is enough for a cubic kernel.
+            K = 2
+            # w has shape (Nscale, Norient)
+            w_pad = np.concatenate([w[:, -K:], w, w[:, :K]], axis=1)  # (ns, no+2K)
+            # Build coordinates for map_coordinates on the padded array:
+            # - radial index stays the same, clipped to [0, ns-1] (no wrap)
+            # - angular index is shifted by +K and wrapped into [0, no) before querying
+            order = 3
+            coords = np.vstack([radial_index.ravel(), angular_index.ravel()])
+            # clip the radial coordinate to the valid [eps, ns-1-eps] band
+            eps = 1e-6
+            coords[0, :] = np.where(
+                np.isfinite(coords[0, :]),
+                np.clip(coords[0, :], 0.0 + eps, (ns - 1) - eps),
+                0.0,
+            )
+            # wrap angular coordinate to [0, no) then shift by +K to address the padded array
+            ang = np.mod(coords[1, :], float(no)) + K  # [K, no+K)
+            coords[1, :] = ang
+            # Now sample the padded array; 'nearest' mode is fine thanks to explicit padding
+            sampled = map_coordinates(
+                w_pad, coords, order=order, mode="nearest", cval=fill_value, prefilter=True
+            ).reshape(n_pixels, n_pixels)
+            img = np.where(valid, sampled, fill_value)
+        else:
+            # ===== Bilinear (or other) without special padding =====
+            order = 1
+            coords = np.vstack([radial_index.ravel(), angular_index.ravel()])
+            eps = 1e-6
+            coords[0, :] = np.where(
+                np.isfinite(coords[0, :]),
+                np.clip(coords[0, :], 0.0 + eps, (ns - 1) - eps),
+                0.0,
+            )
+            # For non-bicubic, SciPy's mode="wrap" is sufficient on the angular axis
+            sampled = map_coordinates(
+                w, coords, order=order, mode="wrap", cval=fill_value, prefilter=True
+            ).reshape(n_pixels, n_pixels)
+            img = np.where(valid, sampled, fill_value)
     except Exception:
-        # bilinear fallback
+        # ---- Vectorized bilinear fallback with explicit angular wrap ----
         r_idx = np.floor(radial_index).astype(np.int64)
         t_idx = np.floor(angular_index).astype(np.int64)
-        r_idx = np.clip(r_idx, 0, ns-2)
+        r_idx = np.clip(r_idx, 0, ns - 2)
         t0 = np.mod(t_idx, no)
-        t1 = np.mod(t_idx+1, no)
+        t1 = np.mod(t_idx + 1, no)
         tr = np.clip(radial_index - r_idx, 0.0, 1.0)
         ta = np.clip(angular_index - t_idx, 0.0, 1.0)
         f00 = w[r_idx,     t0]
         f01 = w[r_idx,     t1]
-        f10 = w[r_idx+1,   t0]
-        f11 = w[r_idx+1,   t1]
+        f10 = w[r_idx + 1, t0]
+        f11 = w[r_idx + 1, t1]
         g0 = (1.0 - ta) * f00 + ta * f01
         g1 = (1.0 - ta) * f10 + ta * f11
         img = (1.0 - tr) * g0 + tr * g1
@@ -1114,7 +1156,7 @@ def plot_wave(wave,title="spectrum",unit="Amplitude",cmap="viridis"):
     plt.xlabel(r"$k_x$ [cycles / km]")
     plt.ylabel(r"$k_y$ [cycles / km]")
     plt.title(title)
 def lonlat_edges_from_ref(shape, ref_lon, ref_lat, dlon, dlat, anchor="center"):
     """
     Build lon/lat *edges* (H+1, W+1) for a regular, axis-aligned grid.

foscat/healpix_unet_torch.py CHANGED Viewed

@@ -982,6 +982,9 @@ def fit(
         n_epoch: int = 10,
         view_epoch: int = 10,
         batch_size: int = 16,
+        x_valid: Union[torch.Tensor, np.ndarray, List[Union[torch.Tensor, np.ndarray]]]= None,
+        y_valid: Union[torch.Tensor, np.ndarray, List[Union[torch.Tensor, np.ndarray]]]= None,
+        save_model: bool = False,
         lr: float = 1e-3,
         weight_decay: float = 0.0,
         clip_grad_norm: Optional[float] = None,
@@ -1005,6 +1008,11 @@ def fit(
     device = model.runtime_device if hasattr(model, "runtime_device") else (torch.device("cuda") if torch.cuda.is_available() else torch.device("cpu"))
     model.to(device)
+    if save_model:
+        assert x_valid is None, "If save_mode=True x_valid should not be None"
+        assert y_valid is None, "If save_mode=True y_valid should not be None"
+        best_valid=1E30
     # Detect variable-length mode
     varlen_mode = isinstance(x_train, (list, tuple))
@@ -1197,6 +1205,14 @@ def fit(
             history.append(epoch_loss)
             # print every view_epoch logical step
             if verbose and ((len(history) % view_epoch == 0) or (len(history) == 1)):
-                print(f"[epoch {len(history)}] loss={epoch_loss:.6f}")
+                if x_valid is not None:
+                    preds=model.predict(model.to_tensor(x_valid)).cpu().numpy()
+                    valid_loss=np.mean((preds-y_valid)**2)
+                    if save_model:
+                        if best_valid>valid_loss:
+                            torch.save({"model": self.state_dict(), "cfg": CFG}, os.path.join(CFG["save_dir"], "best.pt"))
+                    print(f"[epoch {len(history)}] loss={epoch_loss:.4f} loss_valid={valid_loss:.4f}")
+                else:
+                    print(f"[epoch {len(history)}] loss={epoch_loss:.4f}")
     return {"loss": history}

foscat/healpix_vit_skip.py ADDED Viewed

@@ -0,0 +1,445 @@
+# healpix_vit_skip.py
+# HEALPix ViT U-Net with temporal encoders and Transformer-based skip fusion.
+# - Multi-level HEALPix pyramid using Foscat.SphericalStencil
+# - Per-level temporal encoding (sequence over T_in months) at encoder
+# - Decoder uses cross-attention to fuse upsampled features with encoder skips
+# - Double spherical convolution + GroupNorm + GELU at each encoder/decoder level
+from __future__ import annotations
+from typing import List, Optional, Literal
+import numpy as np
+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+import foscat.scat_cov as sc
+import foscat.SphericalStencil as ho
+class MLP(nn.Module):
+    """Feed-forward block: LayerNorm -> Linear -> GELU -> Dropout -> Linear -> Dropout.
+    The hidden width is ``hidden_mult * d``; input and output both have last dimension ``d``.
+    """
+    def __init__(self, d: int, hidden_mult: int = 4, drop: float = 0.0):
+        super().__init__()
+        width = hidden_mult * d
+        # Layers are created in application order so parameter initialisation order is unchanged.
+        stages = [
+            nn.LayerNorm(d),
+            nn.Linear(d, width),
+            nn.GELU(),
+            nn.Dropout(drop),
+            nn.Linear(width, d),
+            nn.Dropout(drop),
+        ]
+        self.net = nn.Sequential(*stages)
+    def forward(self, x):
+        """Run ``x`` through the feed-forward stack and return the result."""
+        out = self.net(x)
+        return out
+class HealpixViTSkip(nn.Module):
+    """HEALPix ViT U-Net with per-level temporal encoders and cross-attention skip fusion.
+    Each time step is embedded with a double spherical convolution, then pushed down a pyramid
+    of ``len(level_dims) - 1`` levels (double convolution followed by ``Down``). The time axis
+    of every skip level is summarised by a small Transformer encoder and averaged, a
+    Transformer runs over the coarsest tokens, and the decoder applies ``Up``, cross-attention
+    against the skip and a double convolution at every level.
+    Args:
+        in_nside: nside of the finest (input) grid; it is halved at every level.
+        n_chan_in: number of input channels per time step.
+        level_dims: channel width of every level, finest first; the last entry is the
+            token embedding dimension.
+        depth_token: number of Transformer layers applied to the coarsest tokens.
+        num_heads_token: attention heads of the token Transformer; must divide
+            ``level_dims[-1]``.
+        cell_ids: pixel indices of the finest grid (required).
+        task: ``"regression"``, ``"segmentation"`` or ``"global"``.
+        out_channels: number of output channels (output features for ``"global"``).
+        mlp_ratio_token: feed-forward width multiplier of the token Transformer.
+        KERNELSZ: side of the spherical convolution kernel.
+        gauge_type: gauge convention forwarded to ``SphericalStencil``.
+        G: number of gauges; every entry of ``level_dims`` (and ``out_channels`` for
+            non-global tasks) must be divisible by it.
+        prefer_foscat_gpu: stored on the instance; not otherwise used by this class.
+        dropout: dropout rate of the Transformer layers and the fusion MLPs.
+        dtype: ``"float32"`` or ``"float64"``; any other value is treated as float64.
+        pos_embed_per_level: add a learned positional embedding to the queries and keys of
+            every decoder fusion stage.
+    Raises:
+        ValueError: on inconsistent channel/gauge/head sizes or when ``cell_ids`` is None.
+    """
+    def __init__(
+        self,
+        *,
+        in_nside: int,
+        n_chan_in: int,
+        level_dims: List[int],
+        depth_token: int,
+        num_heads_token: int,
+        cell_ids: np.ndarray,
+        task: Literal["regression","segmentation","global"] = "regression",
+        out_channels: int = 1,
+        mlp_ratio_token: float = 4.0,
+        KERNELSZ: int = 3,
+        gauge_type: Literal["cosmo","phi"] = "cosmo",
+        G: int = 1,
+        prefer_foscat_gpu: bool = True,
+        dropout: float = 0.1,
+        dtype: Literal["float32","float64"] = "float32",
+        pos_embed_per_level: bool = True,
+    ) -> None:
+        super().__init__()
+        self.in_nside = int(in_nside)
+        self.n_chan_in = int(n_chan_in)
+        self.level_dims = list(level_dims)
+        # Number of Down steps between the finest grid and the token grid.
+        self.token_down = len(self.level_dims) - 1
+        assert self.token_down >= 0
+        self.C_fine = int(self.level_dims[0])
+        self.embed_dim = int(self.level_dims[-1])
+        self.depth_token = int(depth_token)
+        self.num_heads_token = int(num_heads_token)
+        self.mlp_ratio_token = float(mlp_ratio_token)
+        self.task = task
+        self.out_channels = int(out_channels)
+        self.KERNELSZ = int(KERNELSZ)
+        self.gauge_type = gauge_type
+        self.G = int(G)
+        self.prefer_foscat_gpu = bool(prefer_foscat_gpu)
+        self.dropout = float(dropout)
+        self.dtype = dtype
+        self.pos_embed_per_level = bool(pos_embed_per_level)
+        for d in self.level_dims:
+            if d % self.G != 0:
+                raise ValueError(f"All level_dims must be divisible by G={self.G}, got {d}.")
+        if self.embed_dim % self.num_heads_token != 0:
+            raise ValueError("embed_dim must be divisible by num_heads_token.")
+        if dtype == "float32":
+            self.np_dtype = np.float32
+            self.torch_dtype = torch.float32
+        else:
+            self.np_dtype = np.float64
+            # Fix: this branch previously selected torch.float32, so the float64 request
+            # was silently ignored on the torch side.
+            self.torch_dtype = torch.float64
+        if cell_ids is None:
+            raise ValueError("cell_ids (finest) must be provided.")
+        self.cell_ids_fine = np.asarray(cell_ids)
+        if self.task == "segmentation":
+            self.final_activation = "sigmoid" if self.out_channels == 1 else "softmax"
+        else:
+            self.final_activation = "none"
+        self.f = sc.funct(KERNELSZ=self.KERNELSZ)
+        # Build one stencil per pyramid level and record the cell ids of every level by
+        # pushing a dummy map through Down.
+        self.hconv_levels: List[ho.SphericalStencil] = []
+        self.level_cell_ids: List[np.ndarray] = [self.cell_ids_fine]
+        current_nside = self.in_nside
+        dummy = self.f.backend.bk_cast(np.zeros((1, 1, self.cell_ids_fine.shape[0]), dtype=self.np_dtype))
+        for _ in range(self.token_down):
+            hc = ho.SphericalStencil(current_nside, self.KERNELSZ, n_gauges=self.G,
+                                     gauge_type=self.gauge_type, cell_ids=self.level_cell_ids[-1],
+                                     dtype=self.torch_dtype)
+            self.hconv_levels.append(hc)
+            dummy, next_ids = hc.Down(dummy, cell_ids=self.level_cell_ids[-1], nside=current_nside, max_poll=True)
+            self.level_cell_ids.append(self.f.backend.to_numpy(next_ids))
+            current_nside //= 2
+        self.token_nside = current_nside if self.token_down > 0 else self.in_nside
+        self.token_cell_ids = self.level_cell_ids[-1]
+        self.hconv_token = ho.SphericalStencil(self.token_nside, self.KERNELSZ, n_gauges=self.G,
+                                               gauge_type=self.gauge_type, cell_ids=self.token_cell_ids, dtype=self.torch_dtype)
+        self.hconv_head  = ho.SphericalStencil(self.in_nside, self.KERNELSZ, n_gauges=self.G,
+                                               gauge_type=self.gauge_type, cell_ids=self.cell_ids_fine, dtype=self.torch_dtype)
+        self.nsides_levels = [self.in_nside // (2**i) for i in range(self.token_down+1)]
+        # Full-sphere pixel counts; they size the per-level positional embeddings, which are
+        # sliced to the actual token count in forward().
+        self.ntokens_levels = [12 * n * n for n in self.nsides_levels]
+        # Patch embed (double conv)
+        fine_g = self.C_fine // self.G
+        self.pe_w1 = self._new_kernel(self.n_chan_in, fine_g)
+        self.pe_w2 = self._new_kernel(self.C_fine, fine_g)
+        self.pe_bn1 = self._new_group_norm(self.C_fine)
+        self.pe_bn2 = self._new_group_norm(self.C_fine)
+        # Encoder double convs
+        self.enc_w1 = nn.ParameterList()
+        self.enc_w2 = nn.ParameterList()
+        self.enc_bn1 = nn.ModuleList()
+        self.enc_bn2 = nn.ModuleList()
+        for i in range(self.token_down):
+            Cin = self.level_dims[i]
+            Cout = self.level_dims[i+1]
+            Cout_g = Cout // self.G
+            self.enc_w1.append(self._new_kernel(Cin, Cout_g))
+            self.enc_w2.append(self._new_kernel(Cout, Cout_g))
+            self.enc_bn1.append(self._new_group_norm(Cout))
+            self.enc_bn2.append(self._new_group_norm(Cout))
+        # Temporal encoders per level (fine..pre-token)
+        self.temporal_encoders = nn.ModuleList([
+            nn.TransformerEncoder(
+                nn.TransformerEncoderLayer(
+                    d_model=self.level_dims[i],
+                    nhead=self._auto_heads(self.level_dims[i]),
+                    dim_feedforward=2*self.level_dims[i],
+                    dropout=self.dropout,
+                    activation='gelu',
+                    batch_first=True,
+                    norm_first=True,
+                ),
+                num_layers=2,
+            )
+            for i in range(self.token_down)
+        ])
+        # Token-level Transformer
+        self.n_tokens = int(self.token_cell_ids.shape[0])
+        self.pos_token = nn.Parameter(torch.zeros(1, self.n_tokens, self.embed_dim))
+        nn.init.trunc_normal_(self.pos_token, std=0.02)
+        enc_layer = nn.TransformerEncoderLayer(
+            d_model=self.embed_dim,
+            nhead=self.num_heads_token,
+            dim_feedforward=int(self.embed_dim * self.mlp_ratio_token),
+            dropout=self.dropout,
+            activation='gelu',
+            batch_first=True,
+            norm_first=True,
+        )
+        self.encoder_token = nn.TransformerEncoder(enc_layer, num_layers=self.depth_token)
+        # Decoder fusion modules per level (cross-attention), stored coarse-to-fine.
+        self.dec_q = nn.ModuleList()
+        self.dec_k = nn.ModuleList()
+        self.dec_v = nn.ModuleList()
+        self.dec_attn = nn.ModuleList()
+        self.dec_mlp = nn.ModuleList()
+        self.level_pos = nn.ParameterList() if self.pos_embed_per_level else None
+        for i in range(self.token_down, 0, -1):
+            Cfine = self.level_dims[i-1]
+            d_fuse = Cfine
+            self.dec_q.append(nn.Linear(Cfine, d_fuse))
+            self.dec_k.append(nn.Linear(Cfine, d_fuse))
+            self.dec_v.append(nn.Linear(Cfine, d_fuse))
+            self.dec_attn.append(nn.MultiheadAttention(embed_dim=d_fuse, num_heads=self._auto_heads(d_fuse), batch_first=True))
+            self.dec_mlp.append(MLP(d_fuse, hidden_mult=4, drop=self.dropout))
+            if self.pos_embed_per_level:
+                n_tok_i = self.ntokens_levels[i-1]
+                p = nn.Parameter(torch.zeros(1, n_tok_i, d_fuse))
+                nn.init.trunc_normal_(p, std=0.02)
+                self.level_pos.append(p)
+        # Decoder refinement double convs, stored coarse-to-fine like the fusion modules.
+        self.dec_refine_w1 = nn.ParameterList()
+        self.dec_refine_w2 = nn.ParameterList()
+        self.dec_refine_bn1 = nn.ModuleList()
+        self.dec_refine_bn2 = nn.ModuleList()
+        for i in range(self.token_down, 0, -1):
+            Cfine = self.level_dims[i-1]
+            Cfine_g = Cfine // self.G
+            self.dec_refine_w1.append(self._new_kernel(Cfine, Cfine_g))
+            self.dec_refine_w2.append(self._new_kernel(Cfine, Cfine_g))
+            self.dec_refine_bn1.append(self._new_group_norm(Cfine))
+            self.dec_refine_bn2.append(self._new_group_norm(Cfine))
+        # Head
+        if self.task == "global":
+            self.global_head = nn.Linear(self.embed_dim, self.out_channels)
+        else:
+            if self.out_channels % self.G != 0:
+                raise ValueError(f"out_channels={self.out_channels} must be divisible by G={self.G}")
+            out_g = self.out_channels // self.G
+            self.head_w = self._new_kernel(self.C_fine, out_g)
+            self.head_bn = self._new_group_norm(self.out_channels) if self.task=="segmentation" else None
+        # Bring every floating-point parameter to the requested precision so that weights,
+        # stencils and inputs agree (no-op for the default float32).
+        super().to(self.torch_dtype)
+        pref = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+        self.runtime_device = self._probe_and_set_runtime_device(pref)
+    @staticmethod
+    def _largest_divisor_at_most(n: int, cap: int) -> int:
+        """Return the largest divisor of ``n`` that does not exceed ``cap`` (at least 1)."""
+        k = max(1, min(int(cap), int(n)))
+        while n % k != 0:
+            k -= 1
+        return k
+    def _auto_heads(self, d_model: int) -> int:
+        """Pick the head count for a width: about one head per 64 channels, at most 8.
+        The count is lowered until it divides ``d_model``, because PyTorch attention rejects
+        a head count that does not divide the embedding dimension.
+        """
+        return self._largest_divisor_at_most(d_model, min(8, d_model // 64))
+    def _new_group_norm(self, channels: int) -> nn.GroupNorm:
+        """Build a GroupNorm with at most 8 groups, lowered until it divides ``channels``."""
+        return nn.GroupNorm(num_groups=self._largest_divisor_at_most(channels, 8), num_channels=channels)
+    def _new_kernel(self, c_in: int, c_out_per_gauge: int) -> nn.Parameter:
+        """Create a Kaiming-uniform kernel of shape (c_in, c_out_per_gauge, KERNELSZ**2)."""
+        w = nn.Parameter(torch.empty(c_in, c_out_per_gauge, self.KERNELSZ*self.KERNELSZ))
+        # The view shares storage with ``w``, so the in-place init fills the parameter itself.
+        nn.init.kaiming_uniform_(w.view(c_in * c_out_per_gauge, -1), a=np.sqrt(5))
+        return w
+    def _move_hc(self, hc: ho.SphericalStencil, device: torch.device) -> None:
+        """Move every tensor attribute (or list/tuple of tensors) of ``hc`` to ``device``."""
+        for name, val in list(vars(hc).items()):
+            try:
+                if torch.is_tensor(val):
+                    setattr(hc, name, val.to(device))
+                elif isinstance(val, (list, tuple)) and val and torch.is_tensor(val[0]):
+                    setattr(hc, name, type(val)([v.to(device) for v in val]))
+            except Exception:
+                # Best effort: an attribute that cannot be moved is left where it is.
+                pass
+    @torch.no_grad()
+    def _probe_and_set_runtime_device(self, preferred: torch.device) -> torch.device:
+        """Try to run one convolution on ``preferred``; fall back to CPU if it fails.
+        Moves the module parameters and all stencils to the selected device, records it in
+        ``self._foscat_device`` and returns it.
+        """
+        if preferred.type == "cuda":
+            try:
+                super().to(preferred)
+                for hc in self.hconv_levels + [self.hconv_token, self.hconv_head]:
+                    self._move_hc(hc, preferred)
+                npix0 = int(self.cell_ids_fine.shape[0])
+                x_try = torch.zeros(1, self.n_chan_in, npix0, device=preferred, dtype=self.torch_dtype)
+                hc0 = self.hconv_levels[0] if len(self.hconv_levels)>0 else self.hconv_head
+                y_try = hc0.Convol_torch(x_try, self.pe_w1, cell_ids=self.cell_ids_fine)
+                # .item() forces the computation to complete so a failure surfaces here.
+                _ = (y_try if torch.is_tensor(y_try) else torch.as_tensor(y_try, device=preferred)).sum().item()
+                self._foscat_device = preferred
+                return preferred
+            except Exception:
+                # Any failure on the preferred device triggers the CPU fallback below.
+                pass
+        cpu = torch.device("cpu")
+        super().to(cpu)
+        for hc in self.hconv_levels + [self.hconv_token, self.hconv_head]:
+            self._move_hc(hc, cpu)
+        self._foscat_device = cpu
+        return cpu
+    def _as_tensor_batch(self, x):
+        """Unwrap a one-element list into a tensor (adding a batch axis to 2-D tensors).
+        Non-list inputs are returned unchanged; longer lists raise ``ValueError``.
+        """
+        if isinstance(x, list):
+            if len(x) == 1:
+                t = x[0]
+                return t.unsqueeze(0) if t.dim() == 2 else t
+            raise ValueError("Variable-length list not supported here; pass a tensor.")
+        return x
+    def _to_numpy_ids(self, ids):
+        """Return ``ids`` as a NumPy array, detaching and copying to CPU if it is a tensor."""
+        if torch.is_tensor(ids):
+            return ids.detach().cpu().numpy()
+        return np.asarray(ids)
+    def _patch_embed_fine(self, x_t: torch.Tensor) -> torch.Tensor:
+        """Embed one time step on the finest grid: two (conv -> GroupNorm -> GELU) stages."""
+        hc0 = self.hconv_levels[0] if len(self.hconv_levels)>0 else self.hconv_head
+        z = hc0.Convol_torch(x_t, self.pe_w1, cell_ids=self.cell_ids_fine)
+        z = self._as_tensor_batch(z if torch.is_tensor(z) else torch.as_tensor(z, device=self.runtime_device))
+        z = self.pe_bn1(z); z = F.gelu(z)
+        z = hc0.Convol_torch(z, self.pe_w2, cell_ids=self.cell_ids_fine)
+        z = self._as_tensor_batch(z if torch.is_tensor(z) else torch.as_tensor(z, device=self.runtime_device))
+        z = self.pe_bn2(z); z = F.gelu(z)
+        return z
+    def forward(self, x: torch.Tensor, runtime_ids: Optional[np.ndarray] = None) -> torch.Tensor:
+        """Run the network on a batch of time sequences.
+        Args:
+            x: input of shape (B, T_in, C_in, Npix) with ``C_in == n_chan_in``.
+            runtime_ids: optional finest-level cell ids used for the decoder and head;
+                defaults to the ids given at construction.
+        Returns:
+            For ``task="global"`` the output of the linear head applied to the token mean;
+            otherwise the head convolution output on the finest grid (presumably
+            (B, out_channels, Npix) - confirm against ``Convol_torch``), after sigmoid or
+            softmax for segmentation.
+        Raises:
+            ValueError: if ``x`` is not 4-D or its channel count differs from ``n_chan_in``.
+        """
+        if x.dim() != 4:
+            raise ValueError("Expected input shape (B, T_in, C_in, Npix)")
+        _, T_in, C_in, _ = x.shape
+        if C_in != self.n_chan_in:
+            raise ValueError(f"Expected n_chan_in={self.n_chan_in}, got {C_in}")
+        # Match both the device and the precision of the parameters.
+        x = x.to(device=self.runtime_device, dtype=self.torch_dtype)
+        fine_ids_runtime = self.cell_ids_fine if runtime_ids is None else self._to_numpy_ids(runtime_ids)
+        # Cell ids of every level for the decoder, obtained by pushing a dummy map through Down.
+        ids_chain = [np.asarray(fine_ids_runtime)]
+        nside_tmp = self.in_nside
+        _dummy = self.f.backend.bk_cast(np.zeros((1, 1, ids_chain[0].shape[0]), dtype=self.np_dtype))
+        for hc in self.hconv_levels:
+            _dummy, _next = hc.Down(_dummy, cell_ids=ids_chain[-1], nside=nside_tmp, max_poll=True)
+            ids_chain.append(self.f.backend.to_numpy(_next))
+            nside_tmp //= 2
+        # Encoder histories per level
+        l_hist: List[torch.Tensor] = []
+        l_ids:  List[np.ndarray] = []
+        feats_fine = []
+        for t in range(T_in):
+            zt = self._patch_embed_fine(x[:, t, :, :])
+            feats_fine.append(zt.unsqueeze(1))
+        feats_fine = torch.cat(feats_fine, dim=1)  # (B, T_in, C_fine, N_fine)
+        l_hist.append(feats_fine)
+        # NOTE(review): the encoder always uses the construction-time cell ids, while the
+        # decoder below uses ids derived from runtime_ids - confirm this is intended.
+        l_ids.append(self.cell_ids_fine)
+        current_nside = self.in_nside
+        l_data_hist = feats_fine
+        for i, hc in enumerate(self.hconv_levels):
+            w1, w2 = self.enc_w1[i], self.enc_w2[i]
+            feats_next = []
+            for t in range(T_in):
+                zt = l_data_hist[:, t, :, :]
+                zt = hc.Convol_torch(zt, w1, cell_ids=l_ids[-1])
+                zt = self._as_tensor_batch(zt if torch.is_tensor(zt) else torch.as_tensor(zt, device=self.runtime_device))
+                zt = self.enc_bn1[i](zt); zt = F.gelu(zt)
+                zt = hc.Convol_torch(zt, w2, cell_ids=l_ids[-1])
+                zt = self._as_tensor_batch(zt if torch.is_tensor(zt) else torch.as_tensor(zt, device=self.runtime_device))
+                zt = self.enc_bn2[i](zt); zt = F.gelu(zt)
+                feats_next.append(zt.unsqueeze(1))
+            feats_next = torch.cat(feats_next, dim=1)  # (B, T_in, Cout, N_i)
+            feats_down = []
+            next_ids_list = None
+            for t in range(T_in):
+                zt, next_ids = hc.Down(feats_next[:, t, :, :], cell_ids=l_ids[-1], nside=current_nside, max_poll=True)
+                zt = self._as_tensor_batch(zt)
+                feats_down.append(zt.unsqueeze(1))
+                # Only the ids returned for the last time step are kept.
+                next_ids_list = next_ids
+            feats_down = torch.cat(feats_down, dim=1)  # (B, T_in, Cout, N_{i+1})
+            l_hist.append(feats_down)
+            l_ids.append(self.f.backend.to_numpy(next_ids_list))
+            l_data_hist = feats_down
+            current_nside //= 2
+        # Temporal encoder on skips (levels 0..token_down-1): every pixel becomes a length-T
+        # sequence, which is encoded and then averaged over time.
+        skips: List[torch.Tensor] = []
+        for i in range(self.token_down):
+            Bx, Tx, Cx, Nx = l_hist[i].shape
+            z = l_hist[i].permute(0, 3, 1, 2).reshape(Bx*Nx, Tx, Cx)
+            z = self.temporal_encoders[i](z)
+            z = z.mean(dim=1)
+            H_i = z.view(Bx, Nx, Cx).permute(0, 2, 1).contiguous()
+            skips.append(H_i)
+        # Token-level transformer (spatial)
+        x_tok_hist = l_hist[-1]                       # (B, T_in, E, Ntok)
+        x_tok = x_tok_hist.mean(dim=1)                # (B, E, Ntok)  (could add temporal encoder here as well)
+        seq = x_tok.permute(0, 2, 1) + self.pos_token[:, :x_tok.shape[2], :]
+        seq = self.encoder_token(seq)
+        y = seq.permute(0, 2, 1)                      # (B, E, Ntok)
+        if self.task == "global":
+            g = seq.mean(dim=1)
+            return self.global_head(g)
+        # Decoder: Up + cross-attn fusion + double conv refinement
+        dec_idx = 0
+        for i in range(self.token_down, 0, -1):
+            coarse_ids = ids_chain[i]
+            fine_ids   = ids_chain[i-1]
+            source_ns  = self.in_nside // (2 ** i)
+            fine_ns    = self.in_nside // (2 ** (i-1))
+            op_fine = self.hconv_head if fine_ns == self.in_nside else self.hconv_levels[self.nsides_levels.index(fine_ns)]
+            y_up = op_fine.Up(y, cell_ids=coarse_ids, o_cell_ids=fine_ids, nside=source_ns)
+            y_up = self._as_tensor_batch(y_up if torch.is_tensor(y_up) else torch.as_tensor(y_up, device=self.runtime_device))  # (B, Cfine, N)
+            skip_i = skips[i-1]  # (B, Cfine, N)
+            # Queries come from the upsampled decoder state, keys and values from the skip.
+            q = self.dec_q[dec_idx](y_up.permute(0,2,1))
+            k = self.dec_k[dec_idx](skip_i.permute(0,2,1))
+            v = self.dec_v[dec_idx](skip_i.permute(0,2,1))
+            if self.pos_embed_per_level:
+                pos = self.level_pos[dec_idx][:, :q.shape[1], :]
+                q = q + pos; k = k + pos
+            z, _ = self.dec_attn[dec_idx](q, k, v)
+            z = self.dec_mlp[dec_idx](z)
+            z = z.permute(0,2,1).contiguous()  # (B, Cfine, N)
+            z = op_fine.Convol_torch(z, self.dec_refine_w1[dec_idx], cell_ids=fine_ids)
+            z = self._as_tensor_batch(z if torch.is_tensor(z) else torch.as_tensor(z, device=self.runtime_device))
+            z = self.dec_refine_bn1[dec_idx](z); z = F.gelu(z)
+            z = op_fine.Convol_torch(z, self.dec_refine_w2[dec_idx], cell_ids=fine_ids)
+            z = self._as_tensor_batch(z if torch.is_tensor(z) else torch.as_tensor(z, device=self.runtime_device))
+            z = self.dec_refine_bn2[dec_idx](z); z = F.gelu(z)
+            y = z
+            dec_idx += 1
+        y = self.hconv_head.Convol_torch(y, self.head_w, cell_ids=fine_ids_runtime)
+        y = self._as_tensor_batch(y if torch.is_tensor(y) else torch.as_tensor(y, device=self.runtime_device))
+        if self.task == "segmentation" and self.head_bn is not None:
+            y = self.head_bn(y)
+        if self.final_activation == "sigmoid":
+            y = torch.sigmoid(y)
+        elif self.final_activation == "softmax":
+            y = torch.softmax(y, dim=1)
+        return y
+if __name__ == "__main__":
+    # Smoke test: build a small model over all pixels of an nside=4 grid, run one forward
+    # pass in eval mode and print the output shape.
+    nside0 = 4
+    n_pix = 12 * nside0 ** 2
+    all_cells = np.arange(n_pix, dtype=np.int64)
+    batch, n_steps, n_chan = 2, 3, 4
+    # The random input is drawn before the model is built, as in the original script.
+    sample = torch.randn(batch, n_steps, n_chan, n_pix)
+    net = HealpixViTSkip(
+        in_nside=nside0,
+        n_chan_in=n_chan,
+        level_dims=[64, 96, 128],
+        depth_token=2,
+        num_heads_token=4,
+        cell_ids=all_cells,
+        task="regression",
+        out_channels=1,
+        KERNELSZ=3,
+        G=1,
+        dropout=0.1,
+    )
+    net = net.eval()
+    with torch.no_grad():
+        result = net(sample)
+    print("Output:", tuple(result.shape))

foscat 2025.9.4__py3-none-any.whl → 2025.10.2__py3-none-any.whl

foscat 2025.9.4__py3-none-any.whl → 2025.10.2__py3-none-any.whl