Spaces:

PhurinutR
/

ecg_reconstruction

Running

File size: 8,987 Bytes

"""Spatio-Temporal Dual Masking (STDM) from CoRe-ECG — reconstruction branch only."""

from __future__ import annotations

import torch


def sample_stdm_masks(
    batch_size: int,
    num_leads: int,
    num_patches: int,
    *,
    p_time: float,
    p_lead: float,
    k_visible: int,
    device: torch.device,
    generator: torch.Generator | None = None,
) -> tuple[torch.Tensor, torch.Tensor, torch.Tensor]:
    """
    Sample visible (V), reconstruction-target (M), and dropped (D) masks.

    Each mask is ``(B, C, N)`` bool with ``V | M | D`` partitioning the grid (exclusive).

    Parameters
    ----------
    k_visible : number of leads kept visible in partial (non–full-temporal-mask) mode.
    p_time : Bernoulli prob for full temporal mask at a patch index.
    p_lead : Bernoulli prob for *dropping* a lead from supervision among hidden leads.
    """
    if not 0 <= p_time <= 1 or not 0 <= p_lead <= 1:
        raise ValueError("p_time and p_lead must be in [0, 1]")
    if k_visible < 1 or k_visible > num_leads:
        raise ValueError("k_visible must be in [1, num_leads]")

    C, N = num_leads, num_patches
    V = torch.zeros(batch_size, C, N, dtype=torch.bool, device=device)
    M = torch.zeros_like(V)
    D = torch.zeros_like(V)

    # Per (b, n): full temporal mask vs partial
    u_time = torch.rand(batch_size, N, device=device, generator=generator)
    full_time = u_time < p_time

    for b in range(batch_size):
        for n in range(N):
            if full_time[b, n]:
                M[b, :, n] = True
                continue
            # Partial: choose k_visible leads uniformly
            perm = torch.randperm(C, device=device, generator=generator)
            vis = perm[:k_visible]
            hid = perm[k_visible:]
            V[b, vis, n] = True
            if hid.numel() == 0:
                continue
            u = torch.rand(hid.numel(), device=device, generator=generator)
            dropped = hid[u < p_lead]
            masked = hid[u >= p_lead]
            D[b, dropped, n] = True
            M[b, masked, n] = True

    return V, M, D


def _sample_non_overlapping_band_starts(
    num_patches: int,
    band_width: int,
    num_bands: int,
    device: torch.device,
    generator: torch.Generator | None,
) -> list[int]:
    """Sample ``num_bands`` start indices in ``[0, num_patches - band_width]`` with disjoint intervals."""
    max_start = num_patches - band_width
    if max_start < 0:
        raise ValueError(
            f"band_width={band_width} exceeds num_patches={num_patches}; cannot place temporal bands."
        )
    for _ in range(128):
        starts = [
            int(torch.randint(0, max_start + 1, (1,), device=device, generator=generator).item())
            for _ in range(num_bands)
        ]
        ok = True
        for i in range(num_bands):
            for j in range(i + 1, num_bands):
                a0, a1 = starts[i], starts[i] + band_width
                b0, b1 = starts[j], starts[j] + band_width
                if not (a1 <= b0 or b1 <= a0):
                    ok = False
                    break
            if not ok:
                break
        if ok:
            return starts
    # Deterministic fallback: pack bands from the left with a gap if needed.
    gap = max(1, (max_start + 1 - num_bands * band_width) // max(1, num_bands - 1)) if num_bands > 1 else 0
    starts = [min(i * (band_width + gap), max_start) for i in range(num_bands)]
    return starts


def _simple_horizontal_masks(
    batch_size: int,
    num_leads: int,
    num_patches: int,
    num_masked_leads: int,
    device: torch.device,
    generator: torch.Generator | None,
) -> tuple[torch.Tensor, torch.Tensor, torch.Tensor]:
    """Mask ``num_masked_leads`` random leads at every time patch (horizontal stripes)."""
    C, N = num_leads, num_patches
    perm = torch.rand(batch_size, C, device=device, generator=generator).argsort(dim=1)
    rank_cols = torch.arange(num_masked_leads, device=device).view(1, -1).expand(batch_size, -1)
    masked_lead = torch.gather(perm, 1, rank_cols)
    is_masked_lead = torch.zeros(batch_size, C, dtype=torch.bool, device=device)
    is_masked_lead.scatter_(1, masked_lead, True)

    M = is_masked_lead.unsqueeze(-1).expand(-1, -1, N)
    V = ~M
    D = torch.zeros(batch_size, C, N, dtype=torch.bool, device=device)
    return V, M, D


def _simple_vertical_masks(
    batch_size: int,
    num_leads: int,
    num_patches: int,
    *,
    band_width: int,
    num_bands: int,
    device: torch.device,
    generator: torch.Generator | None,
) -> tuple[torch.Tensor, torch.Tensor, torch.Tensor]:
    """Mask ``num_bands`` disjoint time bands (all leads), each of width ``band_width`` patches."""
    C, N = num_leads, num_patches
    M = torch.zeros(batch_size, C, N, dtype=torch.bool, device=device)
    for b in range(batch_size):
        starts = _sample_non_overlapping_band_starts(N, band_width, num_bands, device, generator)
        for s in starts:
            M[b, :, s : s + band_width] = True
    V = ~M
    D = torch.zeros_like(M)
    return V, M, D


def _no_mask_autoencoder(
    batch_size: int,
    num_leads: int,
    num_patches: int,
    device: torch.device,
) -> tuple[torch.Tensor, torch.Tensor, torch.Tensor]:
    """
    Autoencoder-style branch: all tokens visible and all tokens supervised.

    ``V`` and ``M`` are all-True, ``D`` is all-False.
    """
    V = torch.ones(batch_size, num_leads, num_patches, dtype=torch.bool, device=device)
    M = torch.ones_like(V)
    D = torch.zeros_like(V)
    return V, M, D


def get_mask(
    batch_size: int,
    num_leads: int,
    num_patches: int,
    *,
    p_time: float,
    p_lead: float,
    k_visible: int,
    device: torch.device,
    generator: torch.Generator | None = None,
    p_stdm: float = 0.25,
    p_no_mask_autoencoder: float = 0.25,
    p_simple_horizontal: float = 0.25,
    p_simple_vertical: float = 0.25,
    num_masked_leads: int = 2,
    vertical_band_width: int = 11,
    num_vertical_bands: int = 2,
) -> tuple[torch.Tensor, torch.Tensor, torch.Tensor]:
    """
    Per batch item, choose one of four mask types (probabilities sum to 1 by default):

    - ``p_stdm`` (0.25): ``sample_stdm_masks`` (full STDM).
    - ``p_no_mask_autoencoder`` (0.25): all patches visible and supervised (AE-style).
    - ``p_simple_horizontal`` (0.25): mask ``num_masked_leads`` random leads at all time patches.
    - ``p_simple_vertical`` (0.25): mask ``num_vertical_bands`` disjoint time bands of width
      ``vertical_band_width`` patches; all leads are **M** inside each band.

    Returns ``(V, M, D)`` each ``(B, C, N)`` bool.
    For STDM/horizontal/vertical branches, ``V | M | D`` partitions the grid.
    For AE-style branch, ``V`` and ``M`` intentionally overlap (both all-True), ``D`` is all-False.
    """
    probs = (p_stdm, p_no_mask_autoencoder, p_simple_horizontal, p_simple_vertical)
    if any(p < 0 or p > 1 for p in probs):
        raise ValueError("mask probabilities must be in [0, 1]")
    if abs(sum(probs) - 1.0) > 1e-6:
        raise ValueError(
            "p_stdm + p_no_mask_autoencoder + p_simple_horizontal + p_simple_vertical "
            f"must equal 1, got {sum(probs)}"
        )
    if num_masked_leads < 1 or num_masked_leads > num_leads:
        raise ValueError("num_masked_leads must be in [1, num_leads]")
    if num_vertical_bands < 1:
        raise ValueError("num_vertical_bands must be >= 1")
    if vertical_band_width < 1:
        raise ValueError("vertical_band_width must be >= 1")

    C, N = num_leads, num_patches
    V_stdm, M_stdm, D_stdm = sample_stdm_masks(
        batch_size,
        num_leads,
        num_patches,
        p_time=p_time,
        p_lead=p_lead,
        k_visible=k_visible,
        device=device,
        generator=generator,
    )

    V_h, M_h, D_h = _simple_horizontal_masks(
        batch_size, num_leads, num_patches, num_masked_leads, device, generator
    )
    V_v, M_v, D_v = _simple_vertical_masks(
        batch_size,
        num_leads,
        num_patches,
        band_width=vertical_band_width,
        num_bands=num_vertical_bands,
        device=device,
        generator=generator,
    )
    V_ae, M_ae, D_ae = _no_mask_autoencoder(batch_size, num_leads, num_patches, device)

    u = torch.rand(batch_size, device=device, generator=generator)
    t0 = p_stdm
    t1 = t0 + p_no_mask_autoencoder
    t2 = t1 + p_simple_horizontal
    use_stdm = u < t0
    use_ae = (u >= t0) & (u < t1)
    use_h = (u >= t1) & (u < t2)
    use_v = u >= t2

    sel_stdm = use_stdm.view(batch_size, 1, 1)
    sel_ae = use_ae.view(batch_size, 1, 1)
    sel_h = use_h.view(batch_size, 1, 1)

    V = torch.where(sel_stdm, V_stdm, torch.where(sel_ae, V_ae, torch.where(sel_h, V_h, V_v)))
    M = torch.where(sel_stdm, M_stdm, torch.where(sel_ae, M_ae, torch.where(sel_h, M_h, M_v)))
    D = torch.where(sel_stdm, D_stdm, torch.where(sel_ae, D_ae, torch.where(sel_h, D_h, D_v)))
    return V, M, D