Jonttup
/

palette-edit-classifier

Model card Files Files and versions

xet

Community

Jonttup committed 22 days ago

Commit

27fdf85

verified ·

1 Parent(s): e27c6bd

Upload models/oklab_utils.py with huggingface_hub

Browse files

Files changed (1) hide show

models/oklab_utils.py +263 -0

models/oklab_utils.py ADDED Viewed

	@@ -0,0 +1,263 @@

+"""
+OKLab Color Space Utilities
+Perceptually uniform color space for semantic loss computation.
+OKLab ensures that equal distances in the color space correspond to
+equal perceived differences — critical for meaningful color-based encoding.
+Key functions:
+- srgb_to_oklab / oklab_to_srgb: Color space conversions
+- rotate_ab: Rotate hue in a-b plane (for domain/idiom shifts)
+- set_chroma: Set chroma magnitude (for purity encoding)
+- OKLabMSELoss: Perceptually uniform loss function
+- hsl_to_oklab_batch: Batch conversion for training
+"""
+import torch
+import torch.nn as nn
+import math
+from typing import Tuple
def clamp(x: float, lo: float, hi: float) -> float:
    """Restrict ``x`` to the closed interval [lo, hi].

    Values below ``lo`` come back as ``lo`` and values above ``hi`` come
    back as ``hi``; anything in between is returned unchanged.
    """
    capped_above = min(hi, x)
    return max(lo, capped_above)
+# ── sRGB ↔ Linear RGB ──
def srgb_to_linear(c: float) -> float:
    """Decode one gamma-encoded sRGB channel value to linear light.

    Inputs at or below 0.04045 use the linear segment (division by 12.92);
    larger inputs use the 2.4 power segment.
    """
    on_linear_segment = c <= 0.04045
    if not on_linear_segment:
        return ((c + 0.055) / 1.055) ** 2.4
    return c / 12.92
def linear_to_srgb(c: float) -> float:
    """Encode one linear-light channel value with the sRGB gamma curve.

    Inputs at or below 0.0031308 use the linear segment (multiplication by
    12.92); larger inputs use the 1/2.4 power segment.
    """
    on_linear_segment = c <= 0.0031308
    if not on_linear_segment:
        return 1.055 * (c ** (1.0 / 2.4)) - 0.055
    return c * 12.92
+# ── sRGB ↔ OKLab ──
def srgb_to_oklab(r: float, g: float, b: float) -> Tuple[float, float, float]:
    """Convert a gamma-encoded sRGB color (channels in [0,1]) to OKLab.

    Each channel is linearized with ``srgb_to_linear``, mixed into three
    intermediate l/m/s values, passed through a sign-preserving cube root,
    and mixed again into the returned ``(L, a, b)`` tuple.
    """

    def signed_cube_root(value: float) -> float:
        # Take the root of the magnitude and restore the sign, so a negative
        # input never goes through a fractional power directly.
        if value >= 0:
            return value ** (1.0 / 3.0)
        return -((-value) ** (1.0 / 3.0))

    lin_r, lin_g, lin_b = (srgb_to_linear(channel) for channel in (r, g, b))

    # Linear RGB -> intermediate l/m/s mix.
    mix_l = 0.4122214708 * lin_r + 0.5363325363 * lin_g + 0.0514459929 * lin_b
    mix_m = 0.2119034982 * lin_r + 0.6806995451 * lin_g + 0.1073969566 * lin_b
    mix_s = 0.0883024619 * lin_r + 0.2817188376 * lin_g + 0.6299787005 * lin_b

    root_l = signed_cube_root(mix_l)
    root_m = signed_cube_root(mix_m)
    root_s = signed_cube_root(mix_s)

    # Cube-rooted l/m/s -> OKLab coordinates.
    lightness = 0.2104542553 * root_l + 0.7936177850 * root_m - 0.0040720468 * root_s
    axis_a = 1.9779984951 * root_l - 2.4285922050 * root_m + 0.4505937099 * root_s
    axis_b = 0.0259040371 * root_l + 0.7827717662 * root_m - 0.8086757660 * root_s
    return (lightness, axis_a, axis_b)
def oklab_to_srgb(L: float, a: float, b_ok: float) -> Tuple[float, float, float]:
    """Convert an OKLab color to gamma-encoded sRGB with channels in [0,1].

    The OKLab coordinates are mixed into three root-domain values, cubed,
    and mixed into linear RGB. Each linear channel is clamped to [0,1],
    gamma-encoded with ``linear_to_srgb`` and clamped to [0,1] once more.
    """
    # OKLab -> cube-root domain l/m/s.
    root_l = L + 0.3963377774 * a + 0.2158037573 * b_ok
    root_m = L - 0.1055613458 * a - 0.0638541728 * b_ok
    root_s = L - 0.0894841775 * a - 1.2914855480 * b_ok

    # Undo the cube root.
    cube_l = root_l * root_l * root_l
    cube_m = root_m * root_m * root_m
    cube_s = root_s * root_s * root_s

    linear_channels = (
        +4.0767416621 * cube_l - 3.3077115913 * cube_m + 0.2309699292 * cube_s,
        -1.2684380046 * cube_l + 2.6097574011 * cube_m - 0.3413193965 * cube_s,
        -0.0041960863 * cube_l - 0.7034186147 * cube_m + 1.7076147010 * cube_s,
    )

    # Clamp before and after gamma encoding so the result stays in [0,1].
    r, g, b = (
        clamp(linear_to_srgb(clamp(value, 0, 1)), 0, 1)
        for value in linear_channels
    )
    return (r, g, b)
+# ── HSL ↔ RGB ──
def hsl_to_rgb(h_deg: float, s_pct: float, l_pct: float) -> Tuple[float, float, float]:
    """Convert HSL (degrees, percent, percent) to RGB [0,1].

    The hue is treated as an angle and wrapped onto a single turn, so any
    real value is accepted (720 and -360 both mean the same hue as 0).

    Args:
        h_deg: Hue in degrees; values outside [0, 360) wrap around.
        s_pct: Saturation in percent (0-100).
        l_pct: Lightness in percent (0-100).

    Returns:
        ``(r, g, b)`` with each channel in [0,1] for in-range inputs.
    """
    hue = h_deg / 360.0
    sat = s_pct / 100.0
    light = l_pct / 100.0

    # Zero saturation is a pure gray: every channel equals the lightness.
    if sat == 0:
        return (light, light, light)

    def hue_to_rgb(p, q, t):
        # Wrap with modulo rather than a single +/-1 correction, so hues
        # that are several turns out of range still land in [0, 1).
        t %= 1.0
        if t < 1/6:
            return p + (q - p) * 6 * t
        if t < 1/2:
            return q
        if t < 2/3:
            return p + (q - p) * (2/3 - t) * 6
        return p

    q = light * (1 + sat) if light < 0.5 else light + sat - light * sat
    p = 2 * light - q

    # Red, green and blue sample the same curve a third of a turn apart.
    r = hue_to_rgb(p, q, hue + 1/3)
    g = hue_to_rgb(p, q, hue)
    b = hue_to_rgb(p, q, hue - 1/3)
    return (r, g, b)
def rgb_to_hsl(r: float, g: float, b: float) -> Tuple[float, float, float]:
    """Convert RGB channels in [0,1] to HSL as (degrees, percent, percent).

    When all three channels are equal the color is gray, and both hue and
    saturation are reported as 0.
    """
    brightest = max(r, g, b)
    darkest = min(r, g, b)
    lightness = (brightest + darkest) / 2.0

    # Gray: no hue or saturation to compute.
    if brightest == darkest:
        return (0.0, 0.0, lightness * 100.0)

    spread = brightest - darkest
    if lightness > 0.5:
        saturation = spread / (2.0 - brightest - darkest)
    else:
        saturation = spread / (brightest + darkest)

    # The dominant channel selects which sixth-of-a-turn pair the hue is in.
    if brightest == r:
        sector = (g - b) / spread + (6 if g < b else 0)
    elif brightest == g:
        sector = (b - r) / spread + 2
    else:
        sector = (r - g) / spread + 4
    hue = sector / 6.0

    return (hue * 360.0, saturation * 100.0, lightness * 100.0)
+# ── OKLab Operations ──
def rotate_ab(a: float, b: float, degrees: float) -> Tuple[float, float]:
    """Rotate the point (a, b) about the origin of the a-b plane.

    ``degrees`` is converted to radians and applied as a standard 2-D
    rotation; the rotated ``(a, b)`` pair is returned.
    """
    theta = math.radians(degrees)
    cosine, sine = math.cos(theta), math.sin(theta)
    rotated_a = a * cosine - b * sine
    rotated_b = a * sine + b * cosine
    return (rotated_a, rotated_b)
def set_chroma(a: float, b: float, target_c: float) -> Tuple[float, float]:
    """Rescale (a, b) so its magnitude in the a-b plane equals ``target_c``.

    The direction of (a, b) is kept. When the current magnitude is below
    1e-10 there is no usable direction, so the result points along the
    positive a axis: ``(target_c, 0.0)``.
    """
    magnitude = math.sqrt(a * a + b * b)
    has_no_direction = magnitude < 1e-10
    if not has_no_direction:
        factor = target_c / magnitude
        return (a * factor, b * factor)
    return (target_c, 0.0)  # Default direction
def get_chroma(a: float, b: float) -> float:
    """Return the magnitude of the (a, b) vector, i.e. its chroma."""
    squared_length = a * a + b * b
    return math.sqrt(squared_length)
def compute_delta_e_oklab(
    L1: float, a1: float, b1: float,
    L2: float, a2: float, b2: float,
) -> float:
    """Return the Euclidean distance between two OKLab colors.

    The first color is ``(L1, a1, b1)`` and the second ``(L2, a2, b2)``.
    """
    diff_lightness = L1 - L2
    diff_a = a1 - a2
    diff_b = b1 - b2
    return math.sqrt(diff_lightness ** 2 + diff_a ** 2 + diff_b ** 2)
+# ── Batch Operations (PyTorch) ──
def hsl_to_oklab_batch(hsl: torch.Tensor) -> torch.Tensor:
    """
    Batch convert HSL [0,1] normalized to OKLab.

    The conversion is HSL -> sRGB -> linear RGB -> OKLab, done with tensor
    operations only so it can be used inside a differentiable loss. The
    fractional powers are guarded so the backward pass stays finite even
    when a channel is exactly zero (for example pure black).

    Args:
        hsl: (..., 3) tensor with H,S,L in [0,1]
    Returns:
        (..., 3) tensor with L,a,b in OKLab
    """
    hue = hsl[..., 0]
    sat = hsl[..., 1]
    light = hsl[..., 2]

    # HSL to RGB (vectorized)
    q = torch.where(light < 0.5,
                    light * (1 + sat),
                    light + sat - light * sat)
    p = 2 * light - q

    def hue2rgb(t):
        # Wrap the shifted hue back onto [0, 1) before picking a segment.
        t = t % 1.0
        return torch.where(t < 1/6, p + (q - p) * 6 * t,
               torch.where(t < 1/2, q,
               torch.where(t < 2/3, p + (q - p) * (2/3 - t) * 6, p)))

    r = hue2rgb(hue + 1/3)
    g = hue2rgb(hue)
    b = hue2rgb(hue - 1/3)

    # Handle achromatic (saturation below 0.001 percent): gray = lightness
    achromatic = sat < 1e-5
    r = torch.where(achromatic, light, r)
    g = torch.where(achromatic, light, g)
    b = torch.where(achromatic, light, b)

    def to_linear(c):
        # torch.where evaluates both branches, and a NaN in the branch that
        # is NOT selected still poisons the gradient. Clamping the base of
        # the power keeps that branch finite without changing any value
        # that is actually selected (those are all above 0.04045).
        power_base = (torch.clamp(c, min=0.04045) + 0.055) / 1.055
        return torch.where(c <= 0.04045, c / 12.92, power_base ** 2.4)

    def signed_cbrt(x):
        # d/dx |x|^(1/3) is infinite at 0, and autograd turns the resulting
        # 0 * inf into NaN. Swap zeros for a harmless 1 inside the power and
        # mask the result back to 0, so the forward value is unchanged and
        # the gradient at exactly 0 is 0 instead of NaN.
        magnitude = torch.abs(x)
        nonzero = magnitude != 0
        safe = torch.where(nonzero, magnitude, torch.ones_like(magnitude))
        root = torch.where(nonzero, safe.pow(1/3), torch.zeros_like(magnitude))
        return torch.sign(x) * root

    # sRGB to linear
    r_lin = to_linear(r)
    g_lin = to_linear(g)
    b_lin = to_linear(b)

    # Linear RGB to OKLab
    l_ = 0.4122214708 * r_lin + 0.5363325363 * g_lin + 0.0514459929 * b_lin
    m_ = 0.2119034982 * r_lin + 0.6806995451 * g_lin + 0.1073969566 * b_lin
    s_ = 0.0883024619 * r_lin + 0.2817188376 * g_lin + 0.6299787005 * b_lin

    l_c = signed_cbrt(l_)
    m_c = signed_cbrt(m_)
    s_c = signed_cbrt(s_)

    L_ok = 0.2104542553 * l_c + 0.7936177850 * m_c - 0.0040720468 * s_c
    a_ok = 1.9779984951 * l_c - 2.4285922050 * m_c + 0.4505937099 * s_c
    b_ok = 0.0259040371 * l_c + 0.7827717662 * m_c - 0.8086757660 * s_c
    return torch.stack([L_ok, a_ok, b_ok], dim=-1)
def denormalize_hsl(hsl_norm: torch.Tensor) -> torch.Tensor:
    """Scale normalized HSL [0,1] to degrees/percent format.

    Works on a copy, so ``hsl_norm`` itself is left untouched. Along the
    last dimension, index 0 (H) is multiplied by 360 and indices 1 and 2
    (S, L) by 100.
    """
    scaled = hsl_norm.clone()
    # (H, S, L) -> ([0,360], [0,100], [0,100])
    for channel, factor in enumerate((360.0, 100.0, 100.0)):
        scaled[..., channel] *= factor
    return scaled
class OKLabMSELoss(nn.Module):
    """
    Mean-squared-error loss measured in OKLab space.

    Both the prediction and the target arrive as normalized HSL, are
    converted to OKLab with ``hsl_to_oklab_batch``, and are then compared
    with MSE. Because OKLab expresses hue through its a and b coordinates
    rather than an angle, hues on either side of the wrap-around point
    (359° vs 1°) end up close together instead of far apart.
    """

    def forward(
        self,
        pred_hsl: torch.Tensor,    # (B, 3) predicted HSL in [0,1]
        target_hsl: torch.Tensor,  # (B, 3) target HSL in [0,1]
    ) -> torch.Tensor:
        """Return the MSE between the OKLab forms of prediction and target."""
        converted_pred, converted_target = (
            hsl_to_oklab_batch(batch) for batch in (pred_hsl, target_hsl)
        )
        return torch.nn.functional.mse_loss(converted_pred, converted_target)