iris-image-gen / iris /train.py
asdf98's picture
Upload iris/train.py
fcd6bec verified
raw
history blame
2.11 kB
"""IRIS Training utilities: synthetic dataset and scheduler."""
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.utils.data import Dataset, DataLoader
import math
import time
import os
from .model import IRIS
from .flow_matching import flow_matching_loss, euler_sample, DCAE_F32C32_SCALE
class SyntheticLatentDataset(Dataset):
"""Generates synthetic latent/text pairs for testing training stability."""
def __init__(self, num_samples=10000, latent_channels=32, latent_size=16, text_dim=512, text_length=32, seed=42):
self.num_samples = num_samples
gen = torch.Generator().manual_seed(seed)
self.latents = torch.randn(num_samples, latent_channels, latent_size, latent_size, generator=gen) * 2.5
self.text_embeds = torch.randn(num_samples, text_length, text_dim, generator=gen)
self.text_embeds = F.normalize(self.text_embeds, dim=-1) * math.sqrt(text_dim)
def __len__(self):
return self.num_samples
def __getitem__(self, idx):
return {"latent": self.latents[idx], "text_embed": self.text_embeds[idx]}
class CosineWarmupScheduler:
"""Cosine decay with linear warmup."""
def __init__(self, optimizer, warmup_steps, total_steps, min_lr_ratio=0.1):
self.optimizer = optimizer
self.warmup_steps = warmup_steps
self.total_steps = total_steps
self.min_lr_ratio = min_lr_ratio
self.base_lrs = [pg["lr"] for pg in optimizer.param_groups]
self.step_count = 0
def step(self):
self.step_count += 1
if self.step_count <= self.warmup_steps:
scale = self.step_count / max(1, self.warmup_steps)
else:
progress = (self.step_count - self.warmup_steps) / max(1, self.total_steps - self.warmup_steps)
scale = self.min_lr_ratio + (1 - self.min_lr_ratio) * 0.5 * (1 + math.cos(math.pi * progress))
for pg, base_lr in zip(self.optimizer.param_groups, self.base_lrs):
pg["lr"] = base_lr * scale
def get_lr(self):
return [pg["lr"] for pg in self.optimizer.param_groups]