{ "cache_dir": "hf://usm3d/s23dr-2026-sampled_2048_v2:train", "val_cache_dir": "", "arch": "perceiver", "segments": 64, "hidden": 256, "ff": 1024, "latent_tokens": 256, "latent_layers": 7, "encoder_layers": 4, "pre_encoder_layers": 0, "decoder_layers": 3, "decoder_input_xattn": false, "qk_norm": true, "qk_norm_type": "l2", "learnable_fourier": false, "num_heads": 4, "kv_heads_cross": 2, "kv_heads_self": 2, "cross_attn_interval": 4, "dropout": 0.1, "steps": 160000, "batch_size": 32, "lr": 3e-05, "muon_lr": null, "adam_betas": "0.9,0.95", "warmup": 10000, "cosine_decay": false, "cooldown_start": 140000, "cooldown_steps": 20000, "mup": false, "mup_base_width": 128, "seed": 353, "varifold_weight": 0.0, "varifold_cross_only": false, "sinkhorn_weight": 1.0, "sinkhorn_eps": 0.1, "sinkhorn_eps_start": null, "sinkhorn_iters": 20, "sinkhorn_dustbin": 0.3, "vertex_f1_weight": 0.0, "soft_hss_weight": 0.0, "endpoint_weight": 0.1, "endpoint_warmup": 0, "aug_rotate": true, "aug_jitter": 0.0, "aug_drop": 0.0, "aug_flip": true, "gpu_dataset": false, "stored_seq_len": 8192, "rms_norm": true, "activation": "gelu", "behind_emb_dim": 8, "vote_features": true, "segment_param": "midpoint_dir_len", "length_floor": 0.0, "segment_conf": true, "conf_weight": 0.1, "conf_mode": "sinkhorn", "conf_clamp_min": null, "conf_head_wd": 0.1, "optimizer": "adamw", "out_dir": "/workspace/s23dr_2026_example/runs", "resume": "runs/20260322_085443/checkpoints/step125000.pt", "cpu": false, "args_from": "runs/20260322_085443/args.json" }