connaaa's picture
Phase 5 release: 7 TopK SAEs + specificity / null-steering JSON artifacts
5f2451e verified
[
{
"step": 200,
"loss": 29.05353546142578,
"l0": 40.0,
"fve": 0.7888412205173247,
"n_dead": 0,
"mse": 0.05674518644809723
},
{
"step": 400,
"loss": 44.51063537597656,
"l0": 40.0,
"fve": 0.828121429866145,
"n_dead": 769,
"mse": 0.04685475304722786
},
{
"step": 600,
"loss": 40.60480880737305,
"l0": 40.0,
"fve": 0.8353118397308505,
"n_dead": 239,
"mse": 0.04323723167181015
},
{
"step": 800,
"loss": 22.681713104248047,
"l0": 40.0,
"fve": 0.8478801929634973,
"n_dead": 29,
"mse": 0.03988751769065857
},
{
"step": 1000,
"loss": 19.90431785583496,
"l0": 40.0,
"fve": 0.8681096795485392,
"n_dead": 4,
"mse": 0.03827929496765137
},
{
"step": 1200,
"loss": 19.122100830078125,
"l0": 40.0,
"fve": 0.8613335049168376,
"n_dead": 2,
"mse": 0.037058740854263306
},
{
"step": 1400,
"loss": 18.61587142944336,
"l0": 40.0,
"fve": 0.854929133645014,
"n_dead": 2,
"mse": 0.03607767075300217
},
{
"step": 1600,
"loss": 17.96778106689453,
"l0": 40.0,
"fve": 0.8535506236950299,
"n_dead": 1,
"mse": 0.03495676815509796
},
{
"step": 1800,
"loss": 17.5817928314209,
"l0": 40.0,
"fve": 0.8671142899286272,
"n_dead": 1,
"mse": 0.03420582413673401
},
{
"step": 2000,
"loss": 17.37525749206543,
"l0": 40.0,
"fve": 0.8686602042934782,
"n_dead": 2,
"mse": 0.03367304056882858
},
{
"step": 2200,
"loss": 16.68439483642578,
"l0": 40.0,
"fve": 0.877142112507239,
"n_dead": 1,
"mse": 0.03245990723371506
},
{
"step": 2400,
"loss": 16.43060874938965,
"l0": 40.0,
"fve": 0.8754777867952352,
"n_dead": 0,
"mse": 0.03209103271365166
},
{
"step": 2441,
"loss": 16.80815315246582,
"l0": 40.0,
"fve": 0.8691270860953982,
"n_dead": 0,
"mse": 0.032828424125909805
}
]