connaaa's picture
Phase 5 release: 7 TopK SAEs + specificity / null-steering JSON artifacts
5f2451e verified
[
{
"step": 200,
"loss": 14.795553207397461,
"l0": 40.0,
"fve": 0.8293616575146343,
"n_dead": 0,
"mse": 0.028897564858198166
},
{
"step": 400,
"loss": 22.638526916503906,
"l0": 40.0,
"fve": 0.8359017185027313,
"n_dead": 663,
"mse": 0.023937705904245377
},
{
"step": 600,
"loss": 19.389955520629883,
"l0": 40.0,
"fve": 0.8645987532704418,
"n_dead": 222,
"mse": 0.021326521411538124
},
{
"step": 800,
"loss": 11.63227653503418,
"l0": 40.0,
"fve": 0.8760963178028377,
"n_dead": 35,
"mse": 0.02005489356815815
},
{
"step": 1000,
"loss": 9.950961112976074,
"l0": 40.0,
"fve": 0.8784041379676274,
"n_dead": 8,
"mse": 0.018850065767765045
},
{
"step": 1200,
"loss": 9.30925178527832,
"l0": 40.0,
"fve": 0.8774098117815495,
"n_dead": 2,
"mse": 0.018041376024484634
},
{
"step": 1400,
"loss": 8.932659149169922,
"l0": 40.0,
"fve": 0.8964732688104713,
"n_dead": 1,
"mse": 0.01737871766090393
},
{
"step": 1600,
"loss": 8.559926986694336,
"l0": 40.0,
"fve": 0.8907664732630304,
"n_dead": 0,
"mse": 0.016718603670597076
},
{
"step": 1800,
"loss": 8.413354873657227,
"l0": 40.0,
"fve": 0.8881362105445537,
"n_dead": 0,
"mse": 0.01643233373761177
},
{
"step": 2000,
"loss": 8.195343017578125,
"l0": 40.0,
"fve": 0.8944998626527212,
"n_dead": 1,
"mse": 0.015944253653287888
},
{
"step": 2200,
"loss": 8.069483757019043,
"l0": 40.0,
"fve": 0.9000171435610246,
"n_dead": 1,
"mse": 0.01569938287138939
},
{
"step": 2400,
"loss": 7.750567436218262,
"l0": 40.0,
"fve": 0.9054223585460653,
"n_dead": 0,
"mse": 0.015137827023863792
},
{
"step": 2441,
"loss": 7.990331649780273,
"l0": 40.0,
"fve": 0.8937416797380295,
"n_dead": 1,
"mse": 0.015545391477644444
}
]