cyb011-baseline-classifier / multi_seed_results.json
pradeep-xpert's picture
Initial release: attack_phase 7-class baseline + 6-oracle-path leakage diagnostic + missing tier note
03d64e5 verified
{
"purpose": "Multi-seed evaluation across 10 group-aware splits of the 14,000-event sample (200 campaigns).",
"seeds_evaluated": [
42,
7,
13,
17,
23,
31,
45,
99,
123,
200
],
"per_seed": [
{
"seed": 42,
"test_n_classes": 7,
"accuracy": 0.8642857142857143,
"macro_f1": 0.7693247628697397,
"macro_roc_auc_ovr": 0.9752868672798508
},
{
"seed": 7,
"test_n_classes": 7,
"accuracy": 0.8733333333333333,
"macro_f1": 0.7868555284450741,
"macro_roc_auc_ovr": 0.9786952359398997
},
{
"seed": 13,
"test_n_classes": 7,
"accuracy": 0.8752380952380953,
"macro_f1": 0.7750991458229394,
"macro_roc_auc_ovr": 0.9779387743730787
},
{
"seed": 17,
"test_n_classes": 7,
"accuracy": 0.8738095238095238,
"macro_f1": 0.7814925647016364,
"macro_roc_auc_ovr": 0.9776960470844541
},
{
"seed": 23,
"test_n_classes": 7,
"accuracy": 0.8838095238095238,
"macro_f1": 0.7978303920930874,
"macro_roc_auc_ovr": 0.9798719092961202
},
{
"seed": 31,
"test_n_classes": 7,
"accuracy": 0.8690476190476191,
"macro_f1": 0.7726664814609271,
"macro_roc_auc_ovr": 0.9759310226918093
},
{
"seed": 45,
"test_n_classes": 7,
"accuracy": 0.8519047619047619,
"macro_f1": 0.7504006897882468,
"macro_roc_auc_ovr": 0.9727919502752255
},
{
"seed": 99,
"test_n_classes": 7,
"accuracy": 0.8585714285714285,
"macro_f1": 0.7746640410602633,
"macro_roc_auc_ovr": 0.9769979540429897
},
{
"seed": 123,
"test_n_classes": 7,
"accuracy": 0.8533333333333334,
"macro_f1": 0.771942700676468,
"macro_roc_auc_ovr": 0.9738063729400632
},
{
"seed": 200,
"test_n_classes": 7,
"accuracy": 0.8652380952380953,
"macro_f1": 0.7668641323226082,
"macro_roc_auc_ovr": 0.9762239650477442
}
],
"aggregate": {
"accuracy_mean": 0.8668571428571428,
"accuracy_std": 0.009680145423468645,
"accuracy_min": 0.8519047619047619,
"accuracy_max": 0.8838095238095238,
"macro_f1_mean": 0.774714043924099,
"macro_f1_std": 0.011922910105924629,
"roc_auc_mean": 0.9765240098971235,
"roc_auc_std": 0.0020690216988592247
},
"published_artifact_seed": 42
}