File size: 2,443 Bytes
16be928 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 | {
"purpose": "With n=100 campaigns, single-seed metrics carry test-fold variance. Multi-seed evaluation gives a more reliable picture.",
"seeds_evaluated": [
42,
7,
13,
17,
23,
31,
45,
99,
123,
200
],
"per_seed": [
{
"seed": 42,
"test_n_classes": 7,
"accuracy": 0.6547008547008547,
"macro_f1": 0.6401276666852063,
"macro_roc_auc_ovr": 0.935584434710217
},
{
"seed": 7,
"test_n_classes": 7,
"accuracy": 0.6267123287671232,
"macro_f1": 0.6141815367358149,
"macro_roc_auc_ovr": 0.9256987657069029
},
{
"seed": 13,
"test_n_classes": 7,
"accuracy": 0.5983050847457627,
"macro_f1": 0.5953435905708684,
"macro_roc_auc_ovr": 0.9235372520169014
},
{
"seed": 17,
"test_n_classes": 7,
"accuracy": 0.64349376114082,
"macro_f1": 0.6328717716731788,
"macro_roc_auc_ovr": 0.9426545946495839
},
{
"seed": 23,
"test_n_classes": 7,
"accuracy": 0.5915254237288136,
"macro_f1": 0.5734921834318393,
"macro_roc_auc_ovr": 0.9245031023094512
},
{
"seed": 31,
"test_n_classes": 7,
"accuracy": 0.6220095693779905,
"macro_f1": 0.6103022022937624,
"macro_roc_auc_ovr": 0.9325576570435162
},
{
"seed": 45,
"test_n_classes": 7,
"accuracy": 0.6678082191780822,
"macro_f1": 0.655097964659693,
"macro_roc_auc_ovr": 0.9396074000285977
},
{
"seed": 99,
"test_n_classes": 7,
"accuracy": 0.7111111111111111,
"macro_f1": 0.7136854710276727,
"macro_roc_auc_ovr": 0.9538147161172963
},
{
"seed": 123,
"test_n_classes": 7,
"accuracy": 0.6823734729493892,
"macro_f1": 0.6727927606720584,
"macro_roc_auc_ovr": 0.9443324151480283
},
{
"seed": 200,
"test_n_classes": 7,
"accuracy": 0.6931407942238267,
"macro_f1": 0.6752712902262269,
"macro_roc_auc_ovr": 0.9450377543018418
}
],
"aggregate": {
"accuracy_mean": 0.6491180619923773,
"accuracy_std": 0.03799334369624316,
"accuracy_min": 0.5915254237288136,
"accuracy_max": 0.7111111111111111,
"macro_f1_mean": 0.638316643797632,
"macro_f1_std": 0.039956794294168915,
"roc_auc_mean": 0.9367328092032338,
"roc_auc_std": 0.009623085359130642
},
"published_artifact_seed": 42
} |