File size: 2,443 Bytes
16be928
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
{
  "purpose": "With n=100 campaigns, single-seed metrics carry test-fold variance. Multi-seed evaluation gives a more reliable picture.",
  "seeds_evaluated": [
    42,
    7,
    13,
    17,
    23,
    31,
    45,
    99,
    123,
    200
  ],
  "per_seed": [
    {
      "seed": 42,
      "test_n_classes": 7,
      "accuracy": 0.6547008547008547,
      "macro_f1": 0.6401276666852063,
      "macro_roc_auc_ovr": 0.935584434710217
    },
    {
      "seed": 7,
      "test_n_classes": 7,
      "accuracy": 0.6267123287671232,
      "macro_f1": 0.6141815367358149,
      "macro_roc_auc_ovr": 0.9256987657069029
    },
    {
      "seed": 13,
      "test_n_classes": 7,
      "accuracy": 0.5983050847457627,
      "macro_f1": 0.5953435905708684,
      "macro_roc_auc_ovr": 0.9235372520169014
    },
    {
      "seed": 17,
      "test_n_classes": 7,
      "accuracy": 0.64349376114082,
      "macro_f1": 0.6328717716731788,
      "macro_roc_auc_ovr": 0.9426545946495839
    },
    {
      "seed": 23,
      "test_n_classes": 7,
      "accuracy": 0.5915254237288136,
      "macro_f1": 0.5734921834318393,
      "macro_roc_auc_ovr": 0.9245031023094512
    },
    {
      "seed": 31,
      "test_n_classes": 7,
      "accuracy": 0.6220095693779905,
      "macro_f1": 0.6103022022937624,
      "macro_roc_auc_ovr": 0.9325576570435162
    },
    {
      "seed": 45,
      "test_n_classes": 7,
      "accuracy": 0.6678082191780822,
      "macro_f1": 0.655097964659693,
      "macro_roc_auc_ovr": 0.9396074000285977
    },
    {
      "seed": 99,
      "test_n_classes": 7,
      "accuracy": 0.7111111111111111,
      "macro_f1": 0.7136854710276727,
      "macro_roc_auc_ovr": 0.9538147161172963
    },
    {
      "seed": 123,
      "test_n_classes": 7,
      "accuracy": 0.6823734729493892,
      "macro_f1": 0.6727927606720584,
      "macro_roc_auc_ovr": 0.9443324151480283
    },
    {
      "seed": 200,
      "test_n_classes": 7,
      "accuracy": 0.6931407942238267,
      "macro_f1": 0.6752712902262269,
      "macro_roc_auc_ovr": 0.9450377543018418
    }
  ],
  "aggregate": {
    "accuracy_mean": 0.6491180619923773,
    "accuracy_std": 0.03799334369624316,
    "accuracy_min": 0.5915254237288136,
    "accuracy_max": 0.7111111111111111,
    "macro_f1_mean": 0.638316643797632,
    "macro_f1_std": 0.039956794294168915,
    "roc_auc_mean": 0.9367328092032338,
    "roc_auc_std": 0.009623085359130642
  },
  "published_artifact_seed": 42
}