{
  "_meta": {
    "eval_file": "logs/eval_v2.json",
    "iterations": 10000,
    "seed": 42,
    "method": "percentile bootstrap on Bernoulli outcome arrays reconstructed from logs/eval_v2.json aggregates",
    "n_scams": 144,
    "n_benign": 30,
    "n_total": 174
  },
  "detection": {
    "point": 0.9930555555555556,
    "ci_low": 0.9791666666666666,
    "ci_high": 1.0
  },
  "fpr": {
    "point": 0.06666666666666667,
    "ci_low": 0.0,
    "ci_high": 0.16666666666666666
  },
  "f1": {
    "point": 0.9896193771626298,
    "ci_low": 0.9759450171821307,
    "ci_high": 1.0
  },
  "per_difficulty": {
    "easy": {
      "n": 26,
      "detection": {
        "point": 1.0,
        "ci_low": 1.0,
        "ci_high": 1.0
      }
    },
    "medium": {
      "n": 66,
      "detection": {
        "point": 1.0,
        "ci_low": 1.0,
        "ci_high": 1.0
      }
    },
    "hard": {
      "n": 18,
      "detection": {
        "point": 1.0,
        "ci_low": 1.0,
        "ci_high": 1.0
      }
    },
    "novel": {
      "n": 34,
      "detection": {
        "point": 0.9705882352941176,
        "ci_low": 0.9117647058823529,
        "ci_high": 1.0
      }
    }
  }
}