cyb011-baseline-classifier / validation_results.json

Initial release: attack_phase 7-class baseline + 6-oracle-path leakage diagnostic + missing tier note

03d64e5 verified 1 day ago

6.48 kB

	{
	"version": "1.0.0",
	"dataset": "xpertsystems/cyb011-sample",
	"task": "7-class attack_phase classification",
	"baselines": {
	"always_predict_majority_accuracy": 0.5033333333333333,
	"majority_class": "evasion_attempt",
	"random_guess_accuracy": 0.14285714285714285
	},
	"split": {
	"strategy": "group-aware (GroupShuffleSplit on campaign_id, nested 70/15/15)",
	"rationale": "200 campaigns x 70 timesteps each. Timesteps from the same campaign share attacker, target segment, and tier - so train/test contamination is a real risk with random splitting. ~30 test campaigns per fold.",
	"events_train": 9730,
	"events_val": 2170,
	"events_test": 2100,
	"seed": 42
	},
	"n_features": 37,
	"label_classes": [
	"reconnaissance",
	"feature_space_probe",
	"perturbation_craft",
	"evasion_attempt",
	"feedback_adaptation",
	"campaign_consolidation",
	"idle_dwell"
	],
	"class_distribution_train": {
	"evasion_attempt": 5082,
	"idle_dwell": 1677,
	"feature_space_probe": 983,
	"campaign_consolidation": 571,
	"reconnaissance": 558,
	"perturbation_craft": 511,
	"feedback_adaptation": 348
	},
	"class_distribution_test": {
	"evasion_attempt": 1057,
	"idle_dwell": 388,
	"feature_space_probe": 220,
	"reconnaissance": 128,
	"campaign_consolidation": 116,
	"perturbation_craft": 115,
	"feedback_adaptation": 76
	},
	"oracle_excluded_features": [
	"detection_outcome (perfect oracle for evasion_attempt phase)",
	"detector_confidence_score (mechanical decoder for detection_outcome)",
	"evasion_budget_consumed (==0 is perfect oracle for 3 early phases)"
	],
	"timestep_kept_as_legitimate_feature": "timestep is KEPT as a feature. It's a partial oracle for 3 phases (reconnaissance, feedback_adaptation, campaign_consolidation) but is a legitimate campaign-progress observable a defender would have at decision time. Removing it drops accuracy by ~9pp.",
	"leakage_audit_note": "See leakage_diagnostic.json for the full 6-oracle-path audit, 4 unlearnable README-suggested targets, and the missing nation_state attacker tier note.",
	"models": {
	"xgboost": {
	"architecture": "Gradient-boosted decision trees, multi:softprob, 7 classes",
	"framework": "xgboost",
	"test_metrics": {
	"model": "xgboost",
	"accuracy": 0.8642857142857143,
	"macro_f1": 0.7693247628697397,
	"weighted_f1": 0.8650489644308249,
	"per_class_f1": {
	"reconnaissance": 0.8865248226950354,
	"feature_space_probe": 0.7829977628635347,
	"perturbation_craft": 0.4927536231884058,
	"evasion_attempt": 0.9962013295346629,
	"feedback_adaptation": 0.7151515151515152,
	"campaign_consolidation": 0.8075471698113208,
	"idle_dwell": 0.7040971168437026
	},
	"confusion_matrix": {
	"labels": [
	"reconnaissance",
	"feature_space_probe",
	"perturbation_craft",
	"evasion_attempt",
	"feedback_adaptation",
	"campaign_consolidation",
	"idle_dwell"
	],
	"matrix": [
	[
	125,
	0,
	0,
	0,
	0,
	0,
	3
	],
	[
	0,
	175,
	43,
	0,
	0,
	0,
	2
	],
	[
	0,
	20,
	68,
	0,
	0,
	0,
	27
	],
	[
	0,
	0,
	2,
	1049,
	0,
	0,
	6
	],
	[
	0,
	0,
	0,
	0,
	59,
	16,
	1
	],
	[
	0,
	0,
	0,
	0,
	9,
	107,
	0
	],
	[
	29,
	32,
	48,
	0,
	21,
	26,
	232
	]
	]
	},
	"macro_roc_auc_ovr": 0.9752868672798508
	}
	},
	"mlp": {
	"architecture": "PyTorch MLP, 37 -> 128 -> 64 -> 7, BatchNorm1d + ReLU + Dropout, weighted cross-entropy loss",
	"framework": "pytorch",
	"test_metrics": {
	"model": "mlp",
	"accuracy": 0.8385714285714285,
	"macro_f1": 0.7344635260259678,
	"weighted_f1": 0.8387834443096441,
	"per_class_f1": {
	"reconnaissance": 0.8737201365187713,
	"feature_space_probe": 0.746606334841629,
	"perturbation_craft": 0.49707602339181284,
	"evasion_attempt": 0.9928537398761315,
	"feedback_adaptation": 0.627906976744186,
	"campaign_consolidation": 0.784452296819788,
	"idle_dwell": 0.6186291739894552
	},
	"confusion_matrix": {
	"labels": [
	"reconnaissance",
	"feature_space_probe",
	"perturbation_craft",
	"evasion_attempt",
	"feedback_adaptation",
	"campaign_consolidation",
	"idle_dwell"
	],
	"matrix": [
	[
	128,
	0,
	0,
	0,
	0,
	0,
	0
	],
	[
	0,
	165,
	55,
	0,
	0,
	0,
	0
	],
	[
	5,
	24,
	85,
	0,
	0,
	0,
	1
	],
	[
	0,
	4,
	2,
	1042,
	4,
	1,
	4
	],
	[
	0,
	0,
	0,
	0,
	54,
	22,
	0
	],
	[
	0,
	0,
	0,
	0,
	5,
	111,
	0
	],
	[
	32,
	29,
	85,
	0,
	33,
	33,
	176
	]
	]
	},
	"macro_roc_auc_ovr": 0.9705026035482472
	}
	}
	}
	}