{
  "config": {
    "pins": {
      "torch": "2.7.0",
      "unsloth": "2026.4.4",
      "unsloth_zoo": "2026.4.4",
      "trl": "0.21.0",
      "transformers": "4.56.2",
      "vllm": "0.9.2",
      "peft": "0.18.0",
      "accelerate": "1.13.0",
      "bitsandbytes": "0.49.2",
      "torchao": "0.17.0"
    },
    "grpo": {
      "num_generations": 4,
      "max_completion_length": 512,
      "gradient_accumulation_steps": 8,
      "learning_rate": 5e-06,
      "beta": 0.04,
      "num_train_epochs": 1,
      "max_steps": 400,
      "logging_steps": 5,
      "save_steps": 25,
      "eval_steps": 25,
      "lr_scheduler_type": "cosine",
      "warmup_ratio": 0.05
    },
    "sft": {
      "num_train_epochs": 1,
      "per_device_train_batch_size": 4,
      "gradient_accumulation_steps": 4,
      "learning_rate": 2e-05,
      "max_seq_length": 1024
    },
    "task_filter": "action_screen",
    "smoke_steps": 5,
    "abort_step100_min_reward": 0.05,
    "abort_step200_min_reward": 0.7
  },
  "f1_per_tier": {
    "action_screen": {
      "precision": 1.0,
      "recall": 0.9744,
      "f1": 0.987
    },
    "war_room": {
      "precision": 1.0,
      "recall": 0.9624,
      "f1": 0.9808
    },
    "drift_ops": {
      "precision": 0.9205,
      "recall": 0.7864,
      "f1": 0.8482
    }
  },
  "baseline_qwen3_1_7b_zeroshot_f1_per_tier": {},
  "abort_path": null,
  "wall_clock_s": 5078.9,
  "best_checkpoint_step": 350,
  "model_repo": "Elliot89/sentinel-overseer-qwen3-1.7b-grpo400",
  "git_repo": "https://github.com/MrEinsteinE/sentinel-openenv",
  "sentinel_url": "https://elliot89-sentinel.hf.space"
}