adithya9903's picture
Upload PolyGuard training artifacts: docs/results
b5cc210 verified
raw
history blame contribute delete
596 Bytes
{
"status": "ok",
"backend": "trl_transformers",
"examples_used": 2000,
"model_id": "Qwen/Qwen2.5-3B-Instruct",
"unsloth_available": false,
"train_runtime": 372.1845,
"train_loss": 0.18184852770145518,
"train_metrics": {
"train_runtime": 372.1845,
"train_samples_per_second": 5.374,
"train_steps_per_second": 5.374,
"total_flos": 1.1456146931712e+16,
"train_loss": 0.18184852770145518
},
"history_path": "/app/checkpoints/sweeps/qwen-qwen2-5-3b-instruct/sft_history.json",
"artifact_path": "/app/checkpoints/sweeps/qwen-qwen2-5-3b-instruct/sft_adapter"
}