| { | |
| "status": "ok", | |
| "backend": "trl_transformers", | |
| "examples_used": 2000, | |
| "model_id": "Qwen/Qwen2.5-3B-Instruct", | |
| "unsloth_available": false, | |
| "train_runtime": 715.2908, | |
| "train_loss": 0.15688225453009363, | |
| "train_metrics": { | |
| "train_runtime": 715.2908, | |
| "train_samples_per_second": 5.592, | |
| "train_steps_per_second": 2.796, | |
| "total_flos": 2.949554402500608e+16, | |
| "train_loss": 0.15688225453009363 | |
| }, | |
| "history_path": "/app/checkpoints/sweeps/qwen-qwen2-5-3b-instruct/sft_history.json", | |
| "artifact_path": "/app/checkpoints/sweeps/qwen-qwen2-5-3b-instruct/sft_adapter" | |
| } |