Ill-Ness committed on
Commit
0e8a062
·
verified ·
1 Parent(s): 6fde20b

Delete training_report.json

Browse files
Files changed (1) hide show
  1. training_report.json +0 -37
training_report.json DELETED
@@ -1,37 +0,0 @@
1
- {
2
- "model_name": "Supertron2-24B",
3
- "base_model": "mistralai/Devstral-Small-2-24B-Instruct-2512",
4
- "training_base_model": "akoumpa/Devstral-Small-2-24B-Instruct-2512-BF16",
5
- "run_dir": "/artifacts/20260518-164838",
6
- "adapter_dir": "/artifacts/20260518-164838/adapter",
7
- "merged_dir": null,
8
- "train_minutes": 60,
9
- "elapsed_seconds": 181.40671366200002,
10
- "global_step": 600,
11
- "train_loss": 1.570858365794023,
12
- "parameter_count": 24034167808,
13
- "trainable_parameter_count": 22806528,
14
- "attention_impl": "flash_attention_2",
15
- "resumed_from": null,
16
- "use_4bit": false,
17
- "torch_compile": false,
18
- "gradient_checkpointing": true,
19
- "lora": {
20
- "r": 16,
21
- "alpha": 32,
22
- "dropout": 0.03
23
- },
24
- "datasets": {
25
- "SWE-bench/SWE-smith": 2000,
26
- "SWE-bench/SWE-bench": 2000,
27
- "ise-uiuc/Magicoder-OSS-Instruct-75K": 6000,
28
- "m-a-p/CodeFeedback-Filtered-Instruction": 6000,
29
- "Open-Orca/OpenOrca": 5000,
30
- "HuggingFaceH4/ultrachat_200k": 5000,
31
- "gsm8k": 4000,
32
- "allenai/sciq": 3000,
33
- "supertron2-identity": 1000
34
- },
35
- "pushed_to_hub": false,
36
- "hub_repo_id": "Surpem/Supertron2-24B"
37
- }