brthor committed on
Commit
e9793a2
·
verified ·
1 Parent(s): d8ad126

Refresh base adapter to best eval_loss (profile=qwen3_5_9b, step=288, eval_loss=0.045270)

Browse files
qwen__qwen3.5-9b/adapter_config.json CHANGED
@@ -33,16 +33,16 @@
33
  "rank_pattern": {},
34
  "revision": null,
35
  "target_modules": [
 
36
  "out_proj",
37
- "k_proj",
38
  "q_proj",
39
  "v_proj",
40
- "down_proj",
41
  "o_proj",
 
42
  "in_proj_qkv",
43
  "in_proj_z",
44
- "gate_proj",
45
- "up_proj"
46
  ],
47
  "target_parameters": null,
48
  "task_type": "CAUSAL_LM",
 
33
  "rank_pattern": {},
34
  "revision": null,
35
  "target_modules": [
36
+ "down_proj",
37
  "out_proj",
 
38
  "q_proj",
39
  "v_proj",
40
+ "gate_proj",
41
  "o_proj",
42
+ "up_proj",
43
  "in_proj_qkv",
44
  "in_proj_z",
45
+ "k_proj"
 
46
  ],
47
  "target_parameters": null,
48
  "task_type": "CAUSAL_LM",
qwen__qwen3.5-9b/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:486ed260350c203aee8100eac07c25e4103d918c3f5186932be4241c6b2d800f
3
  size 80275624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29be519746ededecbd60e5efc79aa9aa9ecd81e82762ee80c2845b9234510d85
3
  size 80275624
qwen__qwen3.5-9b/best_eval_metrics.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_eval_loss": 0.037669453769922256,
3
- "best_step": 1152,
4
- "epoch": 2.0034782608695654
5
  }
 
1
  {
2
+ "best_eval_loss": 0.04526974633336067,
3
+ "best_step": 288,
4
+ "epoch": 0.5008695652173913
5
  }