YashashMathur committed on
Commit
aac0ab9
·
verified ·
1 Parent(s): 2688686

More SFT warmup (40 steps) for better JSON format

Browse files
Files changed (1) hide show
  1. train.py +1 -1
train.py CHANGED
@@ -34,7 +34,7 @@ except Exception as e:
34
  print(f"Repo create: {e}")
35
 
36
  MAX_SEQ_LEN = 1024
37
- SFT_STEPS = 20 # 50 done, 20 remaining to reach 70
38
  GRPO_STEPS = 250
39
  GRPO_K = 2
40
  GRPO_LR = 1e-5
 
34
  print(f"Repo create: {e}")
35
 
36
  MAX_SEQ_LEN = 1024
37
+ SFT_STEPS = 40 # More warmup for JSON format
38
  GRPO_STEPS = 250
39
  GRPO_K = 2
40
  GRPO_LR = 1e-5