Jayant-Kernel committed on
Commit
42f691c
·
unverified ·
1 Parent(s): eed0745

fix: batch size 4 to match num_generations 4

Browse files
Files changed (1) hide show
  1. train.py +1 -1
train.py CHANGED
@@ -159,7 +159,7 @@ trainer = GRPOTrainer(
159
  args=GRPOConfig(
160
  output_dir="./deceit-1.5b",
161
  max_steps=150,
162
- per_device_train_batch_size=2,
163
  num_generations=4,
164
  learning_rate=5e-6,
165
  warmup_steps=5,
 
159
  args=GRPOConfig(
160
  output_dir="./deceit-1.5b",
161
  max_steps=150,
162
+ per_device_train_batch_size=4,
163
  num_generations=4,
164
  learning_rate=5e-6,
165
  warmup_steps=5,