tharun2909 committed on
Commit
e75a1e4
·
verified ·
1 Parent(s): 223a95a

Upload training configuration

Browse files
Files changed (1) hide show
  1. run_config.json +10 -10
run_config.json CHANGED
@@ -1,18 +1,18 @@
1
  {
2
- "model_name": "sshleifer/tiny-gpt2",
3
- "epochs": 1,
4
- "batch_size": 2,
5
- "learning_rate": 0.0002,
6
  "grad_accum_steps": 4,
7
  "precision": "fp32",
8
- "quantization_bits": 4,
9
- "lora_r": 8,
10
- "lora_alpha": 16,
11
- "lora_dropout": 0.05,
12
  "target_modules": [
13
  "c_attn",
14
  "c_proj"
15
  ],
16
- "total_steps": 62,
17
- "num_train_samples": 490
18
  }
 
1
  {
2
+ "model_name": "distilgpt2",
3
+ "epochs": 2,
4
+ "batch_size": 1,
5
+ "learning_rate": 0.0003,
6
  "grad_accum_steps": 4,
7
  "precision": "fp32",
8
+ "quantization_bits": 8,
9
+ "lora_r": 4,
10
+ "lora_alpha": 8,
11
+ "lora_dropout": 0.04,
12
  "target_modules": [
13
  "c_attn",
14
  "c_proj"
15
  ],
16
+ "total_steps": 60,
17
+ "num_train_samples": 240
18
  }