Eeppa committed on
Commit
0afbae0
·
verified ·
1 Parent(s): 23a5917

Update configuration_tinybuddy.py

Browse files
Files changed (1) hide show
  1. configuration_tinybuddy.py +25 -12
configuration_tinybuddy.py CHANGED
@@ -2,16 +2,29 @@
2
  Configuration class for TinyBuddy-30M.
3
  """
4
 
5
- from dataclasses import dataclass
6
 
7
-
8
- @dataclass
9
- class GPTConfig:
10
- vocab_size: int = 50000
11
- block_size: int = 512 # max context length
12
- n_layer: int = 6
13
- n_head: int = 8
14
- n_embd: int = 256
15
- mlp_ratio: int = 4 # hidden = mlp_ratio * n_embd
16
- dropout: float = 0.0
17
- tie_weights: bool = False # False -> ~30M params; True -> ~22M
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  Configuration class for TinyBuddy-30M.
3
  """
4
 
5
+ from transformers import PretrainedConfig
6
 
7
+ class GPTConfig(PretrainedConfig):
8
+ model_type = "tinybuddy"
9
+
10
+ def __init__(
11
+ self,
12
+ vocab_size: int = 50000,
13
+ block_size: int = 512,
14
+ n_layer: int = 6,
15
+ n_head: int = 8,
16
+ n_embd: int = 256,
17
+ mlp_ratio: int = 4,
18
+ dropout: float = 0.0,
19
+ tie_weights: bool = False,
20
+ **kwargs
21
+ ):
22
+ super().__init__(**kwargs)
23
+ self.vocab_size = vocab_size
24
+ self.block_size = block_size
25
+ self.n_layer = n_layer
26
+ self.n_head = n_head
27
+ self.n_embd = n_embd
28
+ self.mlp_ratio = mlp_ratio
29
+ self.dropout = dropout
30
+ self.tie_weights = tie_weights