LH-Tech-AI committed on
Commit
274c8f4
·
verified ·
1 Parent(s): bf1bea9

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +9 -9
config.json CHANGED
@@ -7,26 +7,26 @@
7
  "bos_token_id": 0,
8
  "dtype": "float32",
9
  "eos_token_id": 2,
10
- "head_dim": 8,
11
  "hidden_act": "silu",
12
- "hidden_size": 64,
13
  "initializer_range": 0.02,
14
- "intermediate_size": 128,
15
  "max_position_embeddings": 512,
16
  "mlp_bias": false,
17
  "model_type": "llama",
18
- "num_attention_heads": 8,
19
- "num_hidden_layers": 5,
20
- "num_key_value_heads": 8,
21
  "pad_token_id": 1,
22
  "pretraining_tp": 1,
23
  "rms_norm_eps": 1e-06,
24
  "rope_parameters": {
25
- "rope_theta": 10000.0,
26
  "rope_type": "default"
27
  },
28
  "tie_word_embeddings": true,
29
  "transformers_version": "5.8.1",
30
  "use_cache": false,
31
- "vocab_size": 4096
32
- }
 
7
  "bos_token_id": 0,
8
  "dtype": "float32",
9
  "eos_token_id": 2,
10
+ "head_dim": 32,
11
  "hidden_act": "silu",
12
+ "hidden_size": 128,
13
  "initializer_range": 0.02,
14
+ "intermediate_size": 512,
15
  "max_position_embeddings": 512,
16
  "mlp_bias": false,
17
  "model_type": "llama",
18
+ "num_attention_heads": 4,
19
+ "num_hidden_layers": 6,
20
+ "num_key_value_heads": 4,
21
  "pad_token_id": 1,
22
  "pretraining_tp": 1,
23
  "rms_norm_eps": 1e-06,
24
  "rope_parameters": {
25
+ "rope_theta": 500000,
26
  "rope_type": "default"
27
  },
28
  "tie_word_embeddings": true,
29
  "transformers_version": "5.8.1",
30
  "use_cache": false,
31
+ "vocab_size": 8192
32
+ }