llama3-edge / configuration_llama_edge.py
crab27's picture
Upload folder using huggingface_hub
4dd7afe verified
from transformers import PretrainedConfig
from typing import Optional
class LlamaEdgeConfig(PretrainedConfig):
model_type = "llama_edge"
def __init__(
self,
dim: int = 4096,
n_layers: int = 32,
n_heads: int = 32,
n_kv_heads: int = 8,
vocab_size: int = 9942,
multiple_of: int = 256,
ffn_dim_multiplier: Optional[float] = 1.3,
norm_eps: float = 1e-5,
rope_theta: float = 500000.0,
max_seq_len: int = 8192,
intermediate_size: int = 14336,
**kwargs,
):
self.dim = dim
self.n_layers = n_layers
self.n_heads = n_heads
self.n_kv_heads = n_kv_heads
self.vocab_size = vocab_size
self.multiple_of = multiple_of
self.ffn_dim_multiplier = ffn_dim_multiplier
self.norm_eps = norm_eps
self.rope_theta = rope_theta
self.max_seq_len = max_seq_len
self.intermediate_size = intermediate_size
super().__init__(**kwargs)