SemiticGPT-3B / config.json
ronnengmail's picture
Upload config.json with huggingface_hub
4b368cd verified
{
"model_type": "semitic-gpt",
"architectures": [
"SemiticGPT"
],
"vocab_size": 32000,
"hidden_size": 3072,
"num_hidden_layers": 26,
"num_attention_heads": 24,
"intermediate_size": 8192,
"max_position_embeddings": 2048,
"rope_theta": 10000.0,
"rope_dim": 64,
"rms_norm_eps": 1e-06,
"tie_word_embeddings": false,
"torch_dtype": "bfloat16",
"num_parameters": 3140000000,
"tokenizer": "sentencepiece",
"tokenizer_model": "multilingual_32k.model",
"languages": [
"Hebrew (he)",
"Arabic (ar)",
"Farsi/Persian (fa)",
"English (en)"
],
"training": {
"pretraining_tokens": "4.48B",
"pretraining_languages": "Hebrew (40%), Arabic (20%), Farsi (20%), English (20%)",
"sft_v4_samples": 36980,
"sft_optimizer": "AdamW",
"sft_lr": "2e-5",
"sft_steps": 8000
}
}