| { | |
| "model_type": "adaptive_retro_gpt", | |
| "architectures": [ | |
| "RetroGPT" | |
| ], | |
| "vocab_size": 50000, | |
| "d_model": 2048, | |
| "n_layers": 20, | |
| "n_heads": 16, | |
| "seq_len": 2048, | |
| "retrieval_layers": "5,11,17", | |
| "top_k": 2, | |
| "retrieval_seq_len": 512, | |
| "hash_dim": 1024, | |
| "retrieval_budget_lambda": 0.001, | |
| "no_retrieval_prob": 0.1, | |
| "random_retrieval_prob": 0.1, | |
| "parameter_count": 1172146179, | |
| "checkpoint_step": 20000 | |
| } |