| { | |
| "calibration_samples": 128, | |
| "created_at_unix": 1779205965, | |
| "cuda_runtime": "13.0", | |
| "dtype": "bf16", | |
| "excluded_patterns": [ | |
| "*lm_head*", | |
| "*embed_tokens*", | |
| "*router*", | |
| "*conv_qk*" | |
| ], | |
| "gpu_capability": [ | |
| 12, | |
| 0 | |
| ], | |
| "gpu_name": "NVIDIA RTX PRO 6000 Blackwell Workstation Edition", | |
| "max_seq_len": 2048, | |
| "module_summary": { | |
| "linear_expert": 1280, | |
| "linear_lm_head": 1, | |
| "linear_router": 160, | |
| "linear_targeted_estimate": 1480, | |
| "linear_total": 1641 | |
| }, | |
| "platform": "Linux-6.8.0-107-generic-x86_64-with-glibc2.39", | |
| "python": "3.12.3", | |
| "quantization": "ModelOpt NVFP4_DEFAULT_CFG", | |
| "source_model": "Zyphra/ZAYA1-8B", | |
| "source_revision": "970cfc9f5e7e5a4f5f6f0645955928a9b6a98415", | |
| "tensor_stats": { | |
| "files": [ | |
| { | |
| "bytes": 5804183272, | |
| "name": "model.safetensors" | |
| } | |
| ], | |
| "tensor_dtypes": { | |
| "torch.bfloat16": 963, | |
| "torch.float32": 3000, | |
| "torch.float8_e4m3fn": 1480, | |
| "torch.uint8": 1480 | |
| } | |
| }, | |
| "torch": "2.12.0+cu130" | |
| } |