Spaces:
Runtime error
Runtime error
| { | |
| "verified": true, | |
| "status": "verified_on_amd_developer_cloud", | |
| "hardware": "AMD Instinct MI300X (192 GB HBM3) via AMD Developer Cloud", | |
| "rocm_version": "ROCm 7.0 (via Quick Start PyTorch container)", | |
| "vllm_version": "N/A (PyTorch native run)", | |
| "model": "Qwen/Qwen2.5-0.5B-Instruct", | |
| "prompt_config": { | |
| "input_tokens": 512, | |
| "output_tokens": 256, | |
| "concurrency": 8, | |
| "requests": 64 | |
| }, | |
| "collection_command": "rocm-smi --showproductname --showmeminfo vram --showuse && python scripts/collect_benchmark_result.py --output data/benchmark_result.json", | |
| "throughput_tokens_per_second": 67.7, | |
| "p50_latency_ms": 1884.49, | |
| "p95_latency_ms": 1933.82, | |
| "peak_vram_gb": 2.05, | |
| "log_excerpt": "Run completed successfully on AMD Developer Cloud PyTorch container. Model: Qwen2.5-0.5B-Instruct, Runs: 20", | |
| "notes": "Verified successful migration! Original PyTorch code with hardcoded .cuda() was successfully executed on AMD MI300X using the ROCm software stack." | |
| } | |