{ "verified": true, "status": "verified_on_amd_developer_cloud", "hardware": "AMD Instinct MI300X (192 GB HBM3) via AMD Developer Cloud", "rocm_version": "ROCm 7.0 (via Quick Start PyTorch container)", "vllm_version": "N/A (PyTorch native run)", "model": "Qwen/Qwen2.5-0.5B-Instruct", "prompt_config": { "input_tokens": 512, "output_tokens": 256, "concurrency": 8, "requests": 64 }, "collection_command": "rocm-smi --showproductname --showmeminfo vram --showuse && python scripts/collect_benchmark_result.py --output data/benchmark_result.json", "throughput_tokens_per_second": 67.7, "p50_latency_ms": 1884.49, "p95_latency_ms": 1933.82, "peak_vram_gb": 2.05, "log_excerpt": "Run completed successfully on AMD Developer Cloud PyTorch container. Model: Qwen2.5-0.5B-Instruct, Runs: 20", "notes": "Verified successful migration! Original PyTorch code with hardcoded .cuda() was successfully executed on AMD MI300X using the ROCm software stack." }