rocmport-agentic / data /benchmark_result.json
Nawangdorjay's picture
Deploy ROCmPort AI — CUDA-to-ROCm migration scanner
f6e0440 verified
{
"verified": true,
"status": "verified_on_amd_developer_cloud",
"hardware": "AMD Instinct MI300X (192 GB HBM3) via AMD Developer Cloud",
"rocm_version": "ROCm 7.0 (via Quick Start PyTorch container)",
"vllm_version": "N/A (PyTorch native run)",
"model": "Qwen/Qwen2.5-0.5B-Instruct",
"prompt_config": {
"input_tokens": 512,
"output_tokens": 256,
"concurrency": 8,
"requests": 64
},
"collection_command": "rocm-smi --showproductname --showmeminfo vram --showuse && python scripts/collect_benchmark_result.py --output data/benchmark_result.json",
"throughput_tokens_per_second": 67.7,
"p50_latency_ms": 1884.49,
"p95_latency_ms": 1933.82,
"peak_vram_gb": 2.05,
"log_excerpt": "Run completed successfully on AMD Developer Cloud PyTorch container. Model: Qwen2.5-0.5B-Instruct, Runs: 20",
"notes": "Verified successful migration! Original PyTorch code with hardcoded .cuda() was successfully executed on AMD MI300X using the ROCm software stack."
}