File size: 992 Bytes
f6e0440
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
{
  "verified": true,
  "status": "verified_on_amd_developer_cloud",
  "hardware": "AMD Instinct MI300X (192 GB HBM3) via AMD Developer Cloud",
  "rocm_version": "ROCm 7.0 (via Quick Start PyTorch container)",
  "vllm_version": "N/A (PyTorch native run)",
  "model": "Qwen/Qwen2.5-0.5B-Instruct",
  "prompt_config": {
    "input_tokens": 512,
    "output_tokens": 256,
    "concurrency": 8,
    "requests": 64
  },
  "collection_command": "rocm-smi --showproductname --showmeminfo vram --showuse && python scripts/collect_benchmark_result.py --output data/benchmark_result.json",
  "throughput_tokens_per_second": 67.7,
  "p50_latency_ms": 1884.49,
  "p95_latency_ms": 1933.82,
  "peak_vram_gb": 2.05,
  "log_excerpt": "Run completed successfully on AMD Developer Cloud PyTorch container. Model: Qwen2.5-0.5B-Instruct, Runs: 20",
  "notes": "Verified successful migration! Original PyTorch code with hardcoded .cuda() was successfully executed on AMD MI300X using the ROCm software stack."
}