File size: 365 Bytes
229fc53
 
3ec5524
 
229fc53
3ec5524
229fc53
 
 
 
1
2
3
4
5
6
7
8
9
10
11
import os

# Base URL of the vLLM server (OpenAI-compatible endpoint, e.g. on AMD
# Developer Cloud). Falls back to http://localhost:8000 when the
# VLLM_API_URL environment variable is not set.
VLLM_API_URL = os.getenv("VLLM_API_URL", "http://localhost:8000")

# Model identifier; override with the MODEL_NAME environment variable.
MODEL_NAME = os.getenv("MODEL_NAME", "Qwen/Qwen2.5-VL-7B-Instruct")

# Generation settings. Environment values are strings, so each one is
# converted to its numeric type at import time; a non-numeric value raises
# ValueError from int()/float().
MAX_NEW_TOKENS = int(os.getenv("MAX_NEW_TOKENS", "512"))
TEMPERATURE = float(os.getenv("TEMPERATURE", "0.2"))