File size: 440 Bytes
"""Applied automatically in every Python process with this file on PYTHONPATH.

vLLM spawns worker subprocesses that re-import modules; without this file,
the monkey-patch would be missing in the workers, and weight loading would
fail for the heterogeneous per-layer expert counts.
"""
import os
# Best-effort activation of the vllm_pruned_patch monkey-patch.
# Setting VLLM_PRUNED_PATCH_DISABLE=1 in the environment skips it entirely.
if os.environ.get('VLLM_PRUNED_PATCH_DISABLE') != '1':
    try:
        import vllm_pruned_patch
        vllm_pruned_patch.apply()
    except ImportError:
        # This hook may run in interpreters where the patch module (or
        # something it imports) is not available; stay silent there.
        pass
    except Exception as exc:
        # Never abort interpreter start-up, but do not hide a broken patch:
        # per the module docstring, a missing patch makes weight loading
        # fail later, far away from the real cause.
        import sys

        if sys.stderr is not None:
            print(
                f"[vllm_pruned_patch] patch not applied: "
                f"{type(exc).__name__}: {exc}",
                file=sys.stderr,
            )
|