# Base image: Hugging Face PyTorch training container pulled from an AWS ECR
# registry. Per its tag: PyTorch 2.1.0, Transformers 4.36.0, GPU build,
# Python 3.10, CUDA 12.1, Ubuntu 20.04.
# NOTE(review): consider pinning by digest (@sha256:...) for reproducible builds.
FROM 763104351884.dkr.ecr.us-east-1.amazonaws.com/huggingface-pytorch-training:2.1.0-transformers4.36.0-gpu-py310-cu121-ubuntu20.04

# Remove framework packages that may already be present in the base image.
# `pip uninstall -y` skips packages that are not installed, so listing a
# package that is absent is harmless.
RUN pip3 uninstall -y \
        apex \
        flash_attn \
        megatron-core \
        pytorch-quantization \
        pytorch-triton \
        torch \
        torch-tensorrt \
        torchvision \
        transformer_engine \
        xgboost

# Build-time only: stop apt/dpkg from prompting in RUN steps of this stage.
# Declared as ARG (not ENV) so it is not baked into the runtime environment
# of containers started from this image.
ARG DEBIAN_FRONTEND=noninteractive

# Environment persisted into the image (visible at build time and at runtime).
#   MAX_JOBS                      - presumably caps parallel compile jobs for
#                                   source builds of Python extensions; verify.
#   VLLM_WORKER_MULTIPROC_METHOD  - multiprocessing start method for vLLM workers.
#   NODE_OPTIONS                  - explicitly set to the empty string.
#   HF_HUB_ENABLE_HF_TRANSFER     - turns on hf-transfer for Hugging Face Hub
#                                   transfers (the hf-transfer package is
#                                   expected to be installed separately).
ENV MAX_JOBS=32 \
    VLLM_WORKER_MULTIPROC_METHOD=spawn \
    NODE_OPTIONS="" \
    HF_HUB_ENABLE_HF_TRANSFER="1"

# Install systemd. `--force-confdef` tells dpkg to take the default action on
# conffile conflicts instead of prompting. The apt package lists are removed
# in the same layer so they do not bloat the image.
RUN apt-get update && \
    apt-get install -y -o Dpkg::Options::="--force-confdef" systemd && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/*

# Install tini (a minimal init process). Recommended packages are skipped and
# the apt package lists are removed in the same layer to keep the image small.
RUN apt-get update && \
    apt-get install -y --no-install-recommends tini && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/*

# Install the pinned PyTorch / vLLM stack plus training and development tools.
# Requirement specifiers that contain shell metacharacters are quoted:
# unquoted, `>=X` is parsed by /bin/sh as a stdout redirection to a file
# named `=X` (silently dropping the version bound), and `[extra]` is a glob.
RUN pip install --no-cache-dir \
        vllm==0.8.2 \
        torch==2.6.0 \
        torchvision==0.21.0 \
        torchaudio==2.6.0 \
        tensordict \
        torchdata==0.11.0 \
        "transformers>=4.49.0" \
        accelerate \
        datasets \
        peft \
        hf-transfer \
        "ray[default]" \
        codetiming \
        hydra-core \
        pandas \
        "pyarrow>=15.0.0" \
        pylatexenc \
        qwen-vl-utils \
        wandb \
        dill \
        pybind11 \
        liger-kernel \
        mathruler \
        pytest \
        pre-commit \
        py-spy \
        pyext \
        ruff \
        tensorboard

|
| |
| RUN pip uninstall -y transformer-engine flash-attn && \ |
| pip install flash-attn==2.7.4.post1 --no-build-isolation |
|
|
# Swap out pynvml / nvidia-ml-py for a minimum nvidia-ml-py version, pin
# opencv-python-headless and fastapi, and upgrade optree.
# The `>=` specifiers are quoted: unquoted, /bin/sh treats `>=X` as a stdout
# redirection to a file named `=X` and the version bound is lost.
RUN pip uninstall -y pynvml nvidia-ml-py && \
    pip install --no-cache-dir \
        "nvidia-ml-py>=12.560.30" \
        opencv-python-headless==4.8.0.74 \
        fastapi==0.115.6 && \
    pip install --no-cache-dir --upgrade "optree>=0.13.0"

# Install (or upgrade to) the latest verl with its `vllm` extra.
# The requirement is quoted so the shell cannot glob-expand `[vllm]`.
# NOTE(review): verl is unpinned; pin a version if reproducible builds matter.
RUN pip install --no-cache-dir -U "verl[vllm]"

# Clear any custom pip index configuration so the image uses pip's defaults.
# `pip config unset` exits non-zero when the key is not set, which would fail
# the build and skip the second unset; each call is therefore made tolerant.
RUN (pip config unset global.index-url || true) && \
    (pip config unset global.extra-index-url || true)