vllm
Rocm
Install
sh -c 'echo 0 > /proc/sys/kernel/numa_balancing'
cat /proc/sys/kernel/numa_balancing
Using Docker
sudo pamac pacman -Ss docker containerd
sudo usermod -aG docker $USER
sudo mkdir /etc/docker/
sudo bash -c 'cat > /etc/docker/daemon.json <<EOF
{
"insecure-registries" : ["https://docker.arvancloud.ir"],
"registry-mirrors": ["https://docker.arvancloud.ir"],
"features": {
"containerd-snapshotter": true,
"buildkit": true
}
}
EOF'
sudo systemctl enable docker
sudo systemctl daemon-reload
docker logout
sudo systemctl restart docker
sudo reboot
nano dockerfile
#FROM rocm/vllm-dev:main
FROM rocm/vllm-dev:main
# Install development tools
RUN apt-get update && apt-get install -y \
curl \
&& rm -rf /var/lib/apt/lists/*
# Install dependencies
RUN pip3 install --no-cache-dir \
transformers \
accelerate \
safetensors
# Create non-root user for security
RUN useradd -m -u 2000 vllm
WORKDIR /app
RUN chown vllm:vllm /app
# Switch to non-root user
USER vllm
docker pull docker.iranserver.com/rocm/vllm-dev:main
docker build -t vllm-toolkit .
docker run -it --rm \
--device=/dev/kfd --device=/dev/dri \
--group-add=$(getent group video | cut -d: -f3) \
--group-add=$(getent group render | cut -d: -f3) \
--ipc=host \
--security-opt seccomp=unconfined \
-p 8000:8000 \
vllm-toolkit
Env config
- FlashMLA