• Joined on 2025-11-02

vllm-therock-gfx1151 (turboquant-6ef1efd)

Published 2026-04-18 18:26:37 +02:00 by mat

Installation

docker pull git.mialemrobicnic.pl/mat/vllm-therock-gfx1151:turboquant-6ef1efd
sha256:f36665975ed16a8015def82830b80ae2e593ad277c6b39177ef7c3a31bd3ef8d

Image Layers

KIWI 10.3.0
COPY scripts/install_deps.sh /tmp/install_deps.sh # buildkit
RUN /bin/sh -c sh /tmp/install_deps.sh # buildkit
WORKDIR /tmp
ARG ROCM_MAJOR_VER=7
ARG GFX=gfx1151
COPY scripts/install_rocm_sdk.sh /tmp/install_rocm_sdk.sh # buildkit
RUN |2 ROCM_MAJOR_VER=7 GFX=gfx1151 /bin/sh -c chmod +x /tmp/install_rocm_sdk.sh && export ROCM_MAJOR_VER=$ROCM_MAJOR_VER && export GFX=$GFX && /tmp/install_rocm_sdk.sh # buildkit
RUN |2 ROCM_MAJOR_VER=7 GFX=gfx1151 /bin/sh -c /usr/bin/python3.12 -m venv /opt/venv # buildkit
ENV VIRTUAL_ENV=/opt/venv
ENV PATH=/opt/venv/bin:/usr/local/bin:/usr/bin
ENV PIP_NO_CACHE_DIR=1
RUN |2 ROCM_MAJOR_VER=7 GFX=gfx1151 /bin/sh -c printf 'source /opt/venv/bin/activate\n' > /etc/profile.d/venv.sh # buildkit
RUN |2 ROCM_MAJOR_VER=7 GFX=gfx1151 /bin/sh -c python -m pip install --upgrade pip wheel packaging "setuptools<80.0.0" # buildkit
RUN |2 ROCM_MAJOR_VER=7 GFX=gfx1151 /bin/sh -c python -m pip install --index-url https://rocm.nightlies.amd.com/v2-staging/gfx1151/ --pre torch torchaudio torchvision # buildkit
WORKDIR /opt
COPY scripts/patch_aiter_headers.py /opt/patch_aiter_headers.py # buildkit
RUN |2 ROCM_MAJOR_VER=7 GFX=gfx1151 /bin/sh -c python -m pip install --upgrade cmake ninja packaging wheel numpy "setuptools-scm>=8" "setuptools<80.0.0" scikit-build-core pybind11 numba scipy # buildkit
ENV FLASH_ATTENTION_TRITON_AMD_ENABLE=TRUE
ENV LD_LIBRARY_PATH=/opt/rocm/lib:/opt/rocm/lib64:
RUN |2 ROCM_MAJOR_VER=7 GFX=gfx1151 /bin/sh -c git clone https://github.com/ROCm/flash-attention.git && cd flash-attention && git checkout main_perf && git submodule update --init third_party/aiter && cd third_party/aiter && git submodule update --init 3rdparty/composable_kernel && export CK_DIR="$(pwd)/3rdparty/composable_kernel" && python -m pip wheel --no-build-isolation --no-deps -w /tmp/dist -v . && python -m pip install --force-reinstall /tmp/dist/amd_aiter*.whl && python /opt/patch_aiter_headers.py && cd /opt/flash-attention && python -c "import re; f=open('setup.py','r'); t=f.read(); f.close(); t=re.sub(r'subprocess\.run\([\s\S]*?third_party/aiter[\s\S]*?check=True,\s*\)', 'pass # patched', t); f=open('setup.py','w'); f.write(t)" && pip install --no-build-isolation --no-deps . && cd /opt && rm -rf /opt/flash-attention /opt/patch_aiter_headers.py # buildkit
RUN |2 ROCM_MAJOR_VER=7 GFX=gfx1151 /bin/sh -c if [ -d /opt/venv/lib/python3.12/site-packages/aiter ]; then cp -rn /opt/venv/lib/python3.12/site-packages/aiter/* /opt/venv/lib64/python3.12/site-packages/aiter/ 2>/dev/null || true; rm -rf /opt/venv/lib/python3.12/site-packages/aiter; fi # buildkit
ARG VLLM_COMMIT=6ef1efd51f11106fc44deb9e7b2f5cd1247fc37e
RUN |3 ROCM_MAJOR_VER=7 GFX=gfx1151 VLLM_COMMIT=6ef1efd51f11106fc44deb9e7b2f5cd1247fc37e /bin/sh -c git clone https://github.com/vllm-project/vllm.git /opt/vllm # buildkit
WORKDIR /opt/vllm
RUN |3 ROCM_MAJOR_VER=7 GFX=gfx1151 VLLM_COMMIT=6ef1efd51f11106fc44deb9e7b2f5cd1247fc37e /bin/sh -c if [ -n "$VLLM_COMMIT" ]; then echo "Pinning vLLM to commit $VLLM_COMMIT" && git checkout "$VLLM_COMMIT"; fi # buildkit
COPY scripts/patch_strix.py /opt/vllm/patch_strix.py # buildkit
RUN |3 ROCM_MAJOR_VER=7 GFX=gfx1151 VLLM_COMMIT=6ef1efd51f11106fc44deb9e7b2f5cd1247fc37e /bin/sh -c python /opt/vllm/patch_strix.py # buildkit
ENV ROCM_HOME=/opt/rocm
ENV HIP_PATH=/opt/rocm
ENV VLLM_TARGET_DEVICE=rocm
ENV PYTORCH_ROCM_ARCH=gfx1151
ENV HIP_ARCHITECTURES=gfx1151
ENV AMDGPU_TARGETS=gfx1151
ENV MAX_JOBS=4
ENV CC=/opt/rocm/llvm/bin/clang
ENV CXX=/opt/rocm/llvm/bin/clang++
RUN |3 ROCM_MAJOR_VER=7 GFX=gfx1151 VLLM_COMMIT=6ef1efd51f11106fc44deb9e7b2f5cd1247fc37e /bin/sh -c export HIP_DEVICE_LIB_PATH=$(find /opt/rocm -type d -name bitcode -print -quit) && echo "Compiling with Bitcode: $HIP_DEVICE_LIB_PATH" && export CMAKE_ARGS="-DROCM_PATH=/opt/rocm -DHIP_PATH=/opt/rocm -DAMDGPU_TARGETS=gfx1151 -DHIP_ARCHITECTURES=gfx1151" && python -m pip wheel --no-build-isolation --no-deps -w /tmp/dist -v . && python -m pip install /tmp/dist/*.whl # buildkit
RUN |3 ROCM_MAJOR_VER=7 GFX=gfx1151 VLLM_COMMIT=6ef1efd51f11106fc44deb9e7b2f5cd1247fc37e /bin/sh -c python -m pip install ray # buildkit
WORKDIR /opt
RUN |3 ROCM_MAJOR_VER=7 GFX=gfx1151 VLLM_COMMIT=6ef1efd51f11106fc44deb9e7b2f5cd1247fc37e /bin/sh -c git clone -b rocm_enabled_multi_backend https://github.com/ROCm/bitsandbytes.git # buildkit
WORKDIR /opt/bitsandbytes
ENV HIP_PLATFORM=amd
ENV CMAKE_PREFIX_PATH=/opt/rocm
RUN |3 ROCM_MAJOR_VER=7 GFX=gfx1151 VLLM_COMMIT=6ef1efd51f11106fc44deb9e7b2f5cd1247fc37e /bin/sh -c cmake -S . -DGPU_TARGETS="gfx1151" -DBNB_ROCM_ARCH="gfx1151" -DCOMPUTE_BACKEND=hip -DCMAKE_HIP_COMPILER=/opt/rocm/llvm/bin/clang++ -DCMAKE_CXX_COMPILER=/opt/rocm/llvm/bin/clang++ && make -j$(nproc) && python -m pip install --no-cache-dir . --no-build-isolation --no-deps # buildkit
WORKDIR /opt
RUN |3 ROCM_MAJOR_VER=7 GFX=gfx1151 VLLM_COMMIT=6ef1efd51f11106fc44deb9e7b2f5cd1247fc37e /bin/sh -c find /opt/venv -type f -name "*.so" -exec strip -s {} + 2>/dev/null || true && find /opt/venv -type d -name "__pycache__" -prune -exec rm -rf {} + && rm -rf /root/.cache/pip || true && dnf clean all && rm -rf /var/cache/dnf/* # buildkit
COPY scripts/01-rocm-env-for-triton.sh /etc/profile.d/01-rocm-env-for-triton.sh # buildkit
COPY scripts/99-toolbox-banner.sh /etc/profile.d/99-toolbox-banner.sh # buildkit
COPY scripts/zz-venv-last.sh /etc/profile.d/zz-venv-last.sh # buildkit
COPY scripts/start_vllm.py /opt/start-vllm # buildkit
COPY scripts/start_vllm_cluster.py /opt/start-vllm-cluster # buildkit
COPY scripts/measure_bandwidth.sh /opt/measure_bandwidth.sh # buildkit
COPY scripts/cluster_manager.py /opt/cluster_manager.py # buildkit
COPY scripts/models.py /opt/models.py # buildkit
COPY benchmarks/max_context_results.json /opt/max_context_results.json # buildkit
COPY benchmarks/bench_utils.py /opt/bench_utils.py # buildkit
COPY benchmarks/run_vllm_bench.py /opt/run_vllm_bench.py # buildkit
COPY benchmarks/vllm_cluster_bench.py /opt/vllm_cluster_bench.py # buildkit
COPY benchmarks/find_max_context.py /opt/find_max_context.py # buildkit
COPY rdma_cluster/compare_eth_vs_rdma.sh /opt/compare_eth_vs_rdma.sh # buildkit
COPY scripts/configure_cluster.sh /opt/configure_cluster.sh # buildkit
RUN |3 ROCM_MAJOR_VER=7 GFX=gfx1151 VLLM_COMMIT=6ef1efd51f11106fc44deb9e7b2f5cd1247fc37e /bin/sh -c chmod +x /opt/configure_cluster.sh # buildkit
RUN |3 ROCM_MAJOR_VER=7 GFX=gfx1151 VLLM_COMMIT=6ef1efd51f11106fc44deb9e7b2f5cd1247fc37e /bin/sh -c chmod +x /opt/start-vllm /opt/start-vllm-cluster /opt/vllm_cluster_bench.py /opt/compare_eth_vs_rdma.sh /opt/find_max_context.py /opt/run_vllm_bench.py && ln -s /opt/start-vllm /usr/local/bin/start-vllm && ln -s /opt/start-vllm-cluster /usr/local/bin/start-vllm-cluster && chmod 0644 /etc/profile.d/*.sh /opt/max_context_results.json /opt/models.py # buildkit
RUN |3 ROCM_MAJOR_VER=7 GFX=gfx1151 VLLM_COMMIT=6ef1efd51f11106fc44deb9e7b2f5cd1247fc37e /bin/sh -c chmod 0644 /etc/profile.d/*.sh # buildkit
RUN |3 ROCM_MAJOR_VER=7 GFX=gfx1151 VLLM_COMMIT=6ef1efd51f11106fc44deb9e7b2f5cd1247fc37e /bin/sh -c printf 'ulimit -S -c 0\n' > /etc/profile.d/90-nocoredump.sh && chmod 0644 /etc/profile.d/90-nocoredump.sh # buildkit
CMD ["/bin/bash"]

Labels

Key Value
io.buildah.version 1.43.1
license MIT
name fedora
org.opencontainers.image.license MIT
org.opencontainers.image.licenses MIT
org.opencontainers.image.name fedora
org.opencontainers.image.title fedora
org.opencontainers.image.url https://fedoraproject.org/
org.opencontainers.image.vendor Fedora Project
org.opencontainers.image.version 43
vendor Fedora Project
version 43
Details
Container
2026-04-18 18:26:37 +02:00
2
OCI / Docker
linux/amd64
MIT
7.3 GiB
Versions (8) View all