Updating toolboxes with a two-stage build process to reduce size

This commit is contained in:
Donato Capitella
2025-08-16 10:21:59 +01:00
parent 551d14b11d
commit ca0800bd01
9 changed files with 492 additions and 209 deletions
+43 -23
View File
@@ -1,38 +1,58 @@
FROM fedora:rawhide # build
FROM registry.fedoraproject.org/fedora:rawhide AS builder
# Install build dependencies and tools # deps + rocm toolchain
RUN dnf install -y \ RUN dnf -y --nodocs --setopt=install_weak_deps=False install \
make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \ make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \
rocminfo radeontop 'rocm-*' 'rocblas-*' 'hipblas' 'hipblas-*' \ rocminfo radeontop 'rocm-*' 'rocblas-*' hipblas 'hipblas-*' \
git vim \ git vim rsync sudo tar xz \
&& dnf clean all && dnf clean all && rm -rf /var/cache/dnf/*
# Set up working directory # llama.cpp
WORKDIR /opt/llama.cpp WORKDIR /opt/llama.cpp
# Clone llama.cpp repository (with submodules)
RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git . RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git .
# Build llama.cpp with HIP support # build + install
RUN git clean -xdf \ RUN git clean -xdf \
&& git pull \ && git pull \
&& git submodule update --recursive \ && git submodule update --recursive \
&& \ && HIPCXX="$(hipconfig -l)/clang" HIP_PATH="$(hipconfig -R)" \
# Configure and compile with HIP toolchain cmake -S . -B build \
HIPCXX="$(hipconfig -l)/clang" HIP_PATH="$(hipconfig -R)" \ -DGGML_HIP=ON \
cmake -S . -B build \ -DAMDGPU_TARGETS=gfx1151 \
-DGGML_HIP=ON \ -DCMAKE_BUILD_TYPE=Release \
-DAMDGPU_TARGETS=gfx1151 \ -DLLAMA_HIP_UMA=ON \
-DCMAKE_BUILD_TYPE=Release \ && cmake --build build --config Release -- -j$(nproc) \
-DLLAMA_HIP_UMA=ON \ && cmake --install build --config Release
&& cmake --build build --config Release -- -j$(nproc) \
&& cmake --install build --config Release
# make ld see libllama in builder too (kept same step)
RUN find /opt/llama.cpp/build -type f -name 'lib*.so*' -exec cp {} /usr/lib64/ \; \ RUN find /opt/llama.cpp/build -type f -name 'lib*.so*' -exec cp {} /usr/lib64/ \; \
&& ldconfig && ldconfig
# runtime stage: small Fedora image that receives only the installed llama.cpp artifacts
FROM registry.fedoraproject.org/fedora-minimal:rawhide

# ROCm / hipBLAS runtime packages (same package set as the builder, minus the compiler toolchain).
# The package-manager cache is removed in the same layer so it never lands in the image.
RUN microdnf -y --nodocs --setopt=install_weak_deps=0 install \
      bash ca-certificates libatomic libstdc++ libgcc \
      rocminfo radeontop 'rocm-*' 'rocblas-*' hipblas 'hipblas-*' \
 && microdnf clean all && rm -rf /var/cache/dnf/*

# Everything the builder's `cmake --install` step placed under /usr/local.
# /usr/include/rocwmma is deliberately NOT copied in this variant: no step in this file's
# builder stage creates that directory, and COPY aborts the build when its source is missing
# (TODO confirm no installed package provides it before re-adding the line).
COPY --from=builder /usr/local/ /usr/local/

# Register /usr/local/lib{,64} with the dynamic linker, then best-effort mirror libllama into
# /usr/lib64. Only the optional `cp` is allowed to fail: the subshell keeps `|| true` from
# also swallowing a failure of the echo/ldconfig steps that precede it in the && chain.
RUN echo "/usr/local/lib" > /etc/ld.so.conf.d/local.conf \
 && echo "/usr/local/lib64" >> /etc/ld.so.conf.d/local.conf \
 && ldconfig \
 && ( cp -n /usr/local/lib/libllama*.so* /usr/lib64/ 2>/dev/null || true ) \
 && ldconfig
# helper
COPY gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py COPY gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py
RUN chmod +x /usr/local/bin/gguf-vram-estimator.py RUN chmod +x /usr/local/bin/gguf-vram-estimator.py
# Default to interactive shell # shell
CMD ["/bin/bash"] CMD ["/bin/bash"]
+46 -26
View File
@@ -1,45 +1,65 @@
FROM fedora:rawhide # build
FROM registry.fedoraproject.org/fedora:rawhide AS builder
# Install build dependencies and tools # deps + rocm toolchain
RUN dnf install -y \ RUN dnf -y --nodocs --setopt=install_weak_deps=False install \
make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \ make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \
rocminfo radeontop 'rocm-*' 'rocblas-*' 'hipblas' 'hipblas-*' \ rocminfo radeontop 'rocm-*' 'rocblas-*' hipblas 'hipblas-*' \
git vim rsync \ git vim rsync sudo tar xz \
&& dnf clean all && dnf clean all && rm -rf /var/cache/dnf/*
# rocWMMA headers
WORKDIR /opt/ WORKDIR /opt
RUN git clone -b release/rocm-rel-7.0 https://github.com/ROCm/rocWMMA.git RUN git clone -b release/rocm-rel-7.0 https://github.com/ROCm/rocWMMA.git
RUN sudo mkdir -p /usr/include/rocwmma RUN sudo mkdir -p /usr/include/rocwmma
RUN sudo rsync -a rocWMMA/library/include/rocwmma/ /usr/include/rocwmma/ RUN sudo rsync -a rocWMMA/library/include/rocwmma/ /usr/include/rocwmma/
# Set up working directory # llama.cpp
WORKDIR /opt/llama.cpp WORKDIR /opt/llama.cpp
# Clone llama.cpp repository (with submodules)
RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git . RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git .
# Build llama.cpp with HIP support # build + install
RUN git clean -xdf \ RUN git clean -xdf \
&& git pull \ && git pull \
&& git submodule update --recursive \ && git submodule update --recursive \
&& \ && HIPCXX="$(hipconfig -l)/clang" HIP_PATH="$(hipconfig -R)" \
# Configure and compile with HIP toolchain cmake -S . -B build \
HIPCXX="$(hipconfig -l)/clang" HIP_PATH="$(hipconfig -R)" \ -DGGML_HIP=ON \
cmake -S . -B build \ -DAMDGPU_TARGETS=gfx1151 \
-DGGML_HIP=ON \ -DCMAKE_BUILD_TYPE=Release \
-DAMDGPU_TARGETS=gfx1151 \ -DLLAMA_HIP_UMA=ON \
-DCMAKE_BUILD_TYPE=Release \ -DGGML_HIP_ROCWMMA_FATTN=ON \
-DLLAMA_HIP_UMA=ON \ && cmake --build build --config Release -- -j$(nproc) \
-DGGML_HIP_ROCWMMA_FATTN=ON \ && cmake --install build --config Release
&& cmake --build build --config Release -- -j$(nproc) \
&& cmake --install build --config Release
# make ld see libllama in builder too (kept same step)
RUN find /opt/llama.cpp/build -type f -name 'lib*.so*' -exec cp {} /usr/lib64/ \; \ RUN find /opt/llama.cpp/build -type f -name 'lib*.so*' -exec cp {} /usr/lib64/ \; \
&& ldconfig && ldconfig
# runtime stage: small Fedora image that receives only the installed llama.cpp artifacts
FROM registry.fedoraproject.org/fedora-minimal:rawhide

# ROCm / hipBLAS runtime packages (same package set as the builder, minus the compiler toolchain).
# The package-manager cache is removed in the same layer so it never lands in the image.
RUN microdnf -y --nodocs --setopt=install_weak_deps=0 install \
      bash ca-certificates libatomic libstdc++ libgcc \
      rocminfo radeontop 'rocm-*' 'rocblas-*' hipblas 'hipblas-*' \
 && microdnf clean all && rm -rf /var/cache/dnf/*

# Everything the builder's `cmake --install` step placed under /usr/local
COPY --from=builder /usr/local/ /usr/local/
# rocWMMA headers that the builder stage synced into /usr/include/rocwmma
COPY --from=builder /usr/include/rocwmma /usr/include/rocwmma

# Register /usr/local/lib{,64} with the dynamic linker, then best-effort mirror libllama into
# /usr/lib64. Only the optional `cp` is allowed to fail: the subshell keeps `|| true` from
# also swallowing a failure of the echo/ldconfig steps that precede it in the && chain.
RUN echo "/usr/local/lib" > /etc/ld.so.conf.d/local.conf \
 && echo "/usr/local/lib64" >> /etc/ld.so.conf.d/local.conf \
 && ldconfig \
 && ( cp -n /usr/local/lib/libllama*.so* /usr/lib64/ 2>/dev/null || true ) \
 && ldconfig
# helper
COPY gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py COPY gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py
RUN chmod +x /usr/local/bin/gguf-vram-estimator.py RUN chmod +x /usr/local/bin/gguf-vram-estimator.py
# Default to interactive shell # shell
CMD ["/bin/bash"] CMD ["/bin/bash"]
+67 -31
View File
@@ -1,7 +1,8 @@
FROM fedora:rawhide # build stage
FROM registry.fedoraproject.org/fedora:rawhide AS builder
# getting Rocm6.4.3 repos # rocm 6.4.3 repo
RUN <<EOF RUN <<'EOF'
tee /etc/yum.repos.d/rocm.repo <<REPO tee /etc/yum.repos.d/rocm.repo <<REPO
[ROCm-6.4.3] [ROCm-6.4.3]
name=ROCm6.4.3 name=ROCm6.4.3
@@ -11,48 +12,83 @@ priority=50
gpgcheck=1 gpgcheck=1
gpgkey=https://repo.radeon.com/rocm/rocm.gpg.key gpgkey=https://repo.radeon.com/rocm/rocm.gpg.key
REPO REPO
EOF EOF
# Install build dependencies and tools # deps
RUN dnf install -y \ RUN dnf -y --nodocs --setopt=install_weak_deps=False install \
make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \ make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \
rocm rocminfo radeontop \ rocm rocminfo radeontop \
git vim \ git vim sudo rsync \
&& dnf clean all && dnf clean all && rm -rf /var/cache/dnf/*
# Set up working directory # llama.cpp
WORKDIR /opt/llama.cpp WORKDIR /opt/llama.cpp
# Clone llama.cpp repository (with submodules)
RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git . RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git .
# Build llama.cpp with HIP support # build
RUN git clean -xdf \ RUN git clean -xdf \
&& git pull \ && git pull \
&& git submodule update --recursive \ && git submodule update --recursive \
&& \ && HIPCXX="$(hipconfig -l)/clang" HIP_PATH="$(hipconfig -R)" \
# Configure and compile with HIP toolchain cmake -S . -B build \
HIPCXX="$(hipconfig -l)/clang" HIP_PATH="$(hipconfig -R)" \ -DGGML_HIP=ON \
cmake -S . -B build \ -DAMDGPU_TARGETS=gfx1151 \
-DGGML_HIP=ON \ -DCMAKE_BUILD_TYPE=Release \
-DAMDGPU_TARGETS=gfx1151 \ -DLLAMA_HIP_UMA=ON \
-DCMAKE_BUILD_TYPE=Release \ && cmake --build build --config Release -- -j$(nproc) \
-DLLAMA_HIP_UMA=ON \ && cmake --install build --config Release
&& cmake --build build --config Release -- -j$(nproc) \
&& cmake --install build --config Release
# libs
RUN find /opt/llama.cpp/build -type f -name 'lib*.so*' -exec cp {} /usr/lib64/ \; \ RUN find /opt/llama.cpp/build -type f -name 'lib*.so*' -exec cp {} /usr/lib64/ \; \
&& ldconfig && ldconfig
RUN printf '%s\n' \ # helper
'export ROCBLAS_USE_HIPBLASLT=1' \
> /etc/profile.d/rocm.sh \
&& chmod +x /etc/profile.d/rocm.sh \
&& echo 'source /etc/profile.d/rocm.sh' >> /etc/bashrc
COPY gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py COPY gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py
RUN chmod +x /usr/local/bin/gguf-vram-estimator.py RUN chmod +x /usr/local/bin/gguf-vram-estimator.py
# Default to interactive shell
# runtime stage: small Fedora image that receives only the installed llama.cpp artifacts
FROM registry.fedoraproject.org/fedora-minimal:rawhide

# AMD ROCm 6.4.3 package repository (EL9 build), needed to install the ROCm runtime below.
# `set -e` makes the RUN step fail as soon as any command in the heredoc script fails.
RUN <<'EOF'
set -e
tee /etc/yum.repos.d/rocm.repo <<REPO
[ROCm-6.4.3]
name=ROCm6.4.3
baseurl=https://repo.radeon.com/rocm/el9/6.4.3/main
enabled=1
priority=50
gpgcheck=1
gpgkey=https://repo.radeon.com/rocm/rocm.gpg.key
REPO
EOF

# Runtime packages; the package-manager cache is removed in the same layer
RUN microdnf -y --nodocs --setopt=install_weak_deps=0 install \
      bash ca-certificates libatomic libstdc++ libgcc \
      rocm rocminfo radeontop \
 && microdnf clean all && rm -rf /var/cache/dnf/*

# Everything the builder's `cmake --install` step placed under /usr/local.
# /usr/include/rocwmma is deliberately NOT copied in this variant: no step in this file's
# builder stage creates that directory, and COPY aborts the build when its source is missing
# (TODO confirm no installed package provides it before re-adding the line).
COPY --from=builder /usr/local/ /usr/local/

# Register /usr/local/lib{,64} with the dynamic linker, then best-effort mirror libllama into
# /usr/lib64. Only the optional `cp` is allowed to fail: the subshell keeps `|| true` from
# also swallowing a failure of the echo/ldconfig steps that precede it in the && chain.
RUN echo "/usr/local/lib" > /etc/ld.so.conf.d/local.conf \
 && echo "/usr/local/lib64" >> /etc/ld.so.conf.d/local.conf \
 && ldconfig \
 && ( cp -n /usr/local/lib/libllama*.so* /usr/lib64/ 2>/dev/null || true ) \
 && ldconfig

# VRAM estimator helper, copied executable in one layer instead of COPY + RUN chmod
COPY --chmod=0755 gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py

# Make shells export ROCBLAS_USE_HIPBLASLT=1 (ensures hipBLASLt is used): the variable is
# written to a profile.d snippet, which is additionally sourced from /etc/bashrc.
RUN printf '%s\n' \
      'export ROCBLAS_USE_HIPBLASLT=1' \
      > /etc/profile.d/rocm.sh \
 && chmod +x /etc/profile.d/rocm.sh \
 && echo 'source /etc/profile.d/rocm.sh' >> /etc/bashrc
# shell
CMD ["/bin/bash"] CMD ["/bin/bash"]
+66 -30
View File
@@ -1,7 +1,8 @@
FROM fedora:rawhide # build stage
FROM registry.fedoraproject.org/fedora:rawhide AS builder
# getting Rocm6.4.3 repos # rocm 6.4.3 repo
RUN <<EOF RUN <<'EOF'
tee /etc/yum.repos.d/rocm.repo <<REPO tee /etc/yum.repos.d/rocm.repo <<REPO
[ROCm-6.4.3] [ROCm-6.4.3]
name=ROCm6.4.3 name=ROCm6.4.3
@@ -11,55 +12,90 @@ priority=50
gpgcheck=1 gpgcheck=1
gpgkey=https://repo.radeon.com/rocm/rocm.gpg.key gpgkey=https://repo.radeon.com/rocm/rocm.gpg.key
REPO REPO
EOF EOF
# Install build dependencies and tools # deps
RUN dnf install -y \ RUN dnf -y --nodocs --setopt=install_weak_deps=False install \
make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \ make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \
rocm rocminfo radeontop \ rocm rocminfo radeontop \
git vim \ git vim sudo rsync \
&& dnf clean all && dnf clean all && rm -rf /var/cache/dnf/*
# rocWMMA
WORKDIR /opt/ WORKDIR /opt
RUN git clone -b release/rocm-rel-7.0 https://github.com/ROCm/rocWMMA.git RUN git clone -b release/rocm-rel-7.0 https://github.com/ROCm/rocWMMA.git
RUN sudo mkdir -p /usr/include/rocwmma RUN sudo mkdir -p /usr/include/rocwmma
RUN sudo cp -r rocWMMA/library/include/rocwmma /usr/include/ RUN sudo cp -r rocWMMA/library/include/rocwmma /usr/include/
# Set up working directory # llama.cpp
WORKDIR /opt/llama.cpp WORKDIR /opt/llama.cpp
# Clone llama.cpp repository (with submodules)
RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git . RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git .
# Build llama.cpp with HIP support # build
RUN git clean -xdf \ RUN git clean -xdf \
&& git pull \ && git pull \
&& git submodule update --recursive \ && git submodule update --recursive \
&& \ && HIPCXX="$(hipconfig -l)/clang" HIP_PATH="$(hipconfig -R)" \
# Configure and compile with HIP toolchain cmake -S . -B build \
HIPCXX="$(hipconfig -l)/clang" HIP_PATH="$(hipconfig -R)" \ -DGGML_HIP=ON \
cmake -S . -B build \ -DAMDGPU_TARGETS=gfx1151 \
-DGGML_HIP=ON \ -DCMAKE_BUILD_TYPE=Release \
-DAMDGPU_TARGETS=gfx1151 \ -DLLAMA_HIP_UMA=ON \
-DCMAKE_BUILD_TYPE=Release \ -DGGML_HIP_ROCWMMA_FATTN=ON \
-DLLAMA_HIP_UMA=ON \ && cmake --build build --config Release -- -j$(nproc) \
-DGGML_HIP_ROCWMMA_FATTN=ON \ && cmake --install build --config Release
&& cmake --build build --config Release -- -j$(nproc) \
&& cmake --install build --config Release
# libs
RUN find /opt/llama.cpp/build -type f -name 'lib*.so*' -exec cp {} /usr/lib64/ \; \ RUN find /opt/llama.cpp/build -type f -name 'lib*.so*' -exec cp {} /usr/lib64/ \; \
&& ldconfig && ldconfig
# helper
COPY gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py COPY gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py
RUN chmod +x /usr/local/bin/gguf-vram-estimator.py RUN chmod +x /usr/local/bin/gguf-vram-estimator.py
# runtime stage: small Fedora image that receives only the installed llama.cpp artifacts
FROM registry.fedoraproject.org/fedora-minimal:rawhide

# AMD ROCm 6.4.3 package repository (EL9 build), needed to install the ROCm runtime below.
# `set -e` makes the RUN step fail as soon as any command in the heredoc script fails.
RUN <<'EOF'
set -e
tee /etc/yum.repos.d/rocm.repo <<REPO
[ROCm-6.4.3]
name=ROCm6.4.3
baseurl=https://repo.radeon.com/rocm/el9/6.4.3/main
enabled=1
priority=50
gpgcheck=1
gpgkey=https://repo.radeon.com/rocm/rocm.gpg.key
REPO
EOF

# Runtime packages; the package-manager cache is removed in the same layer
RUN microdnf -y --nodocs --setopt=install_weak_deps=0 install \
      bash ca-certificates libatomic libstdc++ libgcc \
      rocm rocminfo radeontop \
 && microdnf clean all && rm -rf /var/cache/dnf/*

# Everything the builder's `cmake --install` step placed under /usr/local
COPY --from=builder /usr/local/ /usr/local/
# rocWMMA headers that the builder stage copied into /usr/include/rocwmma
COPY --from=builder /usr/include/rocwmma /usr/include/rocwmma

# Register /usr/local/lib{,64} with the dynamic linker, then best-effort mirror libllama into
# /usr/lib64. Only the optional `cp` is allowed to fail: the subshell keeps `|| true` from
# also swallowing a failure of the echo/ldconfig steps that precede it in the && chain.
RUN echo "/usr/local/lib" > /etc/ld.so.conf.d/local.conf \
 && echo "/usr/local/lib64" >> /etc/ld.so.conf.d/local.conf \
 && ldconfig \
 && ( cp -n /usr/local/lib/libllama*.so* /usr/lib64/ 2>/dev/null || true ) \
 && ldconfig

# VRAM estimator helper, copied executable in one layer instead of COPY + RUN chmod
COPY --chmod=0755 gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py
# profile
RUN printf '%s\n' \ RUN printf '%s\n' \
'export ROCBLAS_USE_HIPBLASLT=1' \ 'export ROCBLAS_USE_HIPBLASLT=1' \
> /etc/profile.d/rocm.sh \ > /etc/profile.d/rocm.sh && chmod +x /etc/profile.d/rocm.sh \
&& chmod +x /etc/profile.d/rocm.sh \
&& echo 'source /etc/profile.d/rocm.sh' >> /etc/bashrc && echo 'source /etc/profile.d/rocm.sh' >> /etc/bashrc
# Default to interactive shell # shell
CMD ["/bin/bash"] CMD ["/bin/bash"]
+71 -27
View File
@@ -1,7 +1,8 @@
FROM fedora:rawhide # build stage
FROM registry.fedoraproject.org/fedora:rawhide AS builder
# getting Rocm7 repos # rocm 7.0 repos
RUN <<EOF RUN <<'EOF'
tee /etc/yum.repos.d/rocm.repo <<REPO tee /etc/yum.repos.d/rocm.repo <<REPO
[ROCm-7.0.0] [ROCm-7.0.0]
name=ROCm7.0.0 name=ROCm7.0.0
@@ -21,49 +22,92 @@ priority=50
gpgcheck=1 gpgcheck=1
gpgkey=https://repo.radeon.com/rocm/rocm.gpg.key gpgkey=https://repo.radeon.com/rocm/rocm.gpg.key
REPO REPO
EOF EOF
# Install build dependencies and tools # deps
RUN dnf install -y \ RUN dnf -y --nodocs --setopt=install_weak_deps=False install \
make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \ make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \
rocm rocminfo radeontop \ rocm rocminfo radeontop \
git vim \ git vim \
&& dnf clean all && dnf clean all && rm -rf /var/cache/dnf/*
# Set up working directory # llama.cpp
WORKDIR /opt/llama.cpp WORKDIR /opt/llama.cpp
# Clone llama.cpp repository (with submodules)
RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git . RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git .
# Build llama.cpp with HIP support # build
RUN git clean -xdf \ RUN git clean -xdf \
&& git pull \ && git pull \
&& git submodule update --recursive \ && git submodule update --recursive \
&& \ && HIPCXX="$(hipconfig -l)/clang" HIP_PATH="$(hipconfig -R)" \
# Configure and compile with HIP toolchain cmake -S . -B build \
HIPCXX="$(hipconfig -l)/clang" HIP_PATH="$(hipconfig -R)" \ -DGGML_HIP=ON \
cmake -S . -B build \ -DAMDGPU_TARGETS=gfx1151 \
-DGGML_HIP=ON \ -DCMAKE_BUILD_TYPE=Release \
-DAMDGPU_TARGETS=gfx1151 \ -DLLAMA_HIP_UMA=ON \
-DCMAKE_BUILD_TYPE=Release \ && cmake --build build --config Release -- -j$(nproc) \
-DLLAMA_HIP_UMA=ON \ && cmake --install build --config Release
&& cmake --build build --config Release -- -j$(nproc) \
&& cmake --install build --config Release
# libs
RUN find /opt/llama.cpp/build -type f -name 'lib*.so*' -exec cp {} /usr/lib64/ \; \ RUN find /opt/llama.cpp/build -type f -name 'lib*.so*' -exec cp {} /usr/lib64/ \; \
&& ldconfig && ldconfig
# helper
COPY gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py COPY gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py
RUN chmod +x /usr/local/bin/gguf-vram-estimator.py RUN chmod +x /usr/local/bin/gguf-vram-estimator.py
# Ensure we are using hipblaslt
# runtime stage: small Fedora image that receives only the installed llama.cpp artifacts
FROM registry.fedoraproject.org/fedora-minimal:rawhide

# AMD ROCm 7.0 beta repositories (core + graphics), needed to install the ROCm runtime below.
# `set -e` is required here: the script runs two commands, and without it a failure while
# writing the first repo file would be hidden by the exit status of the second `tee`.
RUN <<'EOF'
set -e
tee /etc/yum.repos.d/rocm.repo <<REPO
[ROCm-7.0.0]
name=ROCm7.0.0
baseurl=https://repo.radeon.com/rocm/el9/7.0_beta/main
enabled=1
priority=50
gpgcheck=1
gpgkey=https://repo.radeon.com/rocm/rocm.gpg.key
REPO
tee /etc/yum.repos.d/rocm-graphics.repo <<REPO
[ROCm-7.0.0-Graphics]
name=ROCm7.0.0-Graphics
baseurl=https://repo.radeon.com/graphics/7.0_beta/rhel/9/main/x86_64/
enabled=1
priority=50
gpgcheck=1
gpgkey=https://repo.radeon.com/rocm/rocm.gpg.key
REPO
EOF

# Runtime packages; the package-manager cache is removed in the same layer
RUN microdnf -y --nodocs --setopt=install_weak_deps=0 install \
      bash ca-certificates libatomic libstdc++ libgcc \
      rocm rocminfo radeontop \
 && microdnf clean all && rm -rf /var/cache/dnf/*

# Everything the builder's `cmake --install` step placed under /usr/local
COPY --from=builder /usr/local/ /usr/local/

# Register /usr/local/lib{,64} with the dynamic linker, then best-effort mirror libllama into
# /usr/lib64. Only the optional `cp` is allowed to fail: the subshell keeps `|| true` from
# also swallowing a failure of the echo/ldconfig steps that precede it in the && chain.
RUN echo "/usr/local/lib" > /etc/ld.so.conf.d/local.conf \
 && echo "/usr/local/lib64" >> /etc/ld.so.conf.d/local.conf \
 && ldconfig \
 && ( cp -n /usr/local/lib/libllama*.so* /usr/lib64/ 2>/dev/null || true ) \
 && ldconfig

# VRAM estimator helper, copied executable in one layer instead of COPY + RUN chmod
COPY --chmod=0755 gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py
# profile
RUN printf '%s\n' \ RUN printf '%s\n' \
'export ROCBLAS_USE_HIPBLASLT=1' \ 'export ROCBLAS_USE_HIPBLASLT=1' \
> /etc/profile.d/rocm.sh \ > /etc/profile.d/rocm.sh && chmod +x /etc/profile.d/rocm.sh \
&& chmod +x /etc/profile.d/rocm.sh \
&& echo 'source /etc/profile.d/rocm.sh' >> /etc/bashrc && echo 'source /etc/profile.d/rocm.sh' >> /etc/bashrc
# Default to interactive shell # shell
CMD ["/bin/bash"] CMD ["/bin/bash"]
+58 -22
View File
@@ -1,21 +1,17 @@
FROM fedora:rawhide # build
FROM registry.fedoraproject.org/fedora:rawhide AS builder
# 1) Install dependencies RUN dnf -y --nodocs --setopt=install_weak_deps=False install \
RUN dnf install -y \
make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \ make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \
radeontop git vim patch curl \ radeontop git vim patch curl ninja-build tar xz \
&& dnf clean all && dnf clean all && rm -rf /var/cache/dnf/*
# 2) Download ROCm nightly tarball
WORKDIR /tmp WORKDIR /tmp
RUN curl -L -o therock.tar.gz \ RUN curl -L -o therock.tar.gz \
https://therock-nightly-tarball.s3.amazonaws.com/therock-dist-linux-gfx1151-7.0.0rc20250811.tar.gz https://therock-nightly-tarball.s3.amazonaws.com/therock-dist-linux-gfx1151-7.0.0rc20250811.tar.gz
# 3) Extract into /opt/rocm-7.0
RUN mkdir -p /opt/rocm-7.0 \ RUN mkdir -p /opt/rocm-7.0 \
&& tar xvf therock.tar.gz -C /opt/rocm-7.0 --strip-components=1 && tar xzf therock.tar.gz -C /opt/rocm-7.0 --strip-components=1
# 4) Bake in ROCm env + full system PATH
ENV ROCM_PATH=/opt/rocm-7.0 \ ENV ROCM_PATH=/opt/rocm-7.0 \
HIP_PLATFORM=amd \ HIP_PLATFORM=amd \
HIP_PATH=/opt/rocm-7.0 \ HIP_PATH=/opt/rocm-7.0 \
@@ -29,7 +25,6 @@ ENV ROCM_PATH=/opt/rocm-7.0 \
CPATH=/opt/rocm-7.0/include \ CPATH=/opt/rocm-7.0/include \
PKG_CONFIG_PATH=/opt/rocm-7.0/lib/pkgconfig PKG_CONFIG_PATH=/opt/rocm-7.0/lib/pkgconfig
# 5) profile.d snippet for login & interactive shells
RUN printf '%s\n' \ RUN printf '%s\n' \
'export ROCM_PATH=/opt/rocm-7.0' \ 'export ROCM_PATH=/opt/rocm-7.0' \
'export HIP_PLATFORM=amd' \ 'export HIP_PLATFORM=amd' \
@@ -48,32 +43,73 @@ RUN printf '%s\n' \
&& chmod +x /etc/profile.d/rocm.sh \ && chmod +x /etc/profile.d/rocm.sh \
&& echo 'source /etc/profile.d/rocm.sh' >> /etc/bashrc && echo 'source /etc/profile.d/rocm.sh' >> /etc/bashrc
# 6) Clone llama.cpp
WORKDIR /opt/llama.cpp WORKDIR /opt/llama.cpp
RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git . \ RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git . \
&& git clean -xdf \ && git clean -xdf \
&& git submodule update --recursive && git submodule update --recursive
# 7) Copy in your external patch and apply
COPY hip-rocm7rc.patch /opt/llama.cpp/hip-rocm7rc.patch
RUN patch -p1 < hip-rocm7rc.patch
# 8) Configure, build & install llama.cpp with HIP
RUN cmake -S . -B build \ RUN cmake -S . -B build \
-DGGML_HIP=ON \ -DGGML_HIP=ON \
-DAMDGPU_TARGETS=gfx1151 \ -DAMDGPU_TARGETS=gfx1151 \
-DCMAKE_BUILD_TYPE=Release \ -DCMAKE_BUILD_TYPE=Release \
-DLLAMA_HIP_UMA=ON \ -DLLAMA_HIP_UMA=ON \
-DGGML_HIP_ROCWMMA_FATTN=ON \
&& cmake --build build --config Release -- -j$(nproc) \ && cmake --build build --config Release -- -j$(nproc) \
&& cmake --install build --config Release && cmake --install build --config Release
# 9) Copy the .so from build/bin into /usr/lib64 so ldconfig can see it # keep bin; drop headers/docs/static libs; drop source tree
RUN find /opt/llama.cpp/build -type f -name 'lib*.so*' -exec cp {} /usr/lib64/ \; \ RUN find /opt/rocm-7.0 -type f -name '*.a' -delete \
&& ldconfig && rm -rf /opt/rocm-7.0/include /opt/rocm-7.0/share \
/opt/rocm-7.0/llvm/include /opt/rocm-7.0/llvm/share \
&& rm -rf /opt/llama.cpp
# Final image: fedora-minimal plus the ROCm tree and the llama.cpp install taken from the builder
FROM registry.fedoraproject.org/fedora-minimal:rawhide

# Base libraries and a few interactive tools; the package cache is dropped in the same layer
RUN microdnf -y --nodocs --setopt=install_weak_deps=0 install \
      bash \
      ca-certificates \
      libatomic \
      libgcc \
      libstdc++ \
      radeontop \
      vim \
 && microdnf clean all \
 && rm -rf /var/cache/dnf/*

# ROCm tree under /opt/rocm-7.0, in the state the builder stage left it
COPY --from=builder /opt/rocm-7.0 /opt/rocm-7.0
# Everything the builder placed under /usr/local
COPY --from=builder /usr/local/ /usr/local/
# 10) Install helper script
COPY gguf-vram-estimator.py /usr/local/bin/ COPY gguf-vram-estimator.py /usr/local/bin/
RUN chmod +x /usr/local/bin/gguf-vram-estimator.py RUN chmod +x /usr/local/bin/gguf-vram-estimator.py
# 11) Default to interactive bash ENV ROCM_PATH=/opt/rocm-7.0 \
HIP_PLATFORM=amd \
HIP_PATH=/opt/rocm-7.0 \
HIP_CLANG_PATH=/opt/rocm-7.0/llvm/bin \
HIP_INCLUDE_PATH=/opt/rocm-7.0/include \
HIP_LIB_PATH=/opt/rocm-7.0/lib \
HIP_DEVICE_LIB_PATH=/opt/rocm-7.0/lib/llvm/amdgcn/bitcode \
PATH=/opt/rocm-7.0/bin:/opt/rocm-7.0/llvm/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin \
LD_LIBRARY_PATH=/opt/rocm-7.0/lib:/opt/rocm-7.0/lib64:/opt/rocm-7.0/llvm/lib \
LIBRARY_PATH=/opt/rocm-7.0/lib:/opt/rocm-7.0/lib64 \
CPATH=/opt/rocm-7.0/include \
PKG_CONFIG_PATH=/opt/rocm-7.0/lib/pkgconfig
# Write the ROCm environment to a profile.d snippet (one export per line) and have
# /etc/bashrc source it as well.
RUN { \
      echo 'export ROCM_PATH=/opt/rocm-7.0'; \
      echo 'export HIP_PLATFORM=amd'; \
      echo 'export HIP_PATH=/opt/rocm-7.0'; \
      echo 'export HIP_CLANG_PATH=/opt/rocm-7.0/llvm/bin'; \
      echo 'export HIP_INCLUDE_PATH=/opt/rocm-7.0/include'; \
      echo 'export HIP_LIB_PATH=/opt/rocm-7.0/lib'; \
      echo 'export HIP_DEVICE_LIB_PATH=/opt/rocm-7.0/lib/llvm/amdgcn/bitcode'; \
      echo 'export PATH="$ROCM_PATH/bin:$HIP_CLANG_PATH:$PATH"'; \
      echo 'export LD_LIBRARY_PATH="$HIP_LIB_PATH:$ROCM_PATH/lib:$ROCM_PATH/lib64:$ROCM_PATH/llvm/lib"'; \
      echo 'export LIBRARY_PATH="$HIP_LIB_PATH:$ROCM_PATH/lib:$ROCM_PATH/lib64"'; \
      echo 'export CPATH="$HIP_INCLUDE_PATH"'; \
      echo 'export PKG_CONFIG_PATH="$ROCM_PATH/lib/pkgconfig"'; \
      echo 'export ROCBLAS_USE_HIPBLASLT=1'; \
    } > /etc/profile.d/rocm.sh \
 && chmod +x /etc/profile.d/rocm.sh \
 && echo 'source /etc/profile.d/rocm.sh' >> /etc/bashrc

# Add /usr/local/lib and /usr/local/lib64 to the dynamic linker search path via ld.so.conf.d
# (rather than through environment variables) and rebuild the linker cache.
RUN printf '%s\n' /usr/local/lib /usr/local/lib64 > /etc/ld.so.conf.d/local.conf \
 && ldconfig
CMD ["/bin/bash"] CMD ["/bin/bash"]
+61 -31
View File
@@ -1,21 +1,17 @@
FROM fedora:rawhide # build
FROM registry.fedoraproject.org/fedora:rawhide AS builder
# 1) Install dependencies RUN dnf -y --nodocs --setopt=install_weak_deps=False install \
RUN dnf install -y \
make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \ make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \
radeontop git vim patch curl ninja-build \ radeontop git vim patch curl ninja-build tar xz \
&& dnf clean all && dnf clean all && rm -rf /var/cache/dnf/*
# 2) Download ROCm nightly tarball
WORKDIR /tmp WORKDIR /tmp
RUN curl -L -o therock.tar.gz \ RUN curl -L -o therock.tar.gz \
https://therock-nightly-tarball.s3.amazonaws.com/therock-dist-linux-gfx1151-7.0.0rc20250811.tar.gz https://therock-nightly-tarball.s3.amazonaws.com/therock-dist-linux-gfx1151-7.0.0rc20250811.tar.gz
# 3) Extract into /opt/rocm-7.0
RUN mkdir -p /opt/rocm-7.0 \ RUN mkdir -p /opt/rocm-7.0 \
&& tar xvf therock.tar.gz -C /opt/rocm-7.0 --strip-components=1 && tar xzf therock.tar.gz -C /opt/rocm-7.0 --strip-components=1
# 4) Bake in ROCm env + full system PATH
ENV ROCM_PATH=/opt/rocm-7.0 \ ENV ROCM_PATH=/opt/rocm-7.0 \
HIP_PLATFORM=amd \ HIP_PLATFORM=amd \
HIP_PATH=/opt/rocm-7.0 \ HIP_PATH=/opt/rocm-7.0 \
@@ -29,7 +25,6 @@ ENV ROCM_PATH=/opt/rocm-7.0 \
CPATH=/opt/rocm-7.0/include \ CPATH=/opt/rocm-7.0/include \
PKG_CONFIG_PATH=/opt/rocm-7.0/lib/pkgconfig PKG_CONFIG_PATH=/opt/rocm-7.0/lib/pkgconfig
# 5) profile.d snippet for login & interactive shells
RUN printf '%s\n' \ RUN printf '%s\n' \
'export ROCM_PATH=/opt/rocm-7.0' \ 'export ROCM_PATH=/opt/rocm-7.0' \
'export HIP_PLATFORM=amd' \ 'export HIP_PLATFORM=amd' \
@@ -48,28 +43,17 @@ RUN printf '%s\n' \
&& chmod +x /etc/profile.d/rocm.sh \ && chmod +x /etc/profile.d/rocm.sh \
&& echo 'source /etc/profile.d/rocm.sh' >> /etc/bashrc && echo 'source /etc/profile.d/rocm.sh' >> /etc/bashrc
# Install rocwmma WORKDIR /opt
WORKDIR /opt/
COPY ./build-rocwmma.sh . COPY ./build-rocwmma.sh .
RUN chmod +x build-rocwmma.sh RUN chmod +x build-rocwmma.sh && ./build-rocwmma.sh
RUN ./build-rocwmma.sh
# 6) Clone llama.cpp
WORKDIR /opt/llama.cpp WORKDIR /opt/llama.cpp
RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git . \ RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git . \
&& git clean -xdf \ && git clean -xdf \
&& git submodule update --recursive && git submodule update --recursive
COPY ./apply-rocwmma-fix.sh /opt/apply-rocwmma-fix.sh
RUN chmod +x /opt/apply-rocwmma-fix.sh && /opt/apply-rocwmma-fix.sh /opt/llama.cpp
# Apply PAtch for rocwmma
COPY ./apply-rocwmma-fix.sh /opt
RUN chmod +x /opt/apply-rocwmma-fix.sh
RUN /opt/apply-rocwmma-fix.sh /opt/llama.cpp
# 7) Apply patchpatch and apply
COPY hip-rocm7rc.patch /opt/llama.cpp/hip-rocm7rc.patch
RUN patch -p1 < hip-rocm7rc.patch
# 8) Configure, build & install llama.cpp with HIP
RUN cmake -S . -B build \ RUN cmake -S . -B build \
-DGGML_HIP=ON \ -DGGML_HIP=ON \
-DAMDGPU_TARGETS=gfx1151 \ -DAMDGPU_TARGETS=gfx1151 \
@@ -79,13 +63,59 @@ RUN cmake -S . -B build \
&& cmake --build build --config Release -- -j$(nproc) \ && cmake --build build --config Release -- -j$(nproc) \
&& cmake --install build --config Release && cmake --install build --config Release
# 9) Copy the .so from build/bin into /usr/lib64 so ldconfig can see it # keep bin; drop headers/docs/static libs; drop source tree
RUN find /opt/llama.cpp/build -type f -name 'lib*.so*' -exec cp {} /usr/lib64/ \; \ RUN find /opt/rocm-7.0 -type f -name '*.a' -delete \
&& ldconfig && rm -rf /opt/rocm-7.0/include /opt/rocm-7.0/share \
/opt/rocm-7.0/llvm/include /opt/rocm-7.0/llvm/share \
&& rm -rf /opt/llama.cpp
# Final image: fedora-minimal plus the ROCm tree and the llama.cpp install taken from the builder
FROM registry.fedoraproject.org/fedora-minimal:rawhide

# Base libraries and a few interactive tools; the package cache is dropped in the same layer
RUN microdnf -y --nodocs --setopt=install_weak_deps=0 install \
      bash \
      ca-certificates \
      libatomic \
      libgcc \
      libstdc++ \
      radeontop \
      vim \
 && microdnf clean all \
 && rm -rf /var/cache/dnf/*

# ROCm tree under /opt/rocm-7.0, in the state the builder stage left it
COPY --from=builder /opt/rocm-7.0 /opt/rocm-7.0
# Everything the builder placed under /usr/local
COPY --from=builder /usr/local/ /usr/local/
# 10) Install helper script
COPY gguf-vram-estimator.py /usr/local/bin/ COPY gguf-vram-estimator.py /usr/local/bin/
RUN chmod +x /usr/local/bin/gguf-vram-estimator.py RUN chmod +x /usr/local/bin/gguf-vram-estimator.py
# 11) Default to interactive bash ENV ROCM_PATH=/opt/rocm-7.0 \
HIP_PLATFORM=amd \
HIP_PATH=/opt/rocm-7.0 \
HIP_CLANG_PATH=/opt/rocm-7.0/llvm/bin \
HIP_INCLUDE_PATH=/opt/rocm-7.0/include \
HIP_LIB_PATH=/opt/rocm-7.0/lib \
HIP_DEVICE_LIB_PATH=/opt/rocm-7.0/lib/llvm/amdgcn/bitcode \
PATH=/opt/rocm-7.0/bin:/opt/rocm-7.0/llvm/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin \
LD_LIBRARY_PATH=/opt/rocm-7.0/lib:/opt/rocm-7.0/lib64:/opt/rocm-7.0/llvm/lib \
LIBRARY_PATH=/opt/rocm-7.0/lib:/opt/rocm-7.0/lib64 \
CPATH=/opt/rocm-7.0/include \
PKG_CONFIG_PATH=/opt/rocm-7.0/lib/pkgconfig
# Write the ROCm environment to a profile.d snippet (one export per line) and have
# /etc/bashrc source it as well.
RUN { \
      echo 'export ROCM_PATH=/opt/rocm-7.0'; \
      echo 'export HIP_PLATFORM=amd'; \
      echo 'export HIP_PATH=/opt/rocm-7.0'; \
      echo 'export HIP_CLANG_PATH=/opt/rocm-7.0/llvm/bin'; \
      echo 'export HIP_INCLUDE_PATH=/opt/rocm-7.0/include'; \
      echo 'export HIP_LIB_PATH=/opt/rocm-7.0/lib'; \
      echo 'export HIP_DEVICE_LIB_PATH=/opt/rocm-7.0/lib/llvm/amdgcn/bitcode'; \
      echo 'export PATH="$ROCM_PATH/bin:$HIP_CLANG_PATH:$PATH"'; \
      echo 'export LD_LIBRARY_PATH="$HIP_LIB_PATH:$ROCM_PATH/lib:$ROCM_PATH/lib64:$ROCM_PATH/llvm/lib"'; \
      echo 'export LIBRARY_PATH="$HIP_LIB_PATH:$ROCM_PATH/lib:$ROCM_PATH/lib64"'; \
      echo 'export CPATH="$HIP_INCLUDE_PATH"'; \
      echo 'export PKG_CONFIG_PATH="$ROCM_PATH/lib/pkgconfig"'; \
      echo 'export ROCBLAS_USE_HIPBLASLT=1'; \
    } > /etc/profile.d/rocm.sh \
 && chmod +x /etc/profile.d/rocm.sh \
 && echo 'source /etc/profile.d/rocm.sh' >> /etc/bashrc

# Add /usr/local/lib and /usr/local/lib64 to the dynamic linker search path via ld.so.conf.d
# (rather than through environment variables) and rebuild the linker cache.
RUN printf '%s\n' /usr/local/lib /usr/local/lib64 > /etc/ld.so.conf.d/local.conf \
 && ldconfig
CMD ["/bin/bash"] CMD ["/bin/bash"]
+44 -10
View File
@@ -1,24 +1,25 @@
FROM fedora:rawhide # build stage
FROM registry.fedoraproject.org/fedora:rawhide AS builder
# Install build tools, Vulkan headers/loader, and glslc # deps
RUN dnf install --refresh -y \ RUN dnf -y --nodocs --setopt=install_weak_deps=False install \
git vim \ git vim \
make gcc cmake ninja-build lld clang clang-devel compiler-rt libcurl-devel \ make gcc cmake ninja-build lld clang clang-devel compiler-rt libcurl-devel \
vulkan-loader-devel vulkaninfo mesa-vulkan-drivers \ vulkan-loader-devel vulkaninfo mesa-vulkan-drivers \
radeontop glslc wget \ radeontop glslc wget \
&& dnf clean all && dnf clean all && rm -rf /var/cache/dnf/*
# Get AMDVLK drivers # amdvlk
RUN curl -L -o /tmp/amdvlk-2025.Q2.1.x86_64.rpm \ RUN curl -L -o /tmp/amdvlk-2025.Q2.1.x86_64.rpm \
https://github.com/GPUOpen-Drivers/AMDVLK/releases/download/v-2025.Q2.1/amdvlk-2025.Q2.1.x86_64.rpm https://github.com/GPUOpen-Drivers/AMDVLK/releases/download/v-2025.Q2.1/amdvlk-2025.Q2.1.x86_64.rpm \
RUN dnf install -y /tmp/amdvlk-*.rpm && dnf -y install /tmp/amdvlk-*.rpm \
&& rm -f /tmp/amdvlk-*.rpm
# llama.cpp
WORKDIR /opt/llama.cpp WORKDIR /opt/llama.cpp
# Clone llama.cpp
RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git . RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git .
# Build with Vulkan support # build
RUN git clean -xdf \ RUN git clean -xdf \
&& git pull \ && git pull \
&& git submodule update --recursive \ && git submodule update --recursive \
@@ -32,10 +33,43 @@ RUN git clean -xdf \
&& cmake --build build --config Release \ && cmake --build build --config Release \
&& cmake --install build --config Release && cmake --install build --config Release
# libs
RUN find /opt/llama.cpp/build -type f -name 'lib*.so*' -exec cp {} /usr/lib64/ \; \ RUN find /opt/llama.cpp/build -type f -name 'lib*.so*' -exec cp {} /usr/lib64/ \; \
&& ldconfig && ldconfig
# helper
COPY gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py COPY gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py
RUN chmod +x /usr/local/bin/gguf-vram-estimator.py RUN chmod +x /usr/local/bin/gguf-vram-estimator.py
# runtime stage: small Fedora image that receives only the installed llama.cpp artifacts
FROM registry.fedoraproject.org/fedora-minimal:rawhide

# Vulkan loader, Mesa Vulkan drivers and diagnostics; package cache removed in the same layer
RUN microdnf -y --nodocs --setopt=install_weak_deps=0 install \
      bash ca-certificates libatomic libstdc++ libgcc \
      vulkan-loader vulkan-loader-devel vulkaninfo mesa-vulkan-drivers radeontop \
 && microdnf clean all && rm -rf /var/cache/dnf/*

# AMDVLK driver RPM from the upstream GitHub release. `-f` makes curl exit non-zero on an
# HTTP error instead of saving the error page under the .rpm name; the downloaded file is
# deleted in the same layer once it has been installed.
# NOTE(review): assumes the `curl` CLI is present in fedora-minimal - confirm, or add it above.
RUN curl -fL -o /tmp/amdvlk-2025.Q2.1.x86_64.rpm \
      https://github.com/GPUOpen-Drivers/AMDVLK/releases/download/v-2025.Q2.1/amdvlk-2025.Q2.1.x86_64.rpm \
 && microdnf -y install /tmp/amdvlk-*.rpm \
 && rm -f /tmp/amdvlk-*.rpm

# Everything the builder's `cmake --install` step placed under /usr/local
COPY --from=builder /usr/local/ /usr/local/

# Register /usr/local/lib{,64} with the dynamic linker, then best-effort mirror libllama into
# /usr/lib64. Only the optional `cp` is allowed to fail: the subshell keeps `|| true` from
# also swallowing a failure of the echo/ldconfig steps that precede it in the && chain.
RUN echo "/usr/local/lib" > /etc/ld.so.conf.d/local.conf \
 && echo "/usr/local/lib64" >> /etc/ld.so.conf.d/local.conf \
 && ldconfig \
 && ( cp -n /usr/local/lib/libllama*.so* /usr/lib64/ 2>/dev/null || true ) \
 && ldconfig

# VRAM estimator helper script, made executable
COPY gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py
RUN chmod +x /usr/local/bin/gguf-vram-estimator.py
# shell
CMD ["/bin/bash"] CMD ["/bin/bash"]
+34 -7
View File
@@ -1,19 +1,19 @@
FROM fedora:rawhide # build stage
FROM registry.fedoraproject.org/fedora:rawhide AS builder
# Install build tools, Vulkan headers/loader, and glslc # deps
RUN dnf install --refresh -y \ RUN dnf -y --nodocs --setopt=install_weak_deps=False install \
git vim \ git vim \
make gcc cmake ninja-build lld clang clang-devel compiler-rt libcurl-devel \ make gcc cmake ninja-build lld clang clang-devel compiler-rt libcurl-devel \
vulkan-loader-devel vulkaninfo mesa-vulkan-drivers \ vulkan-loader-devel vulkaninfo mesa-vulkan-drivers \
radeontop glslc \ radeontop glslc \
&& dnf clean all && dnf clean all && rm -rf /var/cache/dnf/*
# llama.cpp
WORKDIR /opt/llama.cpp WORKDIR /opt/llama.cpp
# Clone llama.cpp
RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git . RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git .
# Build with Vulkan support # build
RUN git clean -xdf \ RUN git clean -xdf \
&& git pull \ && git pull \
&& git submodule update --recursive \ && git submodule update --recursive \
@@ -27,10 +27,37 @@ RUN git clean -xdf \
&& cmake --build build --config Release \ && cmake --build build --config Release \
&& cmake --install build --config Release && cmake --install build --config Release
# libs
RUN find /opt/llama.cpp/build -type f -name 'lib*.so*' -exec cp {} /usr/lib64/ \; \ RUN find /opt/llama.cpp/build -type f -name 'lib*.so*' -exec cp {} /usr/lib64/ \; \
&& ldconfig && ldconfig
# helper
COPY gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py COPY gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py
RUN chmod +x /usr/local/bin/gguf-vram-estimator.py RUN chmod +x /usr/local/bin/gguf-vram-estimator.py
# runtime stage: small Fedora image that receives only the installed llama.cpp artifacts
FROM registry.fedoraproject.org/fedora-minimal:rawhide

# Vulkan loader, Mesa Vulkan drivers and diagnostics; package cache removed in the same layer
RUN microdnf -y --nodocs --setopt=install_weak_deps=0 install \
      bash ca-certificates libatomic libstdc++ libgcc \
      vulkan-loader vulkan-loader-devel vulkaninfo mesa-vulkan-drivers radeontop \
 && microdnf clean all && rm -rf /var/cache/dnf/*

# Everything the builder's `cmake --install` step placed under /usr/local
COPY --from=builder /usr/local/ /usr/local/

# Register /usr/local/lib{,64} with the dynamic linker, then best-effort mirror libllama into
# /usr/lib64. Only the optional `cp` is allowed to fail: the subshell keeps `|| true` from
# also swallowing a failure of the echo/ldconfig steps that precede it in the && chain.
RUN echo "/usr/local/lib" > /etc/ld.so.conf.d/local.conf \
 && echo "/usr/local/lib64" >> /etc/ld.so.conf.d/local.conf \
 && ldconfig \
 && ( cp -n /usr/local/lib/libllama*.so* /usr/lib64/ 2>/dev/null || true ) \
 && ldconfig

# VRAM estimator helper script, made executable
COPY gguf-vram-estimator.py /usr/local/bin/gguf-vram-estimator.py
RUN chmod +x /usr/local/bin/gguf-vram-estimator.py
# shell
CMD ["/bin/bash"] CMD ["/bin/bash"]