Reduce image size of the rocm-6.4.3 toolboxes (install only the required ROCm packages instead of the full rocm meta-package)

This commit is contained in:
Donato Capitella
2025-08-16 11:48:42 +01:00
parent 5a417bc3b5
commit 7641ae0127
3 changed files with 55 additions and 23 deletions
-1
View File
@@ -11,7 +11,6 @@ TOOLBOXES["llama-rocm-6.4.2"]="docker.io/kyuz0/amd-strix-halo-toolboxes:rocm-6.4
TOOLBOXES["llama-rocm-6.4.2-rocwmma"]="docker.io/kyuz0/amd-strix-halo-toolboxes:rocm-6.4.2-rocwmma --device /dev/dri --device /dev/kfd --group-add video --group-add render --group-add sudo --security-opt seccomp=unconfined" TOOLBOXES["llama-rocm-6.4.2-rocwmma"]="docker.io/kyuz0/amd-strix-halo-toolboxes:rocm-6.4.2-rocwmma --device /dev/dri --device /dev/kfd --group-add video --group-add render --group-add sudo --security-opt seccomp=unconfined"
TOOLBOXES["llama-rocm-6.4.3"]="docker.io/kyuz0/amd-strix-halo-toolboxes:rocm-6.4.3 --device /dev/dri --device /dev/kfd --group-add video --group-add render --group-add sudo --security-opt seccomp=unconfined" TOOLBOXES["llama-rocm-6.4.3"]="docker.io/kyuz0/amd-strix-halo-toolboxes:rocm-6.4.3 --device /dev/dri --device /dev/kfd --group-add video --group-add render --group-add sudo --security-opt seccomp=unconfined"
TOOLBOXES["llama-rocm-6.4.3-rocwmma"]="docker.io/kyuz0/amd-strix-halo-toolboxes:rocm-6.4.3-rocwmma --device /dev/dri --device /dev/kfd --group-add video --group-add render --group-add sudo --security-opt seccomp=unconfined" TOOLBOXES["llama-rocm-6.4.3-rocwmma"]="docker.io/kyuz0/amd-strix-halo-toolboxes:rocm-6.4.3-rocwmma --device /dev/dri --device /dev/kfd --group-add video --group-add render --group-add sudo --security-opt seccomp=unconfined"
TOOLBOXES["llama-rocm-7beta"]="docker.io/kyuz0/amd-strix-halo-toolboxes:rocm-7beta --device /dev/dri --device /dev/kfd --group-add video --group-add render --group-add sudo --security-opt seccomp=unconfined"
TOOLBOXES["llama-rocm-7rc"]="docker.io/kyuz0/amd-strix-halo-toolboxes:rocm-7rc --device /dev/dri --device /dev/kfd --group-add video --group-add render --group-add sudo --security-opt seccomp=unconfined" TOOLBOXES["llama-rocm-7rc"]="docker.io/kyuz0/amd-strix-halo-toolboxes:rocm-7rc --device /dev/dri --device /dev/kfd --group-add video --group-add render --group-add sudo --security-opt seccomp=unconfined"
TOOLBOXES["llama-rocm-7rc-rocwmma"]="docker.io/kyuz0/amd-strix-halo-toolboxes:rocm-7rc-rocwmma --device /dev/dri --device /dev/kfd --group-add video --group-add render --group-add sudo --security-opt seccomp=unconfined" TOOLBOXES["llama-rocm-7rc-rocwmma"]="docker.io/kyuz0/amd-strix-halo-toolboxes:rocm-7rc-rocwmma --device /dev/dri --device /dev/kfd --group-add video --group-add render --group-add sudo --security-opt seccomp=unconfined"
+27 -11
View File
@@ -15,11 +15,22 @@ REPO
EOF EOF
# deps # deps
RUN dnf -y --nodocs --setopt=install_weak_deps=False install \ RUN dnf -y --nodocs --setopt=install_weak_deps=False \
make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \ --exclude='*sdk*' --exclude='*samples*' --exclude='*-doc*' --exclude='*-docs*' \
rocm rocminfo radeontop \ install \
git vim sudo rsync \ make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \
&& dnf clean all && rm -rf /var/cache/dnf/* rocm-llvm rocm-device-libs hip-runtime-amd hip-devel \
rocblas rocblas-devel hipblas hipblas-devel \
rocminfo radeontop \
git-core vim sudo rsync \
&& dnf clean all && rm -rf /var/cache/dnf/*
# rocm env
ENV ROCM_PATH=/opt/rocm \
HIP_PATH=/opt/rocm \
HIP_CLANG_PATH=/opt/rocm/llvm/bin \
HIP_DEVICE_LIB_PATH=/opt/rocm/amdgcn/bitcode \
PATH=/opt/rocm/bin:/opt/rocm/llvm/bin:$PATH
# llama.cpp # llama.cpp
WORKDIR /opt/llama.cpp WORKDIR /opt/llama.cpp
@@ -29,12 +40,15 @@ RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git .
RUN git clean -xdf \ RUN git clean -xdf \
&& git pull \ && git pull \
&& git submodule update --recursive \ && git submodule update --recursive \
&& HIPCXX="$(hipconfig -l)/clang" HIP_PATH="$(hipconfig -R)" \ && cmake -S . -B build \
cmake -S . -B build \
-DGGML_HIP=ON \ -DGGML_HIP=ON \
-DAMDGPU_TARGETS=gfx1151 \ -DAMDGPU_TARGETS=gfx1151 \
-DCMAKE_BUILD_TYPE=Release \ -DCMAKE_BUILD_TYPE=Release \
-DLLAMA_HIP_UMA=ON \ -DLLAMA_HIP_UMA=ON \
-DROCM_PATH=/opt/rocm \
-DHIP_PATH=/opt/rocm \
-DHIP_PLATFORM=amd \
-DCMAKE_HIP_FLAGS="--rocm-path=/opt/rocm" \
&& cmake --build build --config Release -- -j$(nproc) \ && cmake --build build --config Release -- -j$(nproc) \
&& cmake --install build --config Release && cmake --install build --config Release
@@ -64,14 +78,16 @@ REPO
EOF EOF
# runtime deps # runtime deps
RUN microdnf -y --nodocs --setopt=install_weak_deps=0 install \ RUN microdnf -y --nodocs --setopt=install_weak_deps=0 \
--exclude='*sdk*' --exclude='*samples*' --exclude='*-doc*' --exclude='*-docs*' \
install \
bash ca-certificates libatomic libstdc++ libgcc \ bash ca-certificates libatomic libstdc++ libgcc \
rocm rocminfo radeontop \ hip-runtime-amd rocblas hipblas \
&& microdnf clean all && rm -rf /var/cache/dnf/* rocminfo radeontop \
&& microdnf clean all && rm -rf /var/cache/dnf/*
# copy # copy
COPY --from=builder /usr/local/ /usr/local/ COPY --from=builder /usr/local/ /usr/local/
COPY --from=builder /usr/include/rocwmma /usr/include/rocwmma
# ld # ld
RUN echo "/usr/local/lib" > /etc/ld.so.conf.d/local.conf \ RUN echo "/usr/local/lib" > /etc/ld.so.conf.d/local.conf \
+28 -11
View File
@@ -15,11 +15,22 @@ REPO
EOF EOF
# deps # deps
RUN dnf -y --nodocs --setopt=install_weak_deps=False install \ RUN dnf -y --nodocs --setopt=install_weak_deps=False \
make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \ --exclude='*sdk*' --exclude='*samples*' --exclude='*-doc*' --exclude='*-docs*' \
rocm rocminfo radeontop \ install \
git vim sudo rsync \ make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \
&& dnf clean all && rm -rf /var/cache/dnf/* rocm-llvm rocm-device-libs hip-runtime-amd hip-devel \
rocblas rocblas-devel hipblas hipblas-devel \
rocminfo radeontop \
git-core vim sudo rsync \
&& dnf clean all && rm -rf /var/cache/dnf/*
# rocm env
ENV ROCM_PATH=/opt/rocm \
HIP_PATH=/opt/rocm \
HIP_CLANG_PATH=/opt/rocm/llvm/bin \
HIP_DEVICE_LIB_PATH=/opt/rocm/amdgcn/bitcode \
PATH=/opt/rocm/bin:/opt/rocm/llvm/bin:$PATH
# rocWMMA # rocWMMA
WORKDIR /opt WORKDIR /opt
@@ -35,13 +46,16 @@ RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git .
RUN git clean -xdf \ RUN git clean -xdf \
&& git pull \ && git pull \
&& git submodule update --recursive \ && git submodule update --recursive \
&& HIPCXX="$(hipconfig -l)/clang" HIP_PATH="$(hipconfig -R)" \ && cmake -S . -B build \
cmake -S . -B build \
-DGGML_HIP=ON \ -DGGML_HIP=ON \
-DAMDGPU_TARGETS=gfx1151 \ -DAMDGPU_TARGETS=gfx1151 \
-DCMAKE_BUILD_TYPE=Release \ -DCMAKE_BUILD_TYPE=Release \
-DLLAMA_HIP_UMA=ON \ -DLLAMA_HIP_UMA=ON \
-DGGML_HIP_ROCWMMA_FATTN=ON \ -DGGML_HIP_ROCWMMA_FATTN=ON \
-DROCM_PATH=/opt/rocm \
-DHIP_PATH=/opt/rocm \
-DHIP_PLATFORM=amd \
-DCMAKE_HIP_FLAGS="--rocm-path=/opt/rocm" \
&& cmake --build build --config Release -- -j$(nproc) \ && cmake --build build --config Release -- -j$(nproc) \
&& cmake --install build --config Release && cmake --install build --config Release
@@ -71,14 +85,16 @@ REPO
EOF EOF
# runtime deps # runtime deps
RUN microdnf -y --nodocs --setopt=install_weak_deps=0 install \ RUN microdnf -y --nodocs --setopt=install_weak_deps=0 \
--exclude='*sdk*' --exclude='*samples*' --exclude='*-doc*' --exclude='*-docs*' \
install \
bash ca-certificates libatomic libstdc++ libgcc \ bash ca-certificates libatomic libstdc++ libgcc \
rocm rocminfo radeontop \ hip-runtime-amd rocblas hipblas \
&& microdnf clean all && rm -rf /var/cache/dnf/* rocminfo radeontop \
&& microdnf clean all && rm -rf /var/cache/dnf/*
# copy # copy
COPY --from=builder /usr/local/ /usr/local/ COPY --from=builder /usr/local/ /usr/local/
COPY --from=builder /usr/include/rocwmma /usr/include/rocwmma
# ld # ld
RUN echo "/usr/local/lib" > /etc/ld.so.conf.d/local.conf \ RUN echo "/usr/local/lib" > /etc/ld.so.conf.d/local.conf \
@@ -99,3 +115,4 @@ RUN printf '%s\n' \
# shell # shell
CMD ["/bin/bash"] CMD ["/bin/bash"]