fix: use rocm-wmma-tune directly

This commit is contained in:
Niccolò Belli
2025-10-29 11:25:15 +01:00
parent 12fcfc54ba
commit 2e9ea4da70
@@ -58,18 +58,12 @@ COPY ./build-rocwmma.sh .
 RUN chmod +x build-rocwmma.sh && ./build-rocwmma.sh
 WORKDIR /opt/llama.cpp
-RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git . \
+RUN git clone --recursive -b rocm-wmma-tune https://github.com/lhl/llama.cpp.git . \
 && git clean -xdf \
 && git submodule update --recursive
 COPY ./apply-rocwmma-fix.sh /opt/apply-rocwmma-fix.sh
 RUN chmod +x /opt/apply-rocwmma-fix.sh && /opt/apply-rocwmma-fix.sh /opt/llama.cpp
-# Download and apply the PR 16827 patch
-RUN aria2c -x 16 -s 16 -j 16 --file-allocation=none \
-"https://github.com/ggml-org/llama.cpp/pull/16827.patch?full_index=1" \
--o 16827.patch
-RUN git apply 16827.patch
 RUN cmake -S . -B build \
 -DGGML_HIP=ON \
 -DAMDGPU_TARGETS=gfx1151 \