fix: use rocm-wmma-tune directly
This commit is contained in:
@@ -58,18 +58,12 @@ COPY ./build-rocwmma.sh .
|
|||||||
RUN chmod +x build-rocwmma.sh && ./build-rocwmma.sh
|
RUN chmod +x build-rocwmma.sh && ./build-rocwmma.sh
|
||||||
|
|
||||||
WORKDIR /opt/llama.cpp
|
WORKDIR /opt/llama.cpp
|
||||||
RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git . \
|
RUN git clone --recursive -b rocm-wmma-tune https://github.com/lhl/llama.cpp.git . \
|
||||||
&& git clean -xdf \
|
&& git clean -xdf \
|
||||||
&& git submodule update --recursive
|
&& git submodule update --recursive
|
||||||
COPY ./apply-rocwmma-fix.sh /opt/apply-rocwmma-fix.sh
|
COPY ./apply-rocwmma-fix.sh /opt/apply-rocwmma-fix.sh
|
||||||
RUN chmod +x /opt/apply-rocwmma-fix.sh && /opt/apply-rocwmma-fix.sh /opt/llama.cpp
|
RUN chmod +x /opt/apply-rocwmma-fix.sh && /opt/apply-rocwmma-fix.sh /opt/llama.cpp
|
||||||
|
|
||||||
# Download and apply the PR 16827 patch
|
|
||||||
RUN aria2c -x 16 -s 16 -j 16 --file-allocation=none \
|
|
||||||
"https://github.com/ggml-org/llama.cpp/pull/16827.patch?full_index=1" \
|
|
||||||
-o 16827.patch
|
|
||||||
RUN git apply 16827.patch
|
|
||||||
|
|
||||||
RUN cmake -S . -B build \
|
RUN cmake -S . -B build \
|
||||||
-DGGML_HIP=ON \
|
-DGGML_HIP=ON \
|
||||||
-DAMDGPU_TARGETS=gfx1151 \
|
-DAMDGPU_TARGETS=gfx1151 \
|
||||||
|
|||||||
Reference in New Issue
Block a user