fix: Add temporary workaround for ROCm 7 performance regression by setting HIP_LLVM_FLAGS.
This commit is contained in:
@@ -36,6 +36,9 @@ ENV ROCM_PATH=/opt/rocm \
|
|||||||
WORKDIR /opt/llama.cpp
|
WORKDIR /opt/llama.cpp
|
||||||
RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git .
|
RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git .
|
||||||
|
|
||||||
|
# Temporary workaround for ROCm 7 performance regression (https://github.com/ROCm/rocm-systems/issues/2865#issuecomment-3846679806)
|
||||||
|
ENV HIP_LLVM_FLAGS="-mllvm --amdgpu-unroll-threshold-local=600"
|
||||||
|
|
||||||
# build
|
# build
|
||||||
RUN git clean -xdf \
|
RUN git clean -xdf \
|
||||||
&& git submodule update --recursive \
|
&& git submodule update --recursive \
|
||||||
|
|||||||
@@ -57,6 +57,9 @@ RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git . \
|
|||||||
&& git clean -xdf \
|
&& git clean -xdf \
|
||||||
&& git submodule update --recursive
|
&& git submodule update --recursive
|
||||||
|
|
||||||
|
# Temporary workaround for ROCm 7 performance regression (https://github.com/ROCm/rocm-systems/issues/2865#issuecomment-3846679806)
|
||||||
|
ENV HIP_LLVM_FLAGS="-mllvm --amdgpu-unroll-threshold-local=600"
|
||||||
|
|
||||||
RUN cmake -S . -B build \
|
RUN cmake -S . -B build \
|
||||||
-DGGML_HIP=ON \
|
-DGGML_HIP=ON \
|
||||||
-DAMDGPU_TARGETS=gfx1151 \
|
-DAMDGPU_TARGETS=gfx1151 \
|
||||||
|
|||||||
Reference in New Issue
Block a user