fix: Add temporary workaround for ROCm 7 performance regression by setting HIP_LLVM_FLAGS.
This commit is contained in:
@@ -36,6 +36,9 @@ ENV ROCM_PATH=/opt/rocm \
|
||||
WORKDIR /opt/llama.cpp
|
||||
RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git .
|
||||
|
||||
# Temporary workaround for ROCm 7 performance regression (https://github.com/ROCm/rocm-systems/issues/2865#issuecomment-3846679806)
|
||||
# Sets HIP_LLVM_FLAGS so the build steps below see the LLVM option
# --amdgpu-unroll-threshold-local=600 (prefixed with -mllvm).
# NOTE(review): ENV also persists into the final image's runtime environment;
# drop this instruction once the upstream regression is fixed.
ENV HIP_LLVM_FLAGS="-mllvm --amdgpu-unroll-threshold-local=600"
|
||||
|
||||
# build
|
||||
RUN git clean -xdf \
|
||||
&& git submodule update --recursive \
|
||||
|
||||
@@ -57,6 +57,9 @@ RUN git clone --recursive https://github.com/ggerganov/llama.cpp.git . \
|
||||
&& git clean -xdf \
|
||||
&& git submodule update --recursive
|
||||
|
||||
# Temporary workaround for ROCm 7 performance regression (https://github.com/ROCm/rocm-systems/issues/2865#issuecomment-3846679806)
|
||||
# Sets HIP_LLVM_FLAGS so the cmake configure/build step below sees the LLVM
# option --amdgpu-unroll-threshold-local=600 (prefixed with -mllvm).
# NOTE(review): ENV also persists into the final image's runtime environment;
# drop this instruction once the upstream regression is fixed.
ENV HIP_LLVM_FLAGS="-mllvm --amdgpu-unroll-threshold-local=600"
|
||||
|
||||
RUN cmake -S . -B build \
|
||||
-DGGML_HIP=ON \
|
||||
-DAMDGPU_TARGETS=gfx1151 \
|
||||
|
||||
Reference in New Issue
Block a user