build: disable GGML CUDA fusion in ROCm build configuration (temporary test)
This commit is contained in:
@@ -67,6 +67,7 @@ RUN patch -p1 < /tmp/llama-grammar.patch \
 -DAMDGPU_TARGETS=gfx1151 \
 -DCMAKE_BUILD_TYPE=Release \
 -DGGML_RPC=ON \
+-DGGML_CUDA_DISABLE_FUSION=1 \
 -DLLAMA_HIP_UMA=ON \
 && cmake --build build --config Release -- -j$(nproc) \
 && cmake --install build --config Release
Reference in New Issue
Block a user