patch: increasing MAX_REPETITION_THRESHOLD to allow complex agentic workflows
This commit is contained in:
@@ -6,7 +6,7 @@ RUN dnf -y --nodocs --setopt=install_weak_deps=False \
|
|||||||
install \
|
install \
|
||||||
make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \
|
make gcc cmake lld clang clang-devel compiler-rt libcurl-devel \
|
||||||
rocminfo radeontop 'rocm-*' 'rocblas-*' hipblas 'hipblas-*' \
|
rocminfo radeontop 'rocm-*' 'rocblas-*' hipblas 'hipblas-*' \
|
||||||
git vim rsync sudo tar xz \
|
git vim rsync sudo tar xz patch \
|
||||||
&& dnf clean all && rm -rf /var/cache/dnf/*
|
&& dnf clean all && rm -rf /var/cache/dnf/*
|
||||||
|
|
||||||
# llama.cpp
|
# llama.cpp
|
||||||
@@ -15,9 +15,12 @@ ARG REPO=https://github.com/ggerganov/llama.cpp.git
|
|||||||
ARG BRANCH=master
|
ARG BRANCH=master
|
||||||
RUN git clone -b ${BRANCH} --single-branch --recursive ${REPO} .
|
RUN git clone -b ${BRANCH} --single-branch --recursive ${REPO} .
|
||||||
|
|
||||||
|
COPY llama-grammar.patch /tmp/llama-grammar.patch
|
||||||
|
|
||||||
# build + install
|
# build + install
|
||||||
RUN git clean -xdf \
|
RUN git clean -xdf \
|
||||||
&& git submodule update --recursive \
|
&& git submodule update --recursive \
|
||||||
|
&& patch -p1 < /tmp/llama-grammar.patch \
|
||||||
&& HIPCXX="$(hipconfig -l)/clang" HIP_PATH="$(hipconfig -R)" \
|
&& HIPCXX="$(hipconfig -l)/clang" HIP_PATH="$(hipconfig -R)" \
|
||||||
cmake -S . -B build \
|
cmake -S . -B build \
|
||||||
-DGGML_HIP=ON \
|
-DGGML_HIP=ON \
|
||||||
|
|||||||
@@ -22,7 +22,7 @@ RUN dnf -y --nodocs --setopt=install_weak_deps=False \
|
|||||||
rocm-llvm rocm-device-libs hip-runtime-amd hip-devel \
|
rocm-llvm rocm-device-libs hip-runtime-amd hip-devel \
|
||||||
rocblas rocblas-devel hipblas hipblas-devel rocm-cmake libomp-devel libomp \
|
rocblas rocblas-devel hipblas hipblas-devel rocm-cmake libomp-devel libomp \
|
||||||
rocminfo radeontop \
|
rocminfo radeontop \
|
||||||
git-core vim sudo rsync \
|
git-core vim sudo rsync patch \
|
||||||
&& dnf clean all && rm -rf /var/cache/dnf/*
|
&& dnf clean all && rm -rf /var/cache/dnf/*
|
||||||
|
|
||||||
# rocm env
|
# rocm env
|
||||||
@@ -38,9 +38,12 @@ ARG REPO=https://github.com/ggerganov/llama.cpp.git
|
|||||||
ARG BRANCH=master
|
ARG BRANCH=master
|
||||||
RUN git clone -b ${BRANCH} --single-branch --recursive ${REPO} .
|
RUN git clone -b ${BRANCH} --single-branch --recursive ${REPO} .
|
||||||
|
|
||||||
|
COPY llama-grammar.patch /tmp/llama-grammar.patch
|
||||||
|
|
||||||
# build
|
# build
|
||||||
RUN git clean -xdf \
|
RUN git clean -xdf \
|
||||||
&& git submodule update --recursive \
|
&& git submodule update --recursive \
|
||||||
|
&& patch -p1 < /tmp/llama-grammar.patch \
|
||||||
&& cmake -S . -B build \
|
&& cmake -S . -B build \
|
||||||
-DGGML_HIP=ON \
|
-DGGML_HIP=ON \
|
||||||
-DCMAKE_HIP_FLAGS="--rocm-path=/opt/rocm -mllvm --amdgpu-unroll-threshold-local=600" \
|
-DCMAKE_HIP_FLAGS="--rocm-path=/opt/rocm -mllvm --amdgpu-unroll-threshold-local=600" \
|
||||||
|
|||||||
@@ -59,9 +59,10 @@ RUN git clone -b ${BRANCH} --single-branch --recursive ${REPO} . \
|
|||||||
&& git clean -xdf \
|
&& git clean -xdf \
|
||||||
&& git submodule update --recursive
|
&& git submodule update --recursive
|
||||||
|
|
||||||
|
COPY llama-grammar.patch /tmp/llama-grammar.patch
|
||||||
|
|
||||||
|
RUN patch -p1 < /tmp/llama-grammar.patch \
|
||||||
RUN cmake -S . -B build \
|
&& cmake -S . -B build \
|
||||||
-DGGML_HIP=ON \
|
-DGGML_HIP=ON \
|
||||||
-DAMDGPU_TARGETS=gfx1151 \
|
-DAMDGPU_TARGETS=gfx1151 \
|
||||||
-DCMAKE_BUILD_TYPE=Release \
|
-DCMAKE_BUILD_TYPE=Release \
|
||||||
|
|||||||
@@ -6,7 +6,7 @@ RUN dnf -y --nodocs --setopt=install_weak_deps=False install \
|
|||||||
git vim \
|
git vim \
|
||||||
make gcc cmake ninja-build lld clang clang-devel compiler-rt libcurl-devel \
|
make gcc cmake ninja-build lld clang clang-devel compiler-rt libcurl-devel \
|
||||||
vulkan-loader-devel vulkaninfo mesa-vulkan-drivers \
|
vulkan-loader-devel vulkaninfo mesa-vulkan-drivers \
|
||||||
radeontop glslc wget \
|
radeontop glslc wget patch \
|
||||||
&& dnf clean all && rm -rf /var/cache/dnf/*
|
&& dnf clean all && rm -rf /var/cache/dnf/*
|
||||||
|
|
||||||
# amdvlk
|
# amdvlk
|
||||||
@@ -21,9 +21,12 @@ ARG REPO=https://github.com/ggerganov/llama.cpp.git
|
|||||||
ARG BRANCH=master
|
ARG BRANCH=master
|
||||||
RUN git clone -b ${BRANCH} --single-branch --recursive ${REPO} .
|
RUN git clone -b ${BRANCH} --single-branch --recursive ${REPO} .
|
||||||
|
|
||||||
|
COPY llama-grammar.patch /tmp/llama-grammar.patch
|
||||||
|
|
||||||
# build
|
# build
|
||||||
RUN git clean -xdf \
|
RUN git clean -xdf \
|
||||||
&& git submodule update --recursive \
|
&& git submodule update --recursive \
|
||||||
|
&& patch -p1 < /tmp/llama-grammar.patch \
|
||||||
&& cmake -S . -B build -G Ninja \
|
&& cmake -S . -B build -G Ninja \
|
||||||
-DGGML_VULKAN=ON \
|
-DGGML_VULKAN=ON \
|
||||||
-DCMAKE_BUILD_TYPE=Release \
|
-DCMAKE_BUILD_TYPE=Release \
|
||||||
|
|||||||
@@ -6,7 +6,7 @@ RUN dnf -y --nodocs --setopt=install_weak_deps=False install \
|
|||||||
git vim \
|
git vim \
|
||||||
make gcc cmake ninja-build lld clang clang-devel compiler-rt libcurl-devel \
|
make gcc cmake ninja-build lld clang clang-devel compiler-rt libcurl-devel \
|
||||||
vulkan-loader-devel vulkaninfo mesa-vulkan-drivers \
|
vulkan-loader-devel vulkaninfo mesa-vulkan-drivers \
|
||||||
radeontop glslc \
|
radeontop glslc patch \
|
||||||
&& dnf clean all && rm -rf /var/cache/dnf/*
|
&& dnf clean all && rm -rf /var/cache/dnf/*
|
||||||
|
|
||||||
# llama.cpp
|
# llama.cpp
|
||||||
@@ -15,9 +15,12 @@ ARG REPO=https://github.com/ggerganov/llama.cpp.git
|
|||||||
ARG BRANCH=master
|
ARG BRANCH=master
|
||||||
RUN git clone -b ${BRANCH} --single-branch --recursive ${REPO} .
|
RUN git clone -b ${BRANCH} --single-branch --recursive ${REPO} .
|
||||||
|
|
||||||
|
COPY llama-grammar.patch /tmp/llama-grammar.patch
|
||||||
|
|
||||||
# build
|
# build
|
||||||
RUN git clean -xdf \
|
RUN git clean -xdf \
|
||||||
&& git submodule update --recursive \
|
&& git submodule update --recursive \
|
||||||
|
&& patch -p1 < /tmp/llama-grammar.patch \
|
||||||
&& cmake -S . -B build -G Ninja \
|
&& cmake -S . -B build -G Ninja \
|
||||||
-DGGML_VULKAN=ON \
|
-DGGML_VULKAN=ON \
|
||||||
-DCMAKE_BUILD_TYPE=Release \
|
-DCMAKE_BUILD_TYPE=Release \
|
||||||
|
|||||||
@@ -0,0 +1,13 @@
|
|||||||
|
From: KYmidnight
|
||||||
|
Issue: https://github.com/kyuz0/amd-strix-halo-toolboxes/issues/70
|
||||||
|
Subject: Increase MAX_REPETITION_THRESHOLD for complex tool schemas
|
||||||
|
|
||||||
|
--- a/src/llama-grammar.cpp
|
||||||
|
+++ b/src/llama-grammar.cpp
|
||||||
|
@@ -14,7 +14,7 @@
|
||||||
|
|
||||||
|
// allow to be at least defined in CMakeLists.txt
|
||||||
|
#ifndef MAX_REPETITION_THRESHOLD
|
||||||
|
-#define MAX_REPETITION_THRESHOLD 2000
|
||||||
|
+#define MAX_REPETITION_THRESHOLD 100000
|
||||||
|
#endif
|
||||||
Reference in New Issue
Block a user