From f93c88b792545ebde0ea95bc94542aeda60a892c Mon Sep 17 00:00:00 2001 From: Donato Capitella Date: Wed, 12 Nov 2025 13:57:24 +0000 Subject: [PATCH] limit llama-bench to 1 try to support longer context --- benchmark/run_benchmarks.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/benchmark/run_benchmarks.sh b/benchmark/run_benchmarks.sh index f3c35b0..c1a5d8e 100755 --- a/benchmark/run_benchmarks.sh +++ b/benchmark/run_benchmarks.sh @@ -83,7 +83,7 @@ for MODEL_PATH in "${MODEL_PATHS[@]}"; do fi # build command array - FULL_CMD=( $CMD_EFFECTIVE -ngl 99 -mmp 0 -m "$MODEL_PATH" "${EXTRA_ARGS[@]}" -d 512,32768 ) + FULL_CMD=( $CMD_EFFECTIVE -ngl 99 -mmp 0 -m "$MODEL_PATH" "${EXTRA_ARGS[@]}" -d 512,32768 -r 1 ) printf "\n▶ [%s] %s%s\n" "$ENV" "$MODEL_NAME" "${SUFFIX:+ $SUFFIX}" printf " → log: %s\n" "$OUT"