From 1bffd6505fd78b51c1634b73d6d4551d356934c7 Mon Sep 17 00:00:00 2001 From: Donato Capitella Date: Fri, 1 May 2026 20:19:02 +0100 Subject: [PATCH] feat: add longctx65536 support to standard and RPC benchmark scripts --- benchmark/run_benchmarks.sh | 12 ++++++++++-- benchmark/run_rpc_benchmarks.sh | 15 +++++++++++++-- 2 files changed, 23 insertions(+), 4 deletions(-) diff --git a/benchmark/run_benchmarks.sh b/benchmark/run_benchmarks.sh index 24f31d5..96a706b 100755 --- a/benchmark/run_benchmarks.sh +++ b/benchmark/run_benchmarks.sh @@ -84,7 +84,7 @@ for MODEL_PATH in "${MODEL_PATHS[@]}"; do EXTRA_ARGS=( -fa 1 ) fi - for CTX in default longctx32768; do + for CTX in default longctx32768 longctx65536; do CTX_SUFFIX="" CTX_ARGS=() if [[ "$CTX" == longctx32768 ]]; then @@ -95,11 +95,19 @@ for MODEL_PATH in "${MODEL_PATHS[@]}"; do else CTX_ARGS+=( -ub 2048 ) fi + elif [[ "$CTX" == longctx65536 ]]; then + CTX_SUFFIX="__longctx65536" + CTX_ARGS=( -p 2048 -n 32 -d 65536 ) + if [[ "$ENV" == *vulkan* ]]; then + CTX_ARGS+=( -ub 512 ) + else + CTX_ARGS+=( -ub 2048 ) + fi fi OUT="$RESULTDIR/${MODEL_NAME}__${ENV}${SUFFIX}${CTX_SUFFIX}.log" CTX_REPS=5 - if [[ "$CTX" == longctx32768 ]]; then + if [[ "$CTX" == longctx32768 ]] || [[ "$CTX" == longctx65536 ]]; then CTX_REPS=3 fi diff --git a/benchmark/run_rpc_benchmarks.sh b/benchmark/run_rpc_benchmarks.sh index 4db3a89..50ea0ce 100755 --- a/benchmark/run_rpc_benchmarks.sh +++ b/benchmark/run_rpc_benchmarks.sh @@ -114,10 +114,12 @@ has_pending_runs() { for model_path in "${RESOLVED_MODELS[@]}"; do local model_name model_name="$(basename "${model_path}" .gguf)" - for ctx in default longctx32768; do + for ctx in default longctx32768 longctx65536; do local ctx_suffix="" if [[ "$ctx" == longctx32768 ]]; then ctx_suffix="__longctx32768" + elif [[ "$ctx" == longctx65536 ]]; then + ctx_suffix="__longctx65536" fi local log_file="$RESULTDIR/${model_name}__${env}${suffix}${ctx_suffix}__rpc.log" @@ -201,7 +203,7 @@ run_llama_bench_rpc() { # shellcheck disable=SC2206 # intentional word splitting client_cmd_ary=( $client_cmd ) - for ctx in default longctx32768; do + for ctx in default longctx32768 longctx65536; do local ctx_suffix="" local ctx_reps=3 local -a ctx_args=() @@ -214,6 +216,15 @@ run_llama_bench_rpc() { else ctx_args+=( -ub 2048 ) fi + elif [[ "$ctx" == longctx65536 ]]; then + ctx_suffix="__longctx65536" + ctx_reps=1 + ctx_args=( -p 2048 -n 32 -d 65536 ) + if [[ "$env" == *vulkan* ]]; then + ctx_args+=( -ub 512 ) + else + ctx_args+=( -ub 2048 ) + fi fi local log_file="$RESULTDIR/${model_name}__${env}${suffix}${ctx_suffix}__rpc.log"