116 lines
3.8 KiB
Bash
Executable File
116 lines
3.8 KiB
Bash
Executable File
#!/usr/bin/env bash
|
||
set -uo pipefail
|
||
|
||
MODEL_DIR="$(realpath models)"
|
||
RESULTDIR="results"
|
||
mkdir -p "$RESULTDIR"
|
||
|
||
# Pick exactly one .gguf per model: either
|
||
# - any .gguf without "-000*-of-" (single-file models)
|
||
# - or the first shard "*-00001-of-*.gguf"
|
||
mapfile -t MODEL_PATHS < <(
|
||
find "$MODEL_DIR" -type f -name '*.gguf' \
|
||
\( -name '*-00001-of-*.gguf' -o -not -name '*-000*-of-*.gguf' \) \
|
||
| sort
|
||
)
|
||
|
||
if (( ${#MODEL_PATHS[@]} == 0 )); then
|
||
echo "❌ No models found under $MODEL_DIR – check your paths/patterns!"
|
||
exit 1
|
||
fi
|
||
|
||
echo "Found ${#MODEL_PATHS[@]} model(s) to bench:"
|
||
for p in "${MODEL_PATHS[@]}"; do
|
||
echo " • $p"
|
||
done
|
||
echo
|
||
|
||
declare -A CMDS=(
|
||
[rocm6_4_4]="toolbox run -c llama-rocm-6.4.4 -- /usr/local/bin/llama-bench"
|
||
[rocm6_4_4-rocwmma]="toolbox run -c llama-rocm-6.4.4-rocwmma -- /usr/local/bin/llama-bench"
|
||
[rocm7.1]="toolbox run -c llama-rocm-7.1 -- /usr/local/bin/llama-bench"
|
||
[rocm7.1-rocwmma]="toolbox run -c llama-rocm-7.1-rocwmma -- /usr/local/bin/llama-bench"
|
||
[rocm-7alpha-rocwmma-improved]="toolbox run -c llama-rocm-7alpha-rocwmma-improved -- /usr/local/bin/llama-bench"
|
||
[rocm-7alpha]="toolbox run -c llama-rocm-7alpha -- /usr/local/bin/llama-bench"
|
||
[rocm-7alpha-rocwmma]="toolbox run -c llama-rocm-7alpha-rocwmma -- /usr/local/bin/llama-bench"
|
||
[rocm7_rc]="toolbox run -c llama-rocm-7rc -- /usr/local/bin/llama-bench"
|
||
[rocm7_rc-rocwmma]="toolbox run -c llama-rocm-7rc-rocwmma -- /usr/local/bin/llama-bench"
|
||
[vulkan_amdvlk]="toolbox run -c llama-vulkan-amdvlk -- /usr/sbin/llama-bench"
|
||
[vulkan_radv]="toolbox run -c llama-vulkan-radv -- /usr/sbin/llama-bench"
|
||
)
|
||
|
||
get_hblt_modes() {
|
||
local env="$1"
|
||
if [[ "$env" == rocm* ]]; then
|
||
printf '%s\n' default off
|
||
else
|
||
printf '%s\n' default
|
||
fi
|
||
}
|
||
|
||
for MODEL_PATH in "${MODEL_PATHS[@]}"; do
|
||
MODEL_NAME="$(basename "$MODEL_PATH" .gguf)"
|
||
|
||
for ENV in "${!CMDS[@]}"; do
|
||
CMD="${CMDS[$ENV]}"
|
||
mapfile -t HBLT_MODES < <(get_hblt_modes "$ENV")
|
||
|
||
for MODE in "${HBLT_MODES[@]}"; do
|
||
BASE_SUFFIX=""
|
||
CMD_EFFECTIVE="$CMD"
|
||
|
||
if [[ "$ENV" == rocm* ]]; then
|
||
if [[ "$MODE" == off ]]; then
|
||
BASE_SUFFIX="__hblt0"
|
||
CMD_EFFECTIVE="${CMD_EFFECTIVE/-- /-- env ROCBLAS_USE_HIPBLASLT=0 }"
|
||
else
|
||
CMD_EFFECTIVE="${CMD_EFFECTIVE/-- /-- env ROCBLAS_USE_HIPBLASLT=1 }"
|
||
fi
|
||
fi
|
||
|
||
# run twice: baseline and with flash attention
|
||
for FA in 1; do
|
||
SUFFIX="$BASE_SUFFIX"
|
||
EXTRA_ARGS=()
|
||
if (( FA == 1 )); then
|
||
SUFFIX="${SUFFIX}__fa1"
|
||
EXTRA_ARGS=( -fa 1 )
|
||
fi
|
||
|
||
for CTX in default longctx32768; do
|
||
CTX_SUFFIX=""
|
||
CTX_ARGS=()
|
||
if [[ "$CTX" == longctx32768 ]]; then
|
||
CTX_SUFFIX="__longctx32768"
|
||
CTX_ARGS=( -p 2048 -n 32 -d 32768 )
|
||
if [[ "$ENV" == *vulkan* ]]; then
|
||
CTX_ARGS+=( -ub 512 )
|
||
else
|
||
CTX_ARGS+=( -ub 2048 )
|
||
fi
|
||
fi
|
||
|
||
OUT="$RESULTDIR/${MODEL_NAME}__${ENV}${SUFFIX}${CTX_SUFFIX}.log"
|
||
|
||
if [[ -s "$OUT" ]]; then
|
||
echo "⏩ Skipping [${ENV}] ${MODEL_NAME}${SUFFIX}${CTX_SUFFIX:+ ($CTX_SUFFIX)}, log already exists at $OUT"
|
||
continue
|
||
fi
|
||
|
||
FULL_CMD=( $CMD_EFFECTIVE -ngl 99 -mmp 0 -m "$MODEL_PATH" "${EXTRA_ARGS[@]}" "${CTX_ARGS[@]}" -r 3 )
|
||
|
||
printf "\n▶ [%s] %s%s%s\n" "$ENV" "$MODEL_NAME" "${SUFFIX:+ $SUFFIX}" "${CTX_SUFFIX:+ $CTX_SUFFIX}"
|
||
printf " → log: %s\n" "$OUT"
|
||
printf " → cmd: %s\n\n" "${FULL_CMD[*]}"
|
||
|
||
if ! "${FULL_CMD[@]}" >"$OUT" 2>&1; then
|
||
status=$?
|
||
echo "✖ ! [${ENV}] ${MODEL_NAME}${SUFFIX}${CTX_SUFFIX:+ $CTX_SUFFIX} failed (exit ${status})" >>"$OUT"
|
||
echo " * [${ENV}] ${MODEL_NAME}${SUFFIX}${CTX_SUFFIX:+ $CTX_SUFFIX} : FAILED"
|
||
fi
|
||
done
|
||
done
|
||
done
|
||
done
|
||
done
|