{ "meta": { "generated_at": "2026-04-15T07:08:17Z", "system_info": { "distro": "Fedora Linux 43 (Workstation Edition)", "kernel": "6.19.9-200.fc43.x86_64", "linux_firmware": "linux-firmware-20260309-1.fc43.noarch", "timestamp": "10 Apr 2026" }, "llamacpp_builds": [ { "hash": "3f8752b55", "number": "8743" }, { "hash": "ff5ef8278", "number": "8763" } ], "environments": [ "rocm-7_2", "rocm-7_2_1", "rocm6_4_4", "rocm7-nightlies", "vulkan_amdvlk", "vulkan_radv" ], "notes": "pp512 = prompt processing; tg128 = text generation; t/s = tokens/second" }, "runs": [ { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 78.36, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.99, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 17.67, "tps_std": 0.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.08, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 78.4, "tps_std": 0.1, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.76, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 17.57, "tps_std": 0.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.09, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 78.06, "tps_std": 0.06, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.95, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 18.34, "tps_std": 0.14, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.06, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 123.0, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": null }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 123.0, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": null }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 46.91, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.99, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 7.32, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.59, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 404.18, "tps_std": 1.94, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 20.88, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 88.16, "tps_std": 0.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.07, "tps_std": 0.2, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": false, "error_type": null, "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": null }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 392.81, "tps_std": 1.96, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 18.97, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 94.55, "tps_std": 0.17, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 14.89, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 400.57, "tps_std": 4.1, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 19.39, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 86.01, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 14.86, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 114.94, "tps_std": 0.15, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 10.48, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 10.14, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.04, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 326.36, "tps_std": 4.62, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 9.5, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 102.0, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.82, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 914.78, "tps_std": 3.38, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 32.73, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 91.49, "tps_std": 0.75, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 20.47, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 903.01, "tps_std": 2.32, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 30.77, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 99.7, "tps_std": 0.23, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 19.93, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 888.7, "tps_std": 38.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 32.81, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 89.53, "tps_std": 0.09, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 20.47, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 499.74, "tps_std": 1.49, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 39.02, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": null }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 875.8, "tps_std": 2.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 40.19, "tps_std": 1.39, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 134.1, "tps_std": 0.07, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 21.18, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 245.94, "tps_std": 1.48, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "ff5ef8278", "number": "8763" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 24.11, "tps_std": 0.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "ff5ef8278", "number": "8763" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 66.09, "tps_std": 0.53, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "ff5ef8278", "number": "8763" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.32, "tps_std": 0.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "ff5ef8278", "number": "8763" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 245.63, "tps_std": 1.62, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 22.63, "tps_std": 0.07, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 79.52, "tps_std": 0.47, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.69, "tps_std": 0.15, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 237.43, "tps_std": 0.96, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 22.63, "tps_std": 0.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 61.53, "tps_std": 0.27, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.52, "tps_std": 0.17, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 203.53, "tps_std": 0.7, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 24.06, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 31.94, "tps_std": 0.07, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 10.05, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 234.24, "tps_std": 1.27, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 29.48, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 32.31, "tps_std": 0.16, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 14.2, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 747.81, "tps_std": 7.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.42, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 182.77, "tps_std": 1.55, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.08, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 716.84, "tps_std": 2.31, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.39, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 166.12, "tps_std": 0.76, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.05, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 726.92, "tps_std": 2.95, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.43, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 162.4, "tps_std": 0.45, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.07, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 14.0, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1.log", "rpc": false, "build": null }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 14.0, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": null }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 164.2, "tps_std": 0.55, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 7.94, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 72.41, "tps_std": 0.21, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.71, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 264.16, "tps_std": 1.43, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 16.01, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 299.29, "tps_std": 0.4, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.59, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 261.51, "tps_std": 1.5, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 15.63, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 323.83, "tps_std": 0.28, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.34, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 232.54, "tps_std": 0.27, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 15.81, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 284.15, "tps_std": 0.23, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.34, "tps_std": 0.61, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 138.78, "tps_std": 0.58, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.45, "tps_std": 0.09, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 104.96, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 13.66, "tps_std": 0.21, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 191.97, "tps_std": 8.53, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.7, "tps_std": 0.35, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 185.9, "tps_std": 0.18, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 14.21, "tps_std": 0.38, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1148.88, "tps_std": 7.32, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 67.8, "tps_std": 0.73, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 194.78, "tps_std": 0.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 33.46, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1167.77, "tps_std": 7.34, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 65.06, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 291.69, "tps_std": 0.26, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 32.81, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1185.86, "tps_std": 2.21, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 68.95, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 203.21, "tps_std": 0.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 34.77, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 882.68, "tps_std": 3.83, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 80.48, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 111.69, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 28.03, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1145.07, "tps_std": 8.85, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 82.16, "tps_std": 3.05, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 194.38, "tps_std": 0.33, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 37.09, "tps_std": 0.05, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 312.22, "tps_std": 2.95, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 19.6, "tps_std": 0.06, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 250.19, "tps_std": 0.15, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.88, "tps_std": 1.13, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 316.73, "tps_std": 1.27, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 18.86, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 275.81, "tps_std": 1.62, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 17.9, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 318.17, "tps_std": 2.18, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 19.57, "tps_std": 0.14, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 223.61, "tps_std": 0.83, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 18.32, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 182.98, "tps_std": 1.82, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 21.33, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 102.84, "tps_std": 0.14, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 18.77, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 241.15, "tps_std": 7.43, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 21.75, "tps_std": 0.24, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 202.99, "tps_std": 0.41, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 20.09, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 509.12, "tps_std": 4.29, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 23.63, "tps_std": 0.12, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 390.8, "tps_std": 4.3, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 21.61, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 545.2, "tps_std": 3.5, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 21.99, "tps_std": 0.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 354.63, "tps_std": 1.42, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 21.65, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 512.14, "tps_std": 2.33, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 23.77, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 383.01, "tps_std": 0.52, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 22.11, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 122.66, "tps_std": 0.28, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 11.56, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 97.36, "tps_std": 0.07, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 10.94, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 317.93, "tps_std": 2.34, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 10.8, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 258.29, "tps_std": 0.54, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 10.39, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1098.31, "tps_std": 7.28, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 47.89, "tps_std": 0.32, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 681.43, "tps_std": 0.74, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 40.19, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1080.97, "tps_std": 5.37, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 45.98, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 611.53, "tps_std": 0.52, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 40.17, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1111.77, "tps_std": 11.14, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 47.94, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 669.42, "tps_std": 1.32, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 41.96, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 663.48, "tps_std": 2.94, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 58.17, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 289.32, "tps_std": 1.23, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 44.23, "tps_std": 0.08, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1016.96, "tps_std": 39.65, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 59.11, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 673.76, "tps_std": 0.15, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 49.03, "tps_std": 0.14, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 703.33, "tps_std": 5.75, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 29.06, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 489.36, "tps_std": 3.31, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 26.31, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 698.12, "tps_std": 4.53, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 25.88, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 615.35, "tps_std": 3.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 26.34, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 697.35, "tps_std": 3.46, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 28.1, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 553.41, "tps_std": 1.44, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 26.57, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 415.49, "tps_std": 2.3, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 30.74, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 228.9, "tps_std": 0.28, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 26.62, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 710.93, "tps_std": 18.62, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 28.92, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 531.15, "tps_std": 0.2, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 26.32, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 45.33, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 864.78, "tps_std": 7.29, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 22.66, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 625.12, "tps_std": 11.57, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 19.99, "tps_std": 0.23, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 839.13, "tps_std": 7.61, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 20.75, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 646.67, "tps_std": 11.22, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 19.86, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 844.42, "tps_std": 19.66, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 22.69, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 546.66, "tps_std": 5.96, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 20.11, "tps_std": 0.07, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 117.96, "tps_std": 0.28, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 16.18, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 58.94, "tps_std": 0.07, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.26, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 376.52, "tps_std": 7.37, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.74, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 351.87, "tps_std": 1.49, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 13.71, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1298.78, "tps_std": 7.07, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 46.65, "tps_std": 0.23, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 691.44, "tps_std": 4.5, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 36.86, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1288.38, "tps_std": 10.85, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 45.58, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 721.84, "tps_std": 10.97, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 36.17, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1219.74, "tps_std": 15.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 46.57, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 600.42, "tps_std": 7.55, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 36.88, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 720.78, "tps_std": 2.94, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 50.21, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 100.79, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 35.41, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1213.78, "tps_std": 7.36, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 53.04, "tps_std": 0.1, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 638.76, "tps_std": 1.76, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 40.93, "tps_std": 0.09, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1226.22, "tps_std": 161.95, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 41.27, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 667.32, "tps_std": 5.65, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 33.43, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1303.32, "tps_std": 8.77, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 38.81, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 727.92, "tps_std": 8.62, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 32.52, "tps_std": 0.35, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1294.4, "tps_std": 31.54, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 41.09, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 596.78, "tps_std": 7.98, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 33.35, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 589.2, "tps_std": 1.79, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 43.18, "tps_std": 0.07, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 97.7, "tps_std": 0.1, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 31.82, "tps_std": 0.05, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 944.96, "tps_std": 19.24, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 43.58, "tps_std": 1.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 579.88, "tps_std": 0.09, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 35.52, "tps_std": 0.07, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 381.31, "tps_std": 4.26, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.49, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 151.84, "tps_std": 1.65, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.17, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 360.84, "tps_std": 1.6, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.3, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 154.86, "tps_std": 2.16, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.14, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 373.84, "tps_std": 0.93, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.41, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 139.53, "tps_std": 1.98, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.16, "tps_std": 0.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 31.0, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": null }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 31.0, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": null }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 79.53, "tps_std": 0.26, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.5, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 60.29, "tps_std": 0.37, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.24, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 313.26, "tps_std": 1.19, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 10.51, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 141.61, "tps_std": 1.71, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.11, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 309.22, "tps_std": 0.13, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 10.02, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 143.91, "tps_std": 1.64, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.81, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 315.72, "tps_std": 0.3, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 10.51, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 130.8, "tps_std": 1.45, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.2, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 69.12, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 10.71, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 31.0, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": null }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 244.46, "tps_std": 0.27, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 11.02, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 124.32, "tps_std": 1.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.78, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 309.13, "tps_std": 0.94, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 6.16, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 140.72, "tps_std": 1.33, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.26, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 303.4, "tps_std": 0.23, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 6.07, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 141.37, "tps_std": 1.98, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.18, "tps_std": 0.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 319.75, "tps_std": 0.26, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 6.12, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 128.0, "tps_std": 1.3, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.3, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 72.26, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 6.28, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 31.0, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": null }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 209.2, "tps_std": 6.85, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 6.28, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 112.72, "tps_std": 1.26, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.49, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 633.0, "tps_std": 7.37, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.15, "tps_std": 0.36, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 296.45, "tps_std": 1.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 31.19, "tps_std": 8.13, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 648.77, "tps_std": 4.37, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 49.76, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 439.58, "tps_std": 0.57, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 39.77, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 641.05, "tps_std": 2.79, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 50.73, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 305.81, "tps_std": 0.24, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 36.03, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 575.01, "tps_std": 3.11, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.2, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 214.22, "tps_std": 0.5, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 34.54, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 635.12, "tps_std": 4.23, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 56.31, "tps_std": 0.08, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 290.19, "tps_std": 1.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 42.28, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1631.41, "tps_std": 13.3, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 72.63, "tps_std": 0.1, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 489.21, "tps_std": 2.12, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 51.87, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1694.78, "tps_std": 17.2, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 72.19, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 730.43, "tps_std": 1.15, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 57.22, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1635.73, "tps_std": 10.16, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 72.47, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 493.84, "tps_std": 1.85, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 52.05, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1306.44, "tps_std": 9.57, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 73.63, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 365.33, "tps_std": 0.21, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 49.83, "tps_std": 0.07, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1574.45, "tps_std": 16.63, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 79.03, "tps_std": 0.17, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 545.65, "tps_std": 0.37, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 60.7, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1541.76, "tps_std": 1.17, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 50.64, "tps_std": 0.16, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2_1__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 162.73, "tps_std": 0.61, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2_1", "env_base": "rocm", "env_variant": "7_2_1", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.65, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2_1__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1524.35, "tps_std": 2.98, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 50.78, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 196.44, "tps_std": 1.93, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.96, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1513.21, "tps_std": 2.79, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.41, "tps_std": 0.13, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 189.28, "tps_std": 0.4, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.62, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 326.38, "tps_std": 0.44, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 55.44, "tps_std": 0.11, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 145.14, "tps_std": 0.2, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 10.21, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1311.79, "tps_std": 0.38, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 55.59, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 210.35, "tps_std": 0.6, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.53, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } } ] }