{ "meta": { "generated_at": "2026-04-29T05:45:18Z", "system_info": { "distro": "Fedora Linux 43 (Workstation Edition)", "kernel": "6.19.9-200.fc43.x86_64", "linux_firmware": "linux-firmware-20260309-1.fc43.noarch", "timestamp": "10 Apr 2026" }, "llamacpp_builds": [ { "hash": "3f8752b55", "number": "8743" }, { "hash": "7957de9dc", "number": "8645" }, { "hash": "f53577432", "number": "8942" } ], "environments": [ "rocm-7_2", "rocm-7_2_2", "rocm-7_2_2-pr21344", "rocm6_4_4", "rocm7-nightlies", "vulkan_amdvlk", "vulkan_radv" ], "notes": "pp512 = prompt processing; tg128 = text generation; t/s = tokens/second" }, "runs": [ { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 72.06, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.99, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 16.76, "tps_std": 0.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.08, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 77.83, "tps_std": 0.1, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.95, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 17.1, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.06, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 78.4, "tps_std": 0.1, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.76, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 17.57, "tps_std": 0.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.09, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 78.06, "tps_std": 0.06, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.95, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 18.34, "tps_std": 0.14, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.06, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 123.0, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": null }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 123.0, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": null }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 46.91, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.99, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 7.32, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.59, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 403.45, "tps_std": 2.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 21.04, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 87.65, "tps_std": 0.31, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.25, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": false, "error_type": null, "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_2__fa1.log", "rpc": false, "build": null }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 87.91, "tps_std": 0.2, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 14.84, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": false, "error_type": null, "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": null }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 392.81, "tps_std": 1.96, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 18.97, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 94.55, "tps_std": 0.17, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 14.89, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 400.57, "tps_std": 4.1, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 19.39, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 86.01, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 14.86, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 114.94, "tps_std": 0.15, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 10.48, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 10.14, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.04, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 326.36, "tps_std": 4.62, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 9.5, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 102.0, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.82, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1058.1, "tps_std": 2.19, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 33.18, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 91.21, "tps_std": 1.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 20.62, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 889.16, "tps_std": 36.98, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 32.61, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 91.01, "tps_std": 1.51, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 20.38, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 903.01, "tps_std": 2.32, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 30.77, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 99.7, "tps_std": 0.23, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 19.93, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 888.7, "tps_std": 38.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 32.81, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 89.53, "tps_std": 0.09, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 20.47, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 499.74, "tps_std": 1.49, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 39.02, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": null }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 875.8, "tps_std": 2.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 40.19, "tps_std": 1.39, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 134.1, "tps_std": 0.07, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 21.18, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 356.93, "tps_std": 1.86, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 22.97, "tps_std": 0.13, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 65.86, "tps_std": 0.58, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.1, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 236.39, "tps_std": 1.24, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 22.64, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 64.53, "tps_std": 0.53, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.04, "tps_std": 0.17, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 236.56, "tps_std": 1.44, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 21.55, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 77.34, "tps_std": 1.21, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.54, "tps_std": 0.09, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 225.65, "tps_std": 0.79, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 21.44, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 64.1, "tps_std": 0.5, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.35, "tps_std": 0.28, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 202.08, "tps_std": 0.31, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 24.94, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 31.48, "tps_std": 0.09, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 10.27, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 231.25, "tps_std": 0.79, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 30.7, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 32.0, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_S-00001-of-00003", "model_clean": "MiniMax-M2.7-UD-Q3_K_S", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 14.47, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 87.2, "name_params_b": 228.69, "quant": "Q3_K_S", "log": "results/MiniMax-M2.7-UD-Q3_K_S-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 245.87, "tps_std": 1.58, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 22.72, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 81.2, "tps_std": 1.25, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.69, "tps_std": 0.12, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 238.13, "tps_std": 1.15, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 22.54, "tps_std": 0.27, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 61.41, "tps_std": 0.44, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.64, "tps_std": 0.15, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 203.65, "tps_std": 1.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 24.07, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 31.64, "tps_std": 0.19, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 10.06, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 230.72, "tps_std": 8.67, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 29.48, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 32.06, "tps_std": 0.16, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004", "model_clean": "MiniMax-M2.7-UD-Q3_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 14.12, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 228.69, "file_size_gib": 94.93, "name_params_b": 228.69, "quant": "Q3_K_XL", "log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 745.5, "tps_std": 9.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.42, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 164.19, "tps_std": 1.96, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.08, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 732.09, "tps_std": 2.49, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.42, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 182.01, "tps_std": 2.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.07, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 716.84, "tps_std": 2.31, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.39, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 166.12, "tps_std": 0.76, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.05, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 726.92, "tps_std": 2.95, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.43, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 162.4, "tps_std": 0.45, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.07, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 14.0, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1.log", "rpc": false, "build": null }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 14.0, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": null }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 164.2, "tps_std": 0.55, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 7.94, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 72.41, "tps_std": 0.21, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.71, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 333.46, "tps_std": 1.2, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 15.99, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 307.47, "tps_std": 0.55, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.6, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 267.67, "tps_std": 1.7, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 16.18, "tps_std": 0.07, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 304.86, "tps_std": 0.24, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.79, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 261.51, "tps_std": 1.5, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 15.63, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 323.83, "tps_std": 0.28, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.34, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 232.54, "tps_std": 0.27, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 15.81, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 284.15, "tps_std": 0.23, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.34, "tps_std": 0.61, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 138.78, "tps_std": 0.58, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.45, "tps_std": 0.09, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 104.96, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 13.66, "tps_std": 0.21, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 191.97, "tps_std": 8.53, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.7, "tps_std": 0.35, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 185.9, "tps_std": 0.18, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 14.21, "tps_std": 0.38, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1498.5, "tps_std": 6.83, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 68.29, "tps_std": 0.67, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 213.71, "tps_std": 0.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 33.47, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1149.95, "tps_std": 8.12, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 67.57, "tps_std": 0.1, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 194.74, "tps_std": 0.07, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 33.36, "tps_std": 0.13, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1167.77, "tps_std": 7.34, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 65.06, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 291.69, "tps_std": 0.26, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 32.81, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1185.86, "tps_std": 2.21, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 68.95, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 203.21, "tps_std": 0.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 34.77, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 882.68, "tps_std": 3.83, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 80.48, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 111.69, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 28.03, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1145.07, "tps_std": 8.85, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 82.16, "tps_std": 3.05, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 194.38, "tps_std": 0.33, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 37.09, "tps_std": 0.05, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 418.75, "tps_std": 3.97, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 19.62, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 207.29, "tps_std": 0.79, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.34, "tps_std": 2.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 314.59, "tps_std": 2.13, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 19.96, "tps_std": 0.15, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 235.56, "tps_std": 9.94, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 16.82, "tps_std": 0.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 316.73, "tps_std": 1.27, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 18.86, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 275.81, "tps_std": 1.62, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 17.9, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 318.17, "tps_std": 2.18, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 19.57, "tps_std": 0.14, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 223.61, "tps_std": 0.83, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 18.32, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 182.98, "tps_std": 1.82, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 21.33, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 102.84, "tps_std": 0.14, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 18.77, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 241.15, "tps_std": 7.43, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 21.75, "tps_std": 0.24, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 202.99, "tps_std": 0.41, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 20.09, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 513.08, "tps_std": 3.8, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 23.46, "tps_std": 0.06, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 379.44, "tps_std": 1.48, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 21.65, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 509.14, "tps_std": 3.56, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 23.98, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 391.47, "tps_std": 0.29, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 21.88, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 538.42, "tps_std": 12.9, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 21.91, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 412.11, "tps_std": 0.6, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 21.59, "tps_std": 0.09, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "load", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 35.0, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": null }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "load", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 35.0, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": null }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 122.43, "tps_std": 0.23, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 11.55, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 98.18, "tps_std": 0.09, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 10.94, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 316.59, "tps_std": 1.87, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 10.8, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 267.07, "tps_std": 0.91, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.6-35B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 10.37, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.6-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1359.62, "tps_std": 5.74, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 48.34, "tps_std": 0.43, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 670.26, "tps_std": 1.77, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 40.42, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1089.21, "tps_std": 5.82, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 49.27, "tps_std": 0.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 703.58, "tps_std": 0.51, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 41.08, "tps_std": 0.33, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1067.33, "tps_std": 6.85, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 48.23, "tps_std": 0.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 769.99, "tps_std": 2.79, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 41.91, "tps_std": 0.49, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1091.62, "tps_std": 10.45, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 49.1, "tps_std": 0.15, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 664.89, "tps_std": 1.48, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 42.73, "tps_std": 0.65, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 663.94, "tps_std": 2.8, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 57.13, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 292.49, "tps_std": 0.18, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 43.97, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1045.16, "tps_std": 5.79, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 58.82, "tps_std": 0.08, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 682.8, "tps_std": 1.45, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 48.77, "tps_std": 0.07, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.81, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1222.77, "tps_std": 2.88, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 43.72, "tps_std": 0.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 653.49, "tps_std": 0.18, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 37.21, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1043.12, "tps_std": 46.1, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 44.53, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 544.04, "tps_std": 1.79, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 37.7, "tps_std": 0.21, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1049.22, "tps_std": 7.25, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 43.1, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 758.76, "tps_std": 0.99, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 38.7, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1036.89, "tps_std": 9.24, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 44.2, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 510.38, "tps_std": 2.64, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 38.18, "tps_std": 1.71, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 576.25, "tps_std": 2.16, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 45.25, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 273.77, "tps_std": 0.3, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 36.71, "tps_std": 0.08, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 893.79, "tps_std": 4.74, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 46.05, "tps_std": 0.07, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 610.84, "tps_std": 1.99, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "model_clean": "Qwen3.6-35B-A3B-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 39.67, "tps_std": 0.15, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 35.8, "name_params_b": 34.66, "quant": "Q8_K_XL", "log": "results/Qwen3.6-35B-A3B-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 836.74, "tps_std": 6.15, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 22.95, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 619.85, "tps_std": 6.1, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 20.38, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 823.65, "tps_std": 83.54, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 22.67, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 628.14, "tps_std": 5.88, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 20.15, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 839.13, "tps_std": 7.61, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 20.75, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 646.67, "tps_std": 11.22, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 19.86, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 844.42, "tps_std": 19.66, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 22.69, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 546.66, "tps_std": 5.96, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 20.11, "tps_std": 0.07, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 117.96, "tps_std": 0.28, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 16.18, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 58.94, "tps_std": 0.07, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.26, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 376.52, "tps_std": 7.37, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.74, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 351.87, "tps_std": 1.49, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-BF16-00001-of-00002", "model_clean": "gemma-4-26B-A4B-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 13.71, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 47.02, "name_params_b": 25.23, "quant": "BF16", "log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1608.01, "tps_std": 5.26, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 47.13, "tps_std": 0.29, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 689.3, "tps_std": 12.21, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 37.14, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1299.9, "tps_std": 11.12, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 46.59, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 693.48, "tps_std": 4.74, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 36.76, "tps_std": 0.16, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1288.38, "tps_std": 10.85, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 45.58, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 721.84, "tps_std": 10.97, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 36.17, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1219.74, "tps_std": 15.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 46.57, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 600.42, "tps_std": 7.55, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 36.88, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 720.78, "tps_std": 2.94, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 50.21, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 100.79, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 35.41, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1213.78, "tps_std": 7.36, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 53.04, "tps_std": 0.1, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 638.76, "tps_std": 1.76, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 40.93, "tps_std": 0.09, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 15.9, "name_params_b": 25.23, "quant": "Q4_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1524.44, "tps_std": 7.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 41.68, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 689.36, "tps_std": 8.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 33.67, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1272.69, "tps_std": 74.5, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 41.31, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 696.25, "tps_std": 7.26, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 32.95, "tps_std": 0.77, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1303.32, "tps_std": 8.77, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 38.81, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 727.92, "tps_std": 8.62, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 32.52, "tps_std": 0.35, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1294.4, "tps_std": 31.54, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 41.09, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 596.78, "tps_std": 7.98, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 33.35, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 589.2, "tps_std": 1.79, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 43.18, "tps_std": 0.07, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 97.7, "tps_std": 0.1, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 31.82, "tps_std": 0.05, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 944.96, "tps_std": 19.24, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 43.58, "tps_std": 1.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 579.88, "tps_std": 0.09, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 35.52, "tps_std": 0.07, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 25.23, "file_size_gib": 25.94, "name_params_b": 25.23, "quant": "Q8_K_XL", "log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 380.58, "tps_std": 1.49, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.49, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 150.63, "tps_std": 1.53, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.17, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 377.93, "tps_std": 2.48, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.44, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 153.11, "tps_std": 1.83, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.18, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 360.84, "tps_std": 1.6, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.3, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 154.86, "tps_std": 2.16, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.14, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 373.84, "tps_std": 0.93, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.41, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 139.53, "tps_std": 1.98, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.16, "tps_std": 0.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 31.0, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": null }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 31.0, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": null }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 79.53, "tps_std": 0.26, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.5, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 60.29, "tps_std": 0.37, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-BF16-00001-of-00002", "model_clean": "gemma-4-31B-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.24, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 57.18, "name_params_b": 30.7, "quant": "BF16", "log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 293.27, "tps_std": 0.37, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 10.5, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 136.84, "tps_std": 1.27, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.11, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 310.54, "tps_std": 0.73, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 10.52, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 140.71, "tps_std": 1.29, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.11, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 309.22, "tps_std": 0.13, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 10.02, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 143.91, "tps_std": 1.64, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.81, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 315.72, "tps_std": 0.3, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 10.51, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 130.8, "tps_std": 1.45, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.2, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 69.12, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 10.71, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 31.0, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": null }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 244.46, "tps_std": 0.27, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 11.02, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 124.32, "tps_std": 1.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q4_K_XL", "model_clean": "gemma-4-31B-it-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.78, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 17.46, "name_params_b": 30.7, "quant": "Q4_K_XL", "log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 282.42, "tps_std": 0.4, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 6.16, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 132.6, "tps_std": 1.37, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.26, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 308.17, "tps_std": 0.62, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 6.16, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 138.85, "tps_std": 1.58, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.26, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 303.4, "tps_std": 0.23, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 6.07, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 141.37, "tps_std": 1.98, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.18, "tps_std": 0.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 319.75, "tps_std": 0.26, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 6.12, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 128.0, "tps_std": 1.3, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.3, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 72.26, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 6.28, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 31.0, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": null }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 209.2, "tps_std": 6.85, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 6.28, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 112.72, "tps_std": 1.26, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gemma-4-31B-it-UD-Q8_K_XL", "model_clean": "gemma-4-31B-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.49, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.7, "file_size_gib": 32.6, "name_params_b": 30.7, "quant": "Q8_K_XL", "log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 945.82, "tps_std": 60.17, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.25, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 311.38, "tps_std": 1.36, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 31.94, "tps_std": 7.16, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 634.64, "tps_std": 3.8, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 50.7, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 304.96, "tps_std": 1.71, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 35.84, "tps_std": 0.12, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 648.77, "tps_std": 4.37, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 49.76, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 439.58, "tps_std": 0.57, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 39.77, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 641.05, "tps_std": 2.79, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 50.73, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 305.81, "tps_std": 0.24, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 36.03, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 575.01, "tps_std": 3.11, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.2, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 214.22, "tps_std": 0.5, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 34.54, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 635.12, "tps_std": 4.23, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 56.31, "tps_std": 0.08, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 290.19, "tps_std": 1.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 42.28, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 2029.48, "tps_std": 6.68, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 72.53, "tps_std": 0.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 494.19, "tps_std": 1.26, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 51.81, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1631.69, "tps_std": 17.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 72.53, "tps_std": 0.1, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 490.56, "tps_std": 2.76, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 51.69, "tps_std": 0.16, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1694.78, "tps_std": 17.2, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 72.19, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 730.43, "tps_std": 1.15, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 57.22, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1635.73, "tps_std": 10.16, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 72.47, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 493.84, "tps_std": 1.85, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 52.05, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1306.44, "tps_std": 9.57, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 73.63, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 365.33, "tps_std": 0.21, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 49.83, "tps_std": 0.07, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1574.45, "tps_std": 16.63, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 79.03, "tps_std": 0.17, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 545.65, "tps_std": 0.37, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 60.7, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1512.85, "tps_std": 4.84, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 50.54, "tps_std": 0.15, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2_2-pr21344__fa1.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 163.39, "tps_std": 1.12, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2_2-pr21344", "env_base": "rocm", "env_variant": "7_2_2-pr21344", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.65, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2_2-pr21344__fa1__longctx32768.log", "rpc": false, "build": { "hash": "7957de9dc", "number": "8645" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1542.98, "tps_std": 7.94, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 50.52, "tps_std": 0.12, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2_2__fa1.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 162.64, "tps_std": 0.31, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2_2", "env_base": "rocm", "env_variant": "7_2_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.64, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "f53577432", "number": "8942" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1524.35, "tps_std": 2.98, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 50.78, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 196.44, "tps_std": 1.93, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.96, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1513.21, "tps_std": 2.79, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.41, "tps_std": 0.13, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 189.28, "tps_std": 0.4, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.62, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 326.38, "tps_std": 0.44, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 55.44, "tps_std": 0.11, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 145.14, "tps_std": 0.2, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 10.21, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1311.79, "tps_std": 0.38, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 55.59, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 210.35, "tps_std": 0.6, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.53, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "3f8752b55", "number": "8743" } } ] }