{ "meta": { "generated_at": "2026-03-30T06:55:07Z", "system_info": { "distro": "Fedora Linux 43 (Workstation Edition)", "kernel": "6.19.9-200.fc43.x86_64", "linux_firmware": "linux-firmware-20260309-1.fc43.noarch", "timestamp": "29 Mar 2026" }, "llamacpp_builds": [ { "hash": "2405d59cb", "number": "8577" }, { "hash": "e0c93af2a", "number": "7938" } ], "environments": [ "rocm-7_2", "rocm-7_2-hblt0", "rocm6_4_4", "rocm6_4_4-hblt0", "rocm7-nightlies", "rocm7-nightlies-hblt0", "vulkan_amdvlk", "vulkan_radv" ], "notes": "pp512 = prompt processing; tg128 = text generation; t/s = tokens/second" }, "runs": [ { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 78.37, "tps_std": 0.1, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.96, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 17.07, "tps_std": 0.06, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.07, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 78.3, "tps_std": 0.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.98, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 17.08, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.08, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 78.37, "tps_std": 0.13, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.76, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 17.56, "tps_std": 0.07, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.09, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 78.63, "tps_std": 0.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.8, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 17.58, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.08, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 80.49, "tps_std": 0.14, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.99, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 21.15, "tps_std": 0.06, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.07, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 78.97, "tps_std": 0.09, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.99, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 21.17, "tps_std": 0.28, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.07, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 123.0, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": null }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 123.0, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": null }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 47.2, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.99, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 7.39, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.6, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 435.72, "tps_std": 2.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 21.38, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 87.93, "tps_std": 0.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.33, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 403.83, "tps_std": 1.74, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 21.37, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 87.49, "tps_std": 0.23, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.33, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 393.19, "tps_std": 1.92, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 19.36, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 94.74, "tps_std": 0.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.06, "tps_std": 0.18, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 393.15, "tps_std": 2.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 21.11, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 94.55, "tps_std": 0.3, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.18, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 476.23, "tps_std": 2.21, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 21.36, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 86.79, "tps_std": 0.15, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.32, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 401.13, "tps_std": 5.52, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 21.35, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 85.92, "tps_std": 0.13, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.3, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 114.88, "tps_std": 0.15, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 10.48, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 10.15, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.05, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 342.11, "tps_std": 5.47, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 9.48, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 102.93, "tps_std": 0.11, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.82, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 905.79, "tps_std": 2.84, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 32.96, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 91.97, "tps_std": 0.19, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 20.58, "tps_std": 0.07, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 893.68, "tps_std": 28.19, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 33.2, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 91.83, "tps_std": 0.16, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 20.62, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 903.39, "tps_std": 1.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 31.04, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 99.84, "tps_std": 0.23, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 20.33, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 906.25, "tps_std": 1.64, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 32.57, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 100.07, "tps_std": 0.2, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 20.35, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 902.85, "tps_std": 59.94, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 33.16, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 89.75, "tps_std": 0.31, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 20.59, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 906.42, "tps_std": 2.57, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 33.18, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 89.99, "tps_std": 0.26, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 20.6, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 499.98, "tps_std": 1.29, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 39.01, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": null }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 853.46, "tps_std": 6.7, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 40.38, "tps_std": 1.22, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 133.27, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 21.17, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 673.71, "tps_std": 1.42, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.35, "tps_std": 0.17, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 160.3, "tps_std": 0.21, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.08, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 748.37, "tps_std": 4.67, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.42, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 165.11, "tps_std": 1.59, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.08, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 706.16, "tps_std": 3.76, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.39, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 166.61, "tps_std": 1.47, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.05, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 710.61, "tps_std": 4.31, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.39, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 161.22, "tps_std": 2.64, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.06, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 881.45, "tps_std": 3.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.44, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 213.5, "tps_std": 0.7, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.08, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 735.98, "tps_std": 5.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.44, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 205.29, "tps_std": 0.84, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.08, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 14.0, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1.log", "rpc": false, "build": null }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": 14.0, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": null }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 166.51, "tps_std": 0.62, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 7.94, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 72.65, "tps_std": 0.24, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.7, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 259.71, "tps_std": 1.51, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 15.74, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 302.29, "tps_std": 0.44, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.58, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 263.95, "tps_std": 1.57, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 16.02, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 305.52, "tps_std": 0.18, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.59, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 260.98, "tps_std": 1.56, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 15.6, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 324.69, "tps_std": 0.27, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.38, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 262.3, "tps_std": 1.42, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 15.86, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 324.11, "tps_std": 0.41, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.45, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 228.5, "tps_std": 1.06, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 16.07, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 284.43, "tps_std": 0.38, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.76, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 236.84, "tps_std": 1.32, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 16.04, "tps_std": 0.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 290.04, "tps_std": 0.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.76, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 140.84, "tps_std": 0.27, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 13.97, "tps_std": 0.05, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 106.21, "tps_std": 0.16, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 13.21, "tps_std": 0.32, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 190.66, "tps_std": 7.11, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.41, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 191.12, "tps_std": 0.46, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003", "model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 13.85, "tps_std": 0.26, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 120.67, "file_size_gib": 78.02, "name_params_b": 120.67, "quant": "Q4_K_XL", "log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 194.62, "tps_std": 1.88, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.64, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 49.93, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.41, "tps_std": 0.37, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 194.32, "tps_std": 1.84, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.8, "tps_std": 0.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 49.97, "tps_std": 0.14, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.63, "tps_std": 0.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 197.89, "tps_std": 1.84, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 12.96, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 70.32, "tps_std": 0.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.22, "tps_std": 0.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 198.04, "tps_std": 1.9, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 13.11, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 70.27, "tps_std": 0.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.02, "tps_std": 0.31, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 197.46, "tps_std": 1.16, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 15.31, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 48.93, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 10.34, "tps_std": 0.41, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 194.0, "tps_std": 1.99, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 15.33, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 49.33, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 10.46, "tps_std": 0.34, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 106.76, "tps_std": 0.77, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 16.49, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 26.54, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 9.57, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 158.81, "tps_std": 2.4, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 17.16, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 28.25, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 11.49, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 474.42, "tps_std": 2.29, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 25.36, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 189.58, "tps_std": 0.12, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 18.53, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 479.78, "tps_std": 2.72, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 25.37, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 180.26, "tps_std": 0.37, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 18.54, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 556.96, "tps_std": 2.81, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 23.05, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 238.1, "tps_std": 0.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 18.26, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 556.8, "tps_std": 4.26, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 25.16, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 237.85, "tps_std": 0.37, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 18.46, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 503.77, "tps_std": 3.42, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 25.54, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 182.59, "tps_std": 0.07, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 18.25, "tps_std": 1.21, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 482.99, "tps_std": 0.86, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 25.49, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 175.78, "tps_std": 0.14, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 18.94, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 171.39, "tps_std": 0.81, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 10.48, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 73.62, "tps_std": 0.08, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.49, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 369.06, "tps_std": 2.58, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 9.38, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 140.81, "tps_std": 0.52, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.24, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 994.33, "tps_std": 11.86, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 55.87, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 209.15, "tps_std": 0.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 30.88, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 994.22, "tps_std": 10.06, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 55.84, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 208.93, "tps_std": 0.21, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 30.9, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1009.37, "tps_std": 9.64, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 53.13, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 285.49, "tps_std": 0.18, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 30.53, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1012.69, "tps_std": 9.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 54.94, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 285.25, "tps_std": 0.16, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 30.5, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1023.24, "tps_std": 11.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 56.92, "tps_std": 0.17, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 206.37, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 31.69, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1012.11, "tps_std": 7.91, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 56.92, "tps_std": 0.21, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 205.56, "tps_std": 0.23, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 31.62, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 828.53, "tps_std": 4.66, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 63.31, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 110.5, "tps_std": 0.14, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 25.87, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1145.66, "tps_std": 9.68, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 68.15, "tps_std": 0.11, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 193.03, "tps_std": 0.86, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 34.02, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1149.31, "tps_std": 13.28, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 67.72, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 212.38, "tps_std": 0.33, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 33.49, "tps_std": 0.23, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1149.83, "tps_std": 7.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 68.05, "tps_std": 0.68, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 212.45, "tps_std": 0.21, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 33.52, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1170.01, "tps_std": 7.53, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 65.12, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 291.28, "tps_std": 0.14, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 32.65, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1167.76, "tps_std": 7.7, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 64.97, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 290.12, "tps_std": 2.48, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 32.65, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1178.27, "tps_std": 10.86, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 69.46, "tps_std": 0.62, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 209.14, "tps_std": 0.1, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 34.83, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1172.23, "tps_std": 12.92, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 69.65, "tps_std": 0.62, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 209.05, "tps_std": 0.22, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 34.76, "tps_std": 0.25, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 882.98, "tps_std": 3.84, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 80.84, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 111.65, "tps_std": 0.08, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 28.03, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1290.5, "tps_std": 7.83, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 83.79, "tps_std": 0.18, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 194.26, "tps_std": 0.86, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 37.04, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 613.58, "tps_std": 2.84, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 29.81, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 447.94, "tps_std": 2.75, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 26.06, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 583.48, "tps_std": 105.06, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 29.85, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 439.93, "tps_std": 32.65, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 26.09, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 627.46, "tps_std": 3.12, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 28.02, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 527.78, "tps_std": 1.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 26.22, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 623.64, "tps_std": 17.23, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 29.16, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 512.14, "tps_std": 3.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 26.33, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 622.47, "tps_std": 8.34, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 29.93, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 443.0, "tps_std": 30.64, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 26.97, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 600.08, "tps_std": 13.59, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 29.99, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 457.86, "tps_std": 1.53, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 27.08, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 396.36, "tps_std": 1.71, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 30.9, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 208.44, "tps_std": 0.64, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 26.08, "tps_std": 0.05, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 500.88, "tps_std": 3.3, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 31.74, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 420.42, "tps_std": 0.15, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003", "model_clean": "Qwen3-Coder-Next-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 28.05, "tps_std": 0.05, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.94, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Coder-Next-UD-Q8_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 629.03, "tps_std": 5.19, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 31.37, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 439.65, "tps_std": 0.69, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 27.25, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 648.58, "tps_std": 5.44, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 30.86, "tps_std": 0.77, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 457.6, "tps_std": 1.26, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 27.22, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 634.72, "tps_std": 6.93, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 29.9, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 511.83, "tps_std": 7.51, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 27.45, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 632.78, "tps_std": 59.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 30.53, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 507.17, "tps_std": 2.44, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 27.44, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 621.13, "tps_std": 82.64, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 31.52, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 467.56, "tps_std": 0.55, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 28.26, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 661.07, "tps_std": 5.8, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 31.54, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 432.86, "tps_std": 0.82, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 28.2, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 436.5, "tps_std": 7.59, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 34.72, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 218.02, "tps_std": 0.85, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 28.5, "tps_std": 0.07, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 587.86, "tps_std": 37.36, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 36.28, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 453.76, "tps_std": 0.75, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 31.67, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 305.11, "tps_std": 1.38, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 19.18, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 246.59, "tps_std": 0.45, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 16.49, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 313.18, "tps_std": 2.32, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 19.62, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 243.74, "tps_std": 1.45, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 16.51, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 311.68, "tps_std": 1.84, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 18.77, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 273.72, "tps_std": 1.22, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 17.91, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 306.06, "tps_std": 2.55, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 19.25, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 270.84, "tps_std": 0.74, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 17.98, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 314.27, "tps_std": 4.13, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 19.66, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 235.12, "tps_std": 5.24, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 18.36, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 310.73, "tps_std": 1.65, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 19.61, "tps_std": 0.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 241.56, "tps_std": 5.74, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 18.35, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 183.05, "tps_std": 1.84, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 21.31, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 102.85, "tps_std": 0.15, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 18.76, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 239.56, "tps_std": 7.45, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 21.68, "tps_std": 0.38, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 203.34, "tps_std": 0.47, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003", "model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 20.09, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 122.11, "file_size_gib": 85.6, "name_params_b": 122.11, "quant": "Q5_K_XL", "log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 508.43, "tps_std": 3.18, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 23.65, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 423.84, "tps_std": 0.73, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 21.64, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 512.17, "tps_std": 3.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 23.69, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 382.51, "tps_std": 1.54, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 21.63, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 544.11, "tps_std": 3.06, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 21.4, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 407.19, "tps_std": 1.96, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 21.59, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 550.28, "tps_std": 3.67, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 23.23, "tps_std": 0.18, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 405.13, "tps_std": 1.85, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 21.72, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 541.57, "tps_std": 11.33, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 23.69, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 441.64, "tps_std": 9.63, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 22.18, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 509.57, "tps_std": 8.2, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 23.78, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 379.36, "tps_std": 1.33, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 22.2, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 122.56, "tps_std": 0.4, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 11.56, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 97.32, "tps_std": 0.17, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 10.95, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 309.96, "tps_std": 4.2, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 10.79, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 258.85, "tps_std": 0.77, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3.5-35B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 10.39, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 64.6, "name_params_b": 34.66, "quant": "BF16", "log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1071.38, "tps_std": 11.2, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 47.78, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 669.09, "tps_std": 1.13, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 40.19, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1093.96, "tps_std": 6.37, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 47.95, "tps_std": 0.3, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 661.4, "tps_std": 0.76, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 40.13, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1079.44, "tps_std": 6.76, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 46.46, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 762.29, "tps_std": 2.68, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 40.46, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1082.35, "tps_std": 6.79, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 46.48, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 777.89, "tps_std": 1.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 40.24, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1092.86, "tps_std": 9.42, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 48.16, "tps_std": 0.3, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 655.39, "tps_std": 2.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 41.9, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1113.86, "tps_std": 6.42, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 48.1, "tps_std": 0.31, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 655.89, "tps_std": 1.47, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 41.98, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 661.63, "tps_std": 3.14, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 58.16, "tps_std": 0.08, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 288.86, "tps_std": 0.53, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 44.24, "tps_std": 0.09, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1013.4, "tps_std": 39.22, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 59.13, "tps_std": 0.07, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 673.55, "tps_std": 0.64, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 48.93, "tps_std": 0.13, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 34.66, "file_size_gib": 20.7, "name_params_b": 34.66, "quant": "Q4_K_XL", "log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 854.2, "tps_std": 6.85, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.2, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 392.45, "tps_std": 16.97, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 11.63, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 877.69, "tps_std": 1.71, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.19, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 387.73, "tps_std": 18.58, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 11.63, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 869.53, "tps_std": 1.47, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.15, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 260.25, "tps_std": 4.3, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 11.6, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 870.35, "tps_std": 1.54, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.15, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 263.85, "tps_std": 5.85, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 11.61, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 892.78, "tps_std": 1.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.19, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 441.92, "tps_std": 38.71, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 11.63, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 895.09, "tps_std": 0.81, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.19, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 449.4, "tps_std": 28.98, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 11.63, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 122.72, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.31, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 107.34, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 11.32, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 513.78, "tps_std": 16.1, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.07, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 258.63, "tps_std": 1.57, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 11.53, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 324.28, "tps_std": 1.23, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.97, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 166.64, "tps_std": 2.06, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.7, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 455.07, "tps_std": 0.55, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.97, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 188.26, "tps_std": 1.59, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.7, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 426.08, "tps_std": 0.81, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.83, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 209.69, "tps_std": 3.55, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.68, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 440.33, "tps_std": 0.38, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.96, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 202.85, "tps_std": 0.64, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.69, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 466.09, "tps_std": 1.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.98, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 182.83, "tps_std": 1.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.68, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 452.21, "tps_std": 1.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.98, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 181.81, "tps_std": 3.26, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.7, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": null }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": null }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 91.65, "tps_std": 0.4, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.98, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 81.52, "tps_std": 0.33, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.73, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 2700.94, "tps_std": 1.79, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 77.69, "tps_std": 0.66, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 1564.27, "tps_std": 18.55, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 56.8, "tps_std": 0.48, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 2691.0, "tps_std": 4.6, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 77.86, "tps_std": 0.64, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 1563.05, "tps_std": 19.77, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 56.95, "tps_std": 0.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 2719.77, "tps_std": 6.47, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 73.32, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 1687.79, "tps_std": 33.87, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 54.09, "tps_std": 0.16, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 2713.06, "tps_std": 9.07, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 72.85, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 1681.29, "tps_std": 17.71, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 54.11, "tps_std": 0.29, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 2666.49, "tps_std": 3.29, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 78.31, "tps_std": 0.89, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 1530.18, "tps_std": 18.45, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 57.72, "tps_std": 0.36, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 2674.53, "tps_std": 5.86, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 78.93, "tps_std": 0.64, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 1534.58, "tps_std": 20.23, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 57.65, "tps_std": 0.44, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 647.4, "tps_std": 0.53, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 79.07, "tps_std": 0.08, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 455.63, "tps_std": 1.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 54.86, "tps_std": 0.17, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 2479.97, "tps_std": 41.4, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 87.24, "tps_std": 0.13, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 1759.67, "tps_std": 6.72, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 64.91, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 631.59, "tps_std": 4.27, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 50.91, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 303.63, "tps_std": 0.57, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 36.07, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 610.41, "tps_std": 53.09, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.34, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 302.82, "tps_std": 1.3, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 36.12, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 648.44, "tps_std": 6.33, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 49.85, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 442.64, "tps_std": 0.84, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 39.69, "tps_std": 0.34, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 639.43, "tps_std": 31.93, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 50.99, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 438.75, "tps_std": 1.06, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 39.75, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 596.69, "tps_std": 97.42, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.38, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 308.13, "tps_std": 1.66, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 35.43, "tps_std": 8.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 641.07, "tps_std": 11.17, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.35, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 314.5, "tps_std": 0.28, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 40.04, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 576.81, "tps_std": 2.43, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.18, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 213.74, "tps_std": 0.68, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 34.52, "tps_std": 0.07, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 633.21, "tps_std": 13.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 56.15, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 287.49, "tps_std": 1.21, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 42.67, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1638.53, "tps_std": 13.5, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 72.67, "tps_std": 0.07, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 488.89, "tps_std": 0.54, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 51.91, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1631.29, "tps_std": 15.38, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 72.62, "tps_std": 0.09, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 492.09, "tps_std": 1.86, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 51.93, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1691.01, "tps_std": 16.68, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 72.07, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 730.11, "tps_std": 1.16, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 57.02, "tps_std": 0.07, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1690.3, "tps_std": 13.53, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 72.0, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 730.49, "tps_std": 1.2, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 56.89, "tps_std": 0.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1668.5, "tps_std": 13.61, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 72.68, "tps_std": 0.1, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 507.77, "tps_std": 2.81, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 57.46, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1642.7, "tps_std": 14.12, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 72.75, "tps_std": 0.1, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 507.84, "tps_std": 1.97, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 57.32, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1303.99, "tps_std": 6.84, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 73.68, "tps_std": 0.08, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 364.73, "tps_std": 0.33, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 49.99, "tps_std": 0.21, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1577.96, "tps_std": 12.64, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 78.94, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 541.12, "tps_std": 0.2, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 60.77, "tps_std": 0.08, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1543.27, "tps_std": 2.63, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 50.61, "tps_std": 0.14, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 165.68, "tps_std": 0.88, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.65, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1539.48, "tps_std": 5.61, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 50.57, "tps_std": 0.15, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 166.31, "tps_std": 1.47, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.65, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1528.37, "tps_std": 6.4, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.14, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 196.35, "tps_std": 2.62, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.97, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1521.12, "tps_std": 5.74, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.22, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 196.03, "tps_std": 1.28, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.97, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1507.68, "tps_std": 1.23, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.41, "tps_std": 0.14, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 206.97, "tps_std": 1.96, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.62, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1508.58, "tps_std": 2.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.44, "tps_std": 0.15, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 206.54, "tps_std": 0.91, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.62, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 324.82, "tps_std": 0.45, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 55.43, "tps_std": 0.14, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 144.29, "tps_std": 1.09, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 10.2, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1313.97, "tps_std": 1.29, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 55.59, "tps_std": 0.05, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 208.18, "tps_std": 2.24, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.52, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": 0, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "2405d59cb", "number": "8577" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 18.17, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.73, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 97.96, "tps_std": 0.29, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 9.09, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 17.22, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.72, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 73.57, "tps_std": 0.23, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 9.02, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 18.79, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 4.13, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 99.24, "tps_std": 0.14, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.55, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 18.8, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 4.1, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 99.22, "tps_std": 0.25, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.55, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 18.35, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.69, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 99.58, "tps_std": 0.65, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 9.04, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 17.17, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.67, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 72.73, "tps_std": 0.53, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 9.05, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": false, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": false, "error_type": null, "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__vulkan_amdvlk__longctx32768__rpc.log", "rpc": true, "build": null }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": false, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": false, "error_type": null, "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__vulkan_amdvlk__rpc.log", "rpc": true, "build": null }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": false, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__vulkan_radv__longctx32768__rpc.log", "rpc": true, "build": null }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": false, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__vulkan_radv__rpc.log", "rpc": true, "build": null }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 58.89, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.92, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 158.25, "tps_std": 0.52, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 19.04, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 59.95, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.91, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 159.79, "tps_std": 0.35, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 19.05, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 64.41, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.41, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 169.3, "tps_std": 0.95, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 18.93, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 65.69, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.47, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 169.5, "tps_std": 1.04, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 18.89, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 60.88, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.1, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 171.03, "tps_std": 0.56, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 18.98, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 60.78, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.1, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 173.91, "tps_std": 0.29, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 19.05, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": false, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "load", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__vulkan_amdvlk__longctx32768__rpc.log", "rpc": true, "build": null }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": false, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": false, "error_type": null, "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__vulkan_amdvlk__rpc.log", "rpc": true, "build": null }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": false, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": false, "error_type": null, "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__vulkan_radv__longctx32768__rpc.log", "rpc": true, "build": null }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": false, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": false, "error_type": null, "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__vulkan_radv__rpc.log", "rpc": true, "build": null } ] }