{ "meta": { "generated_at": "2026-02-09T13:29:25Z", "system_info": { "distro": "Fedora Linux 43 (Workstation Edition)", "kernel": "6.18.5-200.fc43.x86_64", "linux_firmware": "linux-firmware-20260110-1.fc43.noarch", "timestamp": "04 Feb 2026" }, "llamacpp_builds": [ { "hash": "e0c93af2a", "number": "7938" } ], "environments": [ "rocm-7_2", "rocm-7_2-hblt0", "rocm6_4_4", "rocm6_4_4-hblt0", "rocm7-nightlies", "rocm7-nightlies-hblt0", "vulkan_amdvlk", "vulkan_radv" ], "notes": "pp512 = prompt processing; tg128 = text generation; t/s = tokens/second" }, "runs": [ { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 72.93, "tps_std": 0.06, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.95, "tps_std": 0.06, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 16.57, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.08, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 71.58, "tps_std": 0.06, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.99, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 16.48, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.07, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 79.51, "tps_std": 0.07, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.72, "tps_std": 0.1, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 17.57, "tps_std": 0.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.15, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 79.24, "tps_std": 0.1, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.67, "tps_std": 0.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 17.53, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.15, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 78.28, "tps_std": 0.06, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.98, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 17.18, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.06, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 80.59, "tps_std": 0.1, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.99, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 17.27, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.07, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 17.65, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.0, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 4.94, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 1.69, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 54.76, "tps_std": 11.46, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.0, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 7.15, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002", "model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.27, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 125.03, "file_size_gib": 70.31, "name_params_b": 125.03, "quant": "Q4_K_XL", "log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 454.95, "tps_std": 1.9, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 22.26, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 94.79, "tps_std": 0.56, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 16.48, "tps_std": 0.09, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 425.21, "tps_std": 1.79, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 23.41, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 93.83, "tps_std": 0.4, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 16.55, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 407.15, "tps_std": 2.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 21.51, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 101.09, "tps_std": 0.37, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 16.23, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 414.23, "tps_std": 2.09, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 23.11, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 100.06, "tps_std": 0.38, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 15.97, "tps_std": 0.45, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 489.62, "tps_std": 3.63, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 23.4, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 92.48, "tps_std": 1.13, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 16.5, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 425.86, "tps_std": 2.29, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 23.41, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 92.06, "tps_std": 0.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 16.51, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 106.42, "tps_std": 0.08, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 10.87, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 6.09, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.28, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 333.1, "tps_std": 6.48, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 9.51, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 78.99, "tps_std": 0.25, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-BF16-00001-of-00002", "model_clean": "GLM-4.7-Flash-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.13, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 55.79, "name_params_b": 29.94, "quant": "BF16", "log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 398.34, "tps_std": 1.32, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 35.94, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 90.22, "tps_std": 4.88, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 22.35, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 398.87, "tps_std": 1.21, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 36.09, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 92.13, "tps_std": 0.15, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 21.56, "tps_std": 1.34, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 947.86, "tps_std": 2.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 33.77, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 84.85, "tps_std": 1.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 21.89, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 952.84, "tps_std": 2.21, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 35.23, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 84.01, "tps_std": 0.58, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 21.97, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 983.72, "tps_std": 3.21, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 36.2, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 80.32, "tps_std": 1.28, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 22.31, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 955.1, "tps_std": 4.53, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 36.16, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 81.34, "tps_std": 1.8, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 22.32, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 368.78, "tps_std": 0.17, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 40.8, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 6.35, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 18.75, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 877.18, "tps_std": 8.15, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 40.07, "tps_std": 0.78, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 90.27, "tps_std": 0.42, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.7-Flash-UD-Q8_K_XL", "model_clean": "GLM-4.7-Flash-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 23.07, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 29.94, "file_size_gib": 32.7, "name_params_b": 29.94, "quant": "Q8_K_XL", "log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 48.83, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.78, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 29.25, "tps_std": 0.17, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.45, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 49.38, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.79, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 29.17, "tps_std": 0.18, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.46, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 146.04, "tps_std": 0.21, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.78, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 36.22, "tps_std": 0.16, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.43, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 146.83, "tps_std": 0.25, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.78, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 36.4, "tps_std": 0.23, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.46, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 155.06, "tps_std": 0.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.79, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 38.36, "tps_std": 0.61, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.46, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 151.7, "tps_std": 0.21, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.78, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 38.35, "tps_std": 0.67, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.46, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 21.74, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.81, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 8.35, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.36, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 99.39, "tps_std": 0.58, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 2.76, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 11.79, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Llama-3.3-70B-Instruct-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 2.44, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 70.55, "file_size_gib": 75.65, "name_params_b": 70.55, "quant": "Q8_K_XL", "log": "results/Llama-3.3-70B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 800.17, "tps_std": 1.72, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.49, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 169.18, "tps_std": 1.16, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.11, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 803.22, "tps_std": 2.21, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.49, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 170.11, "tps_std": 0.81, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.11, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 764.18, "tps_std": 1.66, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.48, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 166.22, "tps_std": 1.2, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.1, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 766.68, "tps_std": 1.07, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.48, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 164.84, "tps_std": 1.99, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.1, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 990.88, "tps_std": 3.15, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.5, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 172.42, "tps_std": 3.61, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.1, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 799.71, "tps_std": 2.09, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.49, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 170.19, "tps_std": 1.69, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 7.1, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 19.7, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.24, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 16.69, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.41, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 222.01, "tps_std": 0.94, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 7.59, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 76.47, "tps_std": 0.38, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Ministral-3-14B-Instruct-2512-BF16", "model_clean": "Ministral-3-14B-Instruct-2512-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.39, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 13.51, "file_size_gib": 25.16, "name_params_b": 13.51, "quant": "BF16", "log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 393.61, "tps_std": 2.94, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 42.58, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 562.85, "tps_std": 0.47, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 40.59, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 388.54, "tps_std": 2.76, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 42.61, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 564.71, "tps_std": 0.81, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 40.6, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1026.87, "tps_std": 6.06, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 41.9, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 1042.36, "tps_std": 2.24, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 40.08, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1027.41, "tps_std": 6.28, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 42.05, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 1038.86, "tps_std": 3.17, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 40.04, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1070.15, "tps_std": 5.54, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 42.56, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 908.79, "tps_std": 27.38, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 40.91, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1038.67, "tps_std": 2.82, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 42.57, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 821.93, "tps_std": 29.4, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 40.92, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 676.59, "tps_std": 50.83, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 47.22, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 342.52, "tps_std": 0.46, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 35.25, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 951.76, "tps_std": 41.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 46.68, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 799.39, "tps_std": 0.69, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "model_clean": "Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 41.15, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 31.58, "file_size_gib": 37.66, "name_params_b": 31.58, "quant": "Q8_K_XL", "log": "results/Nemotron-3-Nano-30B-A3B-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 202.36, "tps_std": 3.5, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 15.8, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 41.36, "tps_std": 0.87, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 9.65, "tps_std": 0.3, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 200.1, "tps_std": 8.37, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 16.04, "tps_std": 0.06, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 41.53, "tps_std": 0.41, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 9.5, "tps_std": 0.75, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 205.05, "tps_std": 3.62, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.98, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 51.11, "tps_std": 0.62, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 9.63, "tps_std": 0.07, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 203.41, "tps_std": 3.52, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 15.0, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 51.19, "tps_std": 0.64, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 9.58, "tps_std": 0.1, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 200.04, "tps_std": 4.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 16.19, "tps_std": 0.09, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 41.42, "tps_std": 0.37, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 10.94, "tps_std": 0.42, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 197.48, "tps_std": 10.8, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 16.2, "tps_std": 0.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 41.6, "tps_std": 0.36, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 10.81, "tps_std": 0.61, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 119.82, "tps_std": 3.3, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 17.75, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 27.41, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.42, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 133.28, "tps_std": 1.45, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 15.98, "tps_std": 0.25, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 30.79, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003", "model_clean": "Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.5, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 235.09, "file_size_gib": 96.99, "name_params_b": 235.09, "quant": "Q3_K_XL", "log": "results/Qwen3-235B-A22B-Instruct-2507-UD-Q3_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 489.11, "tps_std": 2.88, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 27.18, "tps_std": 0.16, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 214.97, "tps_std": 1.13, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 18.57, "tps_std": 1.4, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 492.32, "tps_std": 2.55, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 27.23, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 207.64, "tps_std": 0.55, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 18.84, "tps_std": 0.97, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 576.03, "tps_std": 3.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 26.12, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 249.94, "tps_std": 1.13, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 19.18, "tps_std": 0.33, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 569.42, "tps_std": 8.52, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 27.07, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 250.24, "tps_std": 0.88, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 18.77, "tps_std": 0.98, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 512.1, "tps_std": 4.69, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 27.27, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 216.18, "tps_std": 0.74, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 19.71, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 493.72, "tps_std": 3.45, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 27.32, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 209.02, "tps_std": 0.16, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 19.67, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 168.95, "tps_std": 7.69, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 10.62, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 75.04, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.68, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 351.97, "tps_std": 2.56, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 9.42, "tps_std": 0.21, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 127.67, "tps_std": 0.45, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-BF16-00001-of-00002", "model_clean": "Qwen3-30B-A3B-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.31, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 56.89, "name_params_b": 30.53, "quant": "BF16", "log": "results/Qwen3-30B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 815.37, "tps_std": 5.82, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 58.54, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 170.56, "tps_std": 4.38, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 31.3, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 811.39, "tps_std": 6.56, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 58.57, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 171.54, "tps_std": 4.45, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 31.29, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1078.99, "tps_std": 11.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 56.45, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 217.17, "tps_std": 8.71, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 30.94, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1080.52, "tps_std": 10.73, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 57.49, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 218.42, "tps_std": 7.66, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 30.96, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1056.78, "tps_std": 36.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 59.15, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 175.4, "tps_std": 4.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 31.98, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1039.16, "tps_std": 53.94, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 59.16, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 174.67, "tps_std": 4.22, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 31.98, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 823.08, "tps_std": 48.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 66.14, "tps_std": 0.02, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 112.99, "tps_std": 0.13, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 27.35, "tps_std": 0.07, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1064.73, "tps_std": 70.49, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 68.93, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 152.3, "tps_std": 3.42, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "model_clean": "Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 34.18, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 24.53, "name_params_b": 30.53, "quant": "Q6_K_XL", "log": "results/Qwen3-30B-A3B-Instruct-2507-UD-Q6_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1209.23, "tps_std": 7.46, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 71.48, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 177.01, "tps_std": 5.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 34.4, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1207.91, "tps_std": 9.78, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 71.48, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 175.56, "tps_std": 3.86, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 34.37, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1263.87, "tps_std": 7.23, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 68.78, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 222.2, "tps_std": 8.55, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 33.48, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1260.69, "tps_std": 6.89, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 68.94, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 222.34, "tps_std": 7.55, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 33.52, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1241.85, "tps_std": 15.18, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 72.57, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 176.98, "tps_std": 4.28, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 35.43, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1229.55, "tps_std": 20.23, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 72.45, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 176.47, "tps_std": 4.18, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 35.44, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 846.24, "tps_std": 47.6, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 86.32, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 114.18, "tps_std": 0.07, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 30.07, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1005.9, "tps_std": 6.1, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 79.55, "tps_std": 6.96, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 153.83, "tps_std": 3.76, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 37.44, "tps_std": 0.05, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 30.53, "file_size_gib": 17.35, "name_params_b": 30.53, "quant": "Q4_K_M", "log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 193.67, "tps_std": 2.12, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 28.98, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 217.45, "tps_std": 0.19, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 23.87, "tps_std": 3.54, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 263.91, "tps_std": 3.82, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 28.97, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 296.64, "tps_std": 0.5, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 23.44, "tps_std": 4.28, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 592.54, "tps_std": 4.38, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 27.45, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 449.68, "tps_std": 1.06, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 25.1, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 592.83, "tps_std": 4.39, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 27.75, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 448.82, "tps_std": 1.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 25.07, "tps_std": 0.35, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 282.6, "tps_std": 2.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 28.89, "tps_std": 0.2, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 238.71, "tps_std": 0.62, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 23.93, "tps_std": 4.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 590.03, "tps_std": 3.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 28.73, "tps_std": 0.52, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 413.78, "tps_std": 0.61, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 23.54, "tps_std": 3.3, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 426.39, "tps_std": 3.26, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 31.84, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 228.41, "tps_std": 1.5, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 22.47, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 509.22, "tps_std": 20.34, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 29.92, "tps_std": 0.05, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 370.94, "tps_std": 32.12, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002", "model_clean": "Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 26.0, "tps_std": 0.2, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 79.67, "file_size_gib": 86.68, "name_params_b": 79.67, "quant": "Q8_K_XL", "log": "results/Qwen3-Next-80B-A3B-Instruct-UD-Q8_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 323.33, "tps_std": 0.27, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.24, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 232.79, "tps_std": 5.34, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 11.65, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 324.44, "tps_std": 0.31, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.24, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 229.19, "tps_std": 6.79, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 11.66, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 936.69, "tps_std": 1.33, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.23, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 258.34, "tps_std": 1.81, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 11.63, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 935.37, "tps_std": 1.09, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.2, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 261.44, "tps_std": 5.27, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 11.62, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 943.63, "tps_std": 1.62, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.25, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 396.59, "tps_std": 26.74, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 11.65, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 942.52, "tps_std": 1.34, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.25, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 376.68, "tps_std": 9.34, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 11.65, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 125.5, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.45, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 111.11, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 11.4, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 687.05, "tps_std": 0.75, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 14.14, "tps_std": 0.01, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 376.92, "tps_std": 18.46, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-12b-it-UD-Q8_K_XL", "model_clean": "gemma-3-12b-it-UD-Q8_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 11.72, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 11.77, "file_size_gib": 13.4, "name_params_b": 11.77, "quant": "Q8_K_XL", "log": "results/gemma-3-12b-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 463.92, "tps_std": 1.19, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 4.02, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 191.32, "tps_std": 3.3, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.68, "tps_std": 0.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 528.0, "tps_std": 0.44, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 4.02, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 201.67, "tps_std": 1.78, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.74, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 508.08, "tps_std": 0.85, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 4.0, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 222.44, "tps_std": 2.25, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.72, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 508.48, "tps_std": 0.88, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 4.0, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 220.03, "tps_std": 0.98, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.72, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 549.57, "tps_std": 2.42, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 4.02, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 215.98, "tps_std": 0.94, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.73, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 529.01, "tps_std": 0.98, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 4.02, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 204.92, "tps_std": 2.92, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.73, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 9.32, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.87, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 9.2, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.6, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 123.07, "tps_std": 0.27, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 3.92, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 82.96, "tps_std": 0.72, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-27b-it-BF16-00001-of-00002", "model_clean": "gemma-3-27b-it-BF16", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.66, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 27.01, "file_size_gib": 50.31, "name_params_b": 27.01, "quant": "BF16", "log": "results/gemma-3-27b-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 2870.77, "tps_std": 12.89, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 84.57, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 1639.03, "tps_std": 15.14, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 61.51, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 2807.93, "tps_std": 16.33, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 84.66, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 1262.15, "tps_std": 24.34, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 61.54, "tps_std": 0.04, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 2891.85, "tps_std": 2.6, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 82.18, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 1600.62, "tps_std": 30.98, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 60.21, "tps_std": 0.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 2893.75, "tps_std": 3.92, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 82.15, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 1419.18, "tps_std": 40.21, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 60.24, "tps_std": 0.11, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 2805.65, "tps_std": 13.25, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 85.35, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 1215.66, "tps_std": 10.33, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 62.02, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 2800.57, "tps_std": 47.75, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 85.47, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 1214.2, "tps_std": 13.26, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 62.03, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 657.19, "tps_std": 0.41, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 86.55, "tps_std": 0.1, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 493.7, "tps_std": 0.98, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 58.57, "tps_std": 0.11, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1977.82, "tps_std": 204.87, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 91.09, "tps_std": 3.96, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 1149.92, "tps_std": 30.21, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gemma-3-4b-it-Q3_K_S", "model_clean": "gemma-3-4b-it-Q3_K_S", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 67.86, "tps_std": 0.22, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 3.88, "file_size_gib": 1.8, "name_params_b": 3.88, "quant": "Q3_K_S", "log": "results/gemma-3-4b-it-Q3_K_S__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 181.09, "tps_std": 1.36, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.77, "tps_std": 0.73, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 217.33, "tps_std": 0.32, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 36.51, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 181.23, "tps_std": 1.39, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 52.06, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 218.3, "tps_std": 0.1, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 34.08, "tps_std": 4.33, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 681.58, "tps_std": 4.94, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 50.85, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 396.76, "tps_std": 35.92, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 40.13, "tps_std": 0.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 678.97, "tps_std": 4.29, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.88, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 400.64, "tps_std": 35.51, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 37.97, "tps_std": 3.34, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 649.28, "tps_std": 39.54, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 52.0, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 259.94, "tps_std": 5.81, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 40.3, "tps_std": 0.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 666.65, "tps_std": 12.5, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 52.05, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 261.35, "tps_std": 6.47, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 40.36, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 643.04, "tps_std": 39.69, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 54.0, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 195.45, "tps_std": 2.65, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 37.02, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 597.02, "tps_std": 9.82, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 57.38, "tps_std": 0.04, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 278.37, "tps_std": 7.19, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-120b-mxfp4-00001-of-00003", "model_clean": "gpt-oss-120b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 42.78, "tps_std": 0.09, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 116.83, "file_size_gib": 59.02, "name_params_b": 116.83, "quant": "MXFP4", "log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 547.85, "tps_std": 6.58, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 73.52, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 402.32, "tps_std": 0.67, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 52.5, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 546.41, "tps_std": 6.71, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 73.52, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 402.65, "tps_std": 1.5, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 52.58, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1779.88, "tps_std": 16.15, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 73.26, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 583.3, "tps_std": 9.18, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 57.85, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1785.44, "tps_std": 15.68, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 73.22, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 600.15, "tps_std": 13.61, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 57.78, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1742.62, "tps_std": 12.05, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 73.51, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 428.95, "tps_std": 5.63, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 57.82, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1730.96, "tps_std": 9.7, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 73.53, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 425.86, "tps_std": 3.58, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 57.9, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1300.97, "tps_std": 78.99, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 77.58, "tps_std": 0.03, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 337.8, "tps_std": 4.4, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 53.06, "tps_std": 0.1, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1397.71, "tps_std": 70.15, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 80.99, "tps_std": 0.06, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 416.91, "tps_std": 7.9, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "gpt-oss-20b-mxfp4", "model_clean": "gpt-oss-20b-mxfp4", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 60.56, "tps_std": 0.77, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 20.91, "file_size_gib": 11.27, "name_params_b": 20.91, "quant": "MXFP4", "log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 549.58, "tps_std": 0.25, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 50.55, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 144.34, "tps_std": 1.03, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.6, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 548.97, "tps_std": 0.14, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 50.52, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 143.7, "tps_std": 0.31, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.6, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm-7_2__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1597.02, "tps_std": 1.89, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.01, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 193.62, "tps_std": 1.29, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.93, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1598.36, "tps_std": 1.08, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.01, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 191.18, "tps_std": 2.26, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.94, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm6_4_4__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1590.62, "tps_std": 1.92, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.17, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 210.19, "tps_std": 4.57, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.56, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1590.4, "tps_std": 2.71, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 51.21, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__hblt0__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 216.78, "tps_std": 3.22, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.56, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__rocm7-nightlies__hblt0__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 349.95, "tps_std": 0.3, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 56.0, "tps_std": 0.22, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 152.53, "tps_std": 0.11, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 9.29, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 1355.55, "tps_std": 2.34, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 55.88, "tps_std": 0.13, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 246.2, "tps_std": 1.24, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "llama-2-7b.Q4_0", "model_clean": "llama-2-7b.Q4_0", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 8.76, "tps_std": 0.0, "error": false, "error_type": null, "backend": "Vulkan", "ngl": 99, "mmap": null, "params_b": 6.74, "file_size_gib": 3.56, "name_params_b": 6.74, "quant": "Q4_0", "log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx32768.log", "rpc": false, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 18.17, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.73, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 97.96, "tps_std": 0.29, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 9.09, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 17.22, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.72, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 73.57, "tps_std": 0.23, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 9.02, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm-7_2__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 18.79, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 4.13, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 99.24, "tps_std": 0.14, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.55, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 18.8, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 4.1, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 99.22, "tps_std": 0.25, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 8.55, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm6_4_4__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 18.35, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.69, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 99.58, "tps_std": 0.65, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 9.04, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 17.17, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 3.67, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 72.73, "tps_std": 0.53, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 9.05, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 356.79, "file_size_gib": 189.69, "name_params_b": 356.79, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__rocm7-nightlies__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": false, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": false, "error_type": null, "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__vulkan_amdvlk__longctx32768__rpc.log", "rpc": true, "build": null }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": false, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": false, "error_type": null, "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__vulkan_amdvlk__rpc.log", "rpc": true, "build": null }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": false, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__vulkan_radv__longctx32768__rpc.log", "rpc": true, "build": null }, { "model": "GLM-4.6-UD-Q4_K_XL-00001-of-00005", "model_clean": "GLM-4.6-UD-Q4_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": false, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "runtime", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "Q4_K_XL", "log": "results-rpc/GLM-4.6-UD-Q4_K_XL-00001-of-00005__vulkan_radv__rpc.log", "rpc": true, "build": null }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 58.89, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.92, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 158.25, "tps_std": 0.52, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm-7_2-hblt0", "env_base": "rocm", "env_variant": "7_2-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 19.04, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 59.95, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 5.91, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 159.79, "tps_std": 0.35, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm-7_2", "env_base": "rocm", "env_variant": "7_2", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 19.05, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm-7_2__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 64.41, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.41, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 169.3, "tps_std": 0.95, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm6_4_4-hblt0", "env_base": "rocm6_4_4", "env_variant": "hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 18.93, "tps_std": 0.01, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 65.69, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.47, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 169.5, "tps_std": 1.04, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm6_4_4", "env_base": "rocm6_4_4", "env_variant": null, "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 18.89, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm6_4_4__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 60.88, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.1, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__hblt0__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 171.03, "tps_std": 0.56, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm7-nightlies-hblt0", "env_base": "rocm7", "env_variant": "nightlies-hblt0", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 18.98, "tps_std": 0.02, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__hblt0__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "pp2048 @ d32768", "tps_mean": 60.78, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "longctx32768", "context_tokens": 32768, "test": "tg32 @ d32768", "tps_mean": 6.1, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__longctx32768__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "pp512", "tps_mean": 173.91, "tps_std": 0.29, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "rocm7-nightlies", "env_base": "rocm7", "env_variant": "nightlies", "fa": true, "context": "default", "context_tokens": null, "test": "tg128", "tps_mean": 19.05, "tps_std": 0.0, "error": false, "error_type": null, "backend": "ROCm,RPC", "ngl": 99, "mmap": null, "params_b": 228.69, "file_size_gib": 180.94, "name_params_b": 228.69, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__rocm7-nightlies__rpc.log", "rpc": true, "build": { "hash": "e0c93af2a", "number": "7938" } }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": false, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": true, "error_type": "load", "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__vulkan_amdvlk__longctx32768__rpc.log", "rpc": true, "build": null }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "vulkan_amdvlk", "env_base": "vulkan_amdvlk", "env_variant": null, "fa": false, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": false, "error_type": null, "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__vulkan_amdvlk__rpc.log", "rpc": true, "build": null }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": false, "context": "longctx32768", "context_tokens": 32768, "test": null, "tps_mean": null, "tps_std": null, "error": false, "error_type": null, "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__vulkan_radv__longctx32768__rpc.log", "rpc": true, "build": null }, { "model": "MiniMax-M2-UD-Q6_K_XL-00001-of-00004", "model_clean": "MiniMax-M2-UD-Q6_K_XL", "env": "vulkan_radv", "env_base": "vulkan_radv", "env_variant": null, "fa": false, "context": "default", "context_tokens": null, "test": null, "tps_mean": null, "tps_std": null, "error": false, "error_type": null, "backend": null, "ngl": null, "mmap": null, "params_b": null, "file_size_gib": null, "name_params_b": null, "quant": "Q6_K_XL", "log": "results-rpc/MiniMax-M2-UD-Q6_K_XL-00001-of-00004__vulkan_radv__rpc.log", "rpc": true, "build": null } ] }