10978 lines
292 KiB
JSON
10978 lines
292 KiB
JSON
{
|
|
"meta": {
|
|
"generated_at": "2026-04-15T07:08:17Z",
|
|
"system_info": {
|
|
"distro": "Fedora Linux 43 (Workstation Edition)",
|
|
"kernel": "6.19.9-200.fc43.x86_64",
|
|
"linux_firmware": "linux-firmware-20260309-1.fc43.noarch",
|
|
"timestamp": "10 Apr 2026"
|
|
},
|
|
"llamacpp_builds": [
|
|
{
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
},
|
|
{
|
|
"hash": "ff5ef8278",
|
|
"number": "8763"
|
|
}
|
|
],
|
|
"environments": [
|
|
"rocm-7_2",
|
|
"rocm-7_2_1",
|
|
"rocm6_4_4",
|
|
"rocm7-nightlies",
|
|
"vulkan_amdvlk",
|
|
"vulkan_radv"
|
|
],
|
|
"notes": "pp512 = prompt processing; tg128 = text generation; t/s = tokens/second"
|
|
},
|
|
"runs": [
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 78.36,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.67,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.08,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 78.4,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.76,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 17.57,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.09,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 78.06,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.95,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 18.34,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.06,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 123.0,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 123.0,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 46.91,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 2.99,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 7.32,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002",
|
|
"model_clean": "Devstral-2-123B-Instruct-2512-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 2.59,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 125.03,
|
|
"file_size_gib": 70.31,
|
|
"name_params_b": 125.03,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Devstral-2-123B-Instruct-2512-UD-Q4_K_XL-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 404.18,
|
|
"tps_std": 1.94,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 20.88,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 88.16,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.07,
|
|
"tps_std": 0.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm-7_2",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm-7_2__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 392.81,
|
|
"tps_std": 1.96,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.97,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 94.55,
|
|
"tps_std": 0.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 14.89,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 400.57,
|
|
"tps_std": 4.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 86.01,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 14.86,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 114.94,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 10.48,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 10.14,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.04,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 326.36,
|
|
"tps_std": 4.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 9.5,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 102.0,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-BF16-00001-of-00002",
|
|
"model_clean": "GLM-4.7-Flash-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.82,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 55.79,
|
|
"name_params_b": 29.94,
|
|
"quant": "BF16",
|
|
"log": "results/GLM-4.7-Flash-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 914.78,
|
|
"tps_std": 3.38,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 32.73,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 91.49,
|
|
"tps_std": 0.75,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 20.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 903.01,
|
|
"tps_std": 2.32,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 30.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 99.7,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.93,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 888.7,
|
|
"tps_std": 38.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 32.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 89.53,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 20.47,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 499.74,
|
|
"tps_std": 1.49,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 39.02,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": null,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 875.8,
|
|
"tps_std": 2.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 40.19,
|
|
"tps_std": 1.39,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 134.1,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"model_clean": "GLM-4.7-Flash-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 21.18,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 29.94,
|
|
"file_size_gib": 32.7,
|
|
"name_params_b": 29.94,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/GLM-4.7-Flash-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 245.94,
|
|
"tps_std": 1.48,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ff5ef8278",
|
|
"number": "8763"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 24.11,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ff5ef8278",
|
|
"number": "8763"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 66.09,
|
|
"tps_std": 0.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ff5ef8278",
|
|
"number": "8763"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.32,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "ff5ef8278",
|
|
"number": "8763"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 245.63,
|
|
"tps_std": 1.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.63,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 79.52,
|
|
"tps_std": 0.47,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.69,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 237.43,
|
|
"tps_std": 0.96,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.63,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 61.53,
|
|
"tps_std": 0.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.52,
|
|
"tps_std": 0.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 203.53,
|
|
"tps_std": 0.7,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 24.06,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 31.94,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.05,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 234.24,
|
|
"tps_std": 1.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 29.48,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 32.31,
|
|
"tps_std": 0.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004",
|
|
"model_clean": "MiniMax-M2.7-UD-Q3_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 14.2,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 228.69,
|
|
"file_size_gib": 94.93,
|
|
"name_params_b": 228.69,
|
|
"quant": "Q3_K_XL",
|
|
"log": "results/MiniMax-M2.7-UD-Q3_K_XL-00001-of-00004__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 747.81,
|
|
"tps_std": 7.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.42,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 182.77,
|
|
"tps_std": 1.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.08,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 716.84,
|
|
"tps_std": 2.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.39,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 166.12,
|
|
"tps_std": 0.76,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.05,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 726.92,
|
|
"tps_std": 2.95,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 8.43,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 162.4,
|
|
"tps_std": 0.45,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 14.0,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 14.0,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 164.2,
|
|
"tps_std": 0.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 7.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 72.41,
|
|
"tps_std": 0.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"model_clean": "Ministral-3-14B-Instruct-2512-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 13.51,
|
|
"file_size_gib": 25.16,
|
|
"name_params_b": 13.51,
|
|
"quant": "BF16",
|
|
"log": "results/Ministral-3-14B-Instruct-2512-BF16__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 264.16,
|
|
"tps_std": 1.43,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.01,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 299.29,
|
|
"tps_std": 0.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.59,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 261.51,
|
|
"tps_std": 1.5,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.63,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 323.83,
|
|
"tps_std": 0.28,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.34,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 232.54,
|
|
"tps_std": 0.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 15.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 284.15,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.34,
|
|
"tps_std": 0.61,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 138.78,
|
|
"tps_std": 0.58,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.45,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 104.96,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 13.66,
|
|
"tps_std": 0.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 191.97,
|
|
"tps_std": 8.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.7,
|
|
"tps_std": 0.35,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 185.9,
|
|
"tps_std": 0.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003",
|
|
"model_clean": "NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 14.21,
|
|
"tps_std": 0.38,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 120.67,
|
|
"file_size_gib": 78.02,
|
|
"name_params_b": 120.67,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/NVIDIA-Nemotron-3-Super-120B-A12B-UD-Q4_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1148.88,
|
|
"tps_std": 7.32,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 67.8,
|
|
"tps_std": 0.73,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 194.78,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.46,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1167.77,
|
|
"tps_std": 7.34,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 65.06,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 291.69,
|
|
"tps_std": 0.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 32.81,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1185.86,
|
|
"tps_std": 2.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 68.95,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 203.21,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 34.77,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 882.68,
|
|
"tps_std": 3.83,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 80.48,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 111.69,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 28.03,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1145.07,
|
|
"tps_std": 8.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 82.16,
|
|
"tps_std": 3.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 194.38,
|
|
"tps_std": 0.33,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"model_clean": "Qwen3-Coder-30B-A3B-Instruct-Q4_K_M",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 37.09,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.53,
|
|
"file_size_gib": 17.35,
|
|
"name_params_b": 30.53,
|
|
"quant": "Q4_K_M",
|
|
"log": "results/Qwen3-Coder-30B-A3B-Instruct-Q4_K_M__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 312.22,
|
|
"tps_std": 2.95,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.6,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 250.19,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.88,
|
|
"tps_std": 1.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 316.73,
|
|
"tps_std": 1.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 18.86,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 275.81,
|
|
"tps_std": 1.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 17.9,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 318.17,
|
|
"tps_std": 2.18,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 19.57,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 223.61,
|
|
"tps_std": 0.83,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 18.32,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 182.98,
|
|
"tps_std": 1.82,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.33,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 102.84,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 18.77,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 241.15,
|
|
"tps_std": 7.43,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.75,
|
|
"tps_std": 0.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 202.99,
|
|
"tps_std": 0.41,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003",
|
|
"model_clean": "Qwen3.5-122B-A10B-UD-Q5_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 20.09,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 122.11,
|
|
"file_size_gib": 85.6,
|
|
"name_params_b": 122.11,
|
|
"quant": "Q5_K_XL",
|
|
"log": "results/Qwen3.5-122B-A10B-UD-Q5_K_XL-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 509.12,
|
|
"tps_std": 4.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 23.63,
|
|
"tps_std": 0.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 390.8,
|
|
"tps_std": 4.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 21.61,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 545.2,
|
|
"tps_std": 3.5,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 21.99,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 354.63,
|
|
"tps_std": 1.42,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 21.65,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 512.14,
|
|
"tps_std": 2.33,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 23.77,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 383.01,
|
|
"tps_std": 0.52,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 22.11,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 122.66,
|
|
"tps_std": 0.28,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 11.56,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 97.36,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.94,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 317.93,
|
|
"tps_std": 2.34,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 10.8,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 258.29,
|
|
"tps_std": 0.54,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-BF16-00001-of-00002",
|
|
"model_clean": "Qwen3.5-35B-A3B-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.39,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 64.6,
|
|
"name_params_b": 34.66,
|
|
"quant": "BF16",
|
|
"log": "results/Qwen3.5-35B-A3B-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1098.31,
|
|
"tps_std": 7.28,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 47.89,
|
|
"tps_std": 0.32,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 681.43,
|
|
"tps_std": 0.74,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 40.19,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1080.97,
|
|
"tps_std": 5.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 45.98,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 611.53,
|
|
"tps_std": 0.52,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 40.17,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1111.77,
|
|
"tps_std": 11.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 47.94,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 669.42,
|
|
"tps_std": 1.32,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 41.96,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 663.48,
|
|
"tps_std": 2.94,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 58.17,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 289.32,
|
|
"tps_std": 1.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 44.23,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1016.96,
|
|
"tps_std": 39.65,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 59.11,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 673.76,
|
|
"tps_std": 0.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 49.03,
|
|
"tps_std": 0.14,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 20.7,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 703.33,
|
|
"tps_std": 5.75,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 29.06,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 489.36,
|
|
"tps_std": 3.31,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.31,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 698.12,
|
|
"tps_std": 4.53,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 25.88,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 615.35,
|
|
"tps_std": 3.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.34,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 697.35,
|
|
"tps_std": 3.46,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.1,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 553.41,
|
|
"tps_std": 1.44,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.57,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 415.49,
|
|
"tps_std": 2.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 30.74,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 228.9,
|
|
"tps_std": 0.28,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.62,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 710.93,
|
|
"tps_std": 18.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 28.92,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 531.15,
|
|
"tps_std": 0.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"model_clean": "Qwen3.5-35B-A3B-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 26.32,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 34.66,
|
|
"file_size_gib": 45.33,
|
|
"name_params_b": 34.66,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/Qwen3.5-35B-A3B-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 864.78,
|
|
"tps_std": 7.29,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.66,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 625.12,
|
|
"tps_std": 11.57,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.99,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 839.13,
|
|
"tps_std": 7.61,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 20.75,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 646.67,
|
|
"tps_std": 11.22,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 19.86,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 844.42,
|
|
"tps_std": 19.66,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 22.69,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 546.66,
|
|
"tps_std": 5.96,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 20.11,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 117.96,
|
|
"tps_std": 0.28,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 16.18,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 58.94,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 15.26,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 376.52,
|
|
"tps_std": 7.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 14.74,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 351.87,
|
|
"tps_std": 1.49,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-26B-A4B-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 13.71,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 47.02,
|
|
"name_params_b": 25.23,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-26B-A4B-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1298.78,
|
|
"tps_std": 7.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 46.65,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 691.44,
|
|
"tps_std": 4.5,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 36.86,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1288.38,
|
|
"tps_std": 10.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 45.58,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 721.84,
|
|
"tps_std": 10.97,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 36.17,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1219.74,
|
|
"tps_std": 15.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 46.57,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 600.42,
|
|
"tps_std": 7.55,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 36.88,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 720.78,
|
|
"tps_std": 2.94,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.21,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 100.79,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 35.41,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1213.78,
|
|
"tps_std": 7.36,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 53.04,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 638.76,
|
|
"tps_std": 1.76,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 40.93,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 15.9,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1226.22,
|
|
"tps_std": 161.95,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.27,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 667.32,
|
|
"tps_std": 5.65,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.43,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1303.32,
|
|
"tps_std": 8.77,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 38.81,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 727.92,
|
|
"tps_std": 8.62,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 32.52,
|
|
"tps_std": 0.35,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1294.4,
|
|
"tps_std": 31.54,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 41.09,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 596.78,
|
|
"tps_std": 7.98,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 33.35,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 589.2,
|
|
"tps_std": 1.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 43.18,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 97.7,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 31.82,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 944.96,
|
|
"tps_std": 19.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 43.58,
|
|
"tps_std": 1.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 579.88,
|
|
"tps_std": 0.09,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-26B-A4B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 35.52,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 25.23,
|
|
"file_size_gib": 25.94,
|
|
"name_params_b": 25.23,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-26B-A4B-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 381.31,
|
|
"tps_std": 4.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 151.84,
|
|
"tps_std": 1.65,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.17,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 360.84,
|
|
"tps_std": 1.6,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 154.86,
|
|
"tps_std": 2.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.14,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 373.84,
|
|
"tps_std": 0.93,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.41,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 139.53,
|
|
"tps_std": 1.98,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.16,
|
|
"tps_std": 0.05,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 31.0,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 31.0,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 79.53,
|
|
"tps_std": 0.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 3.5,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 60.29,
|
|
"tps_std": 0.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-BF16-00001-of-00002",
|
|
"model_clean": "gemma-4-31B-it-BF16",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 3.24,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 57.18,
|
|
"name_params_b": 30.7,
|
|
"quant": "BF16",
|
|
"log": "results/gemma-4-31B-it-BF16-00001-of-00002__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 313.26,
|
|
"tps_std": 1.19,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 10.51,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 141.61,
|
|
"tps_std": 1.71,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.11,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 309.22,
|
|
"tps_std": 0.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 10.02,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 143.91,
|
|
"tps_std": 1.64,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 7.81,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 315.72,
|
|
"tps_std": 0.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 10.51,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 130.8,
|
|
"tps_std": 1.45,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.2,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 69.12,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 10.71,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 31.0,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 244.46,
|
|
"tps_std": 0.27,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 11.02,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 124.32,
|
|
"tps_std": 1.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q4_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.78,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 17.46,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q4_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q4_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 309.13,
|
|
"tps_std": 0.94,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 6.16,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 140.72,
|
|
"tps_std": 1.33,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.26,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 303.4,
|
|
"tps_std": 0.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 6.07,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 141.37,
|
|
"tps_std": 1.98,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.18,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 319.75,
|
|
"tps_std": 0.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 6.12,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 128.0,
|
|
"tps_std": 1.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.3,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 72.26,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 6.28,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": null,
|
|
"tps_mean": null,
|
|
"tps_std": null,
|
|
"error": true,
|
|
"error_type": "runtime",
|
|
"backend": null,
|
|
"ngl": null,
|
|
"mmap": null,
|
|
"params_b": null,
|
|
"file_size_gib": null,
|
|
"name_params_b": 31.0,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": null
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 209.2,
|
|
"tps_std": 6.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 6.28,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 112.72,
|
|
"tps_std": 1.26,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"model_clean": "gemma-4-31B-it-UD-Q8_K_XL",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.49,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 30.7,
|
|
"file_size_gib": 32.6,
|
|
"name_params_b": 30.7,
|
|
"quant": "Q8_K_XL",
|
|
"log": "results/gemma-4-31B-it-UD-Q8_K_XL__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 633.0,
|
|
"tps_std": 7.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.15,
|
|
"tps_std": 0.36,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 296.45,
|
|
"tps_std": 1.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 31.19,
|
|
"tps_std": 8.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 648.77,
|
|
"tps_std": 4.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 49.76,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 439.58,
|
|
"tps_std": 0.57,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 39.77,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 641.05,
|
|
"tps_std": 2.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.73,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 305.81,
|
|
"tps_std": 0.24,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 36.03,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 575.01,
|
|
"tps_std": 3.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.2,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 214.22,
|
|
"tps_std": 0.5,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 34.54,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 635.12,
|
|
"tps_std": 4.23,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 56.31,
|
|
"tps_std": 0.08,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 290.19,
|
|
"tps_std": 1.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-120b-mxfp4-00001-of-00003",
|
|
"model_clean": "gpt-oss-120b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 42.28,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 116.83,
|
|
"file_size_gib": 59.02,
|
|
"name_params_b": 116.83,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-120b-mxfp4-00001-of-00003__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1631.41,
|
|
"tps_std": 13.3,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.63,
|
|
"tps_std": 0.1,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 489.21,
|
|
"tps_std": 2.12,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 51.87,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1694.78,
|
|
"tps_std": 17.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.19,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 730.43,
|
|
"tps_std": 1.15,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 57.22,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1635.73,
|
|
"tps_std": 10.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 72.47,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 493.84,
|
|
"tps_std": 1.85,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 52.05,
|
|
"tps_std": 0.04,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1306.44,
|
|
"tps_std": 9.57,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 73.63,
|
|
"tps_std": 0.06,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 365.33,
|
|
"tps_std": 0.21,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 49.83,
|
|
"tps_std": 0.07,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1574.45,
|
|
"tps_std": 16.63,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 79.03,
|
|
"tps_std": 0.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 545.65,
|
|
"tps_std": 0.37,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "gpt-oss-20b-mxfp4",
|
|
"model_clean": "gpt-oss-20b-mxfp4",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 60.7,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 20.91,
|
|
"file_size_gib": 11.27,
|
|
"name_params_b": 20.91,
|
|
"quant": "MXFP4",
|
|
"log": "results/gpt-oss-20b-mxfp4__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1541.76,
|
|
"tps_std": 1.17,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.64,
|
|
"tps_std": 0.16,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2_1__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 162.73,
|
|
"tps_std": 0.61,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm-7_2_1",
|
|
"env_base": "rocm",
|
|
"env_variant": "7_2_1",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.65,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm-7_2_1__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1524.35,
|
|
"tps_std": 2.98,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 50.78,
|
|
"tps_std": 0.02,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 196.44,
|
|
"tps_std": 1.93,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm6_4_4",
|
|
"env_base": "rocm6_4_4",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 6.96,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm6_4_4__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1513.21,
|
|
"tps_std": 2.79,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 51.41,
|
|
"tps_std": 0.13,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 189.28,
|
|
"tps_std": 0.4,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "rocm7-nightlies",
|
|
"env_base": "rocm7",
|
|
"env_variant": "nightlies",
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 5.62,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "ROCm",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__rocm7-nightlies__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 326.38,
|
|
"tps_std": 0.44,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 55.44,
|
|
"tps_std": 0.11,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 145.14,
|
|
"tps_std": 0.2,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_amdvlk",
|
|
"env_base": "vulkan_amdvlk",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 10.21,
|
|
"tps_std": 0.0,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_amdvlk__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "pp512",
|
|
"tps_mean": 1311.79,
|
|
"tps_std": 0.38,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "default",
|
|
"context_tokens": null,
|
|
"test": "tg128",
|
|
"tps_mean": 55.59,
|
|
"tps_std": 0.03,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "pp2048 @ d32768",
|
|
"tps_mean": 210.35,
|
|
"tps_std": 0.6,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
},
|
|
{
|
|
"model": "llama-2-7b.Q4_0",
|
|
"model_clean": "llama-2-7b.Q4_0",
|
|
"env": "vulkan_radv",
|
|
"env_base": "vulkan_radv",
|
|
"env_variant": null,
|
|
"fa": true,
|
|
"context": "longctx32768",
|
|
"context_tokens": 32768,
|
|
"test": "tg32 @ d32768",
|
|
"tps_mean": 8.53,
|
|
"tps_std": 0.01,
|
|
"error": false,
|
|
"error_type": null,
|
|
"backend": "Vulkan",
|
|
"ngl": 99,
|
|
"mmap": 0,
|
|
"params_b": 6.74,
|
|
"file_size_gib": 3.56,
|
|
"name_params_b": 6.74,
|
|
"quant": "Q4_0",
|
|
"log": "results/llama-2-7b.Q4_0__vulkan_radv__fa1__longctx32768.log",
|
|
"rpc": false,
|
|
"build": {
|
|
"hash": "3f8752b55",
|
|
"number": "8743"
|
|
}
|
|
}
|
|
]
|
|
} |